diff --git "a/wandb/run-20220307_135359-2ct09q1k/files/wandb-summary.json" "b/wandb/run-20220307_135359-2ct09q1k/files/wandb-summary.json" --- "a/wandb/run-20220307_135359-2ct09q1k/files/wandb-summary.json" +++ "b/wandb/run-20220307_135359-2ct09q1k/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 1.7532, "train/learning_rate": 2.109619952494062e-05, "train/epoch": 6.73, "train/global_step": 6000, "_runtime": 38937, "_timestamp": 1646700176, "_step": 6003, "gradients/decoder.cls.predictions.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 27.0, 4.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 7.0, 29384.0, 1023.0, 35.0, 6.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-283.75, -277.6923828125, -271.634765625, -265.5771484375, -259.51953125, -253.4619140625, -247.404296875, -241.3466796875, -235.2890625, -229.2314453125, -223.173828125, -217.1162109375, -211.05859375, -205.0009765625, -198.943359375, -192.8857421875, -186.828125, -180.7705078125, -174.712890625, -168.6552734375, -162.59765625, -156.5400390625, -150.482421875, -144.4248046875, -138.3671875, -132.3095703125, -126.251953125, -120.1943359375, -114.13671875, -108.0791015625, -102.021484375, -95.9638671875, -89.90625, -83.8486328125, -77.791015625, -71.7333984375, -65.67578125, -59.6181640625, -53.560546875, -47.5029296875, -41.4453125, -35.3876953125, -29.330078125, -23.2724609375, -17.21484375, -11.1572265625, -5.099609375, 0.9580078125, 7.015625, 13.0732421875, 19.130859375, 25.1884765625, 31.24609375, 37.3037109375, 43.361328125, 49.4189453125, 55.4765625, 61.5341796875, 67.591796875, 73.6494140625, 79.70703125, 85.7646484375, 91.822265625, 97.8798828125, 103.9375]}, "gradients/decoder.cls.predictions.transform.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 6.0, 0.0, 2.0, 4.0, 5.0, 10.0, 7.0, 15.0, 15.0, 14.0, 20.0, 14.0, 22.0, 27.0, 28.0, 30.0, 38.0, 37.0, 57.0, 39.0, 56.0, 56.0, 43.0, 44.0, 57.0, 42.0, 36.0, 33.0, 41.0, 34.0, 33.0, 32.0, 22.0, 18.0, 16.0, 20.0, 9.0, 7.0, 7.0, 7.0, 2.0, 2.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 4.0], "bins": [-99.3861312866211, -97.02130889892578, -94.65648651123047, -92.29166412353516, -89.92684173583984, -87.56201171875, -85.19718933105469, -82.83236694335938, -80.46754455566406, -78.10272216796875, -75.73789978027344, -73.37307739257812, -71.00825500488281, -68.6434326171875, -66.27861022949219, -63.913780212402344, -61.5489616394043, -59.184139251708984, -56.81931686401367, -54.454490661621094, -52.08966827392578, -49.72484588623047, -47.360023498535156, -44.995201110839844, -42.63037872314453, -40.26555633544922, -37.900733947753906, -35.535911560058594, -33.171085357666016, -30.806262969970703, -28.44144058227539, -26.076616287231445, -23.7117919921875, -21.346969604492188, -18.982145309448242, -16.61732292175293, -14.2524995803833, -11.887676239013672, -9.52285385131836, -7.158029556274414, -4.793207168579102, -2.4283840656280518, -0.06356096267700195, 2.3012619018554688, 4.666085243225098, 7.030908584594727, 9.395730972290039, 11.760555267333984, 14.125377655029297, 16.49020004272461, 18.855024337768555, 21.219846725463867, 23.584671020507812, 25.949493408203125, 28.314315795898438, 30.679140090942383, 33.04396057128906, 35.408782958984375, 37.77360534667969, 40.138427734375, 42.50325393676758, 44.86807632446289, 47.2328987121582, 49.59772491455078, 51.962547302246094]}, "gradients/decoder.cls.predictions.transform.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 5.0, 2.0, 3.0, 3.0, 4.0, 4.0, 8.0, 11.0, 13.0, 15.0, 6.0, 11.0, 19.0, 28.0, 22.0, 26.0, 29.0, 26.0, 38.0, 39.0, 33.0, 29.0, 38.0, 42.0, 37.0, 29.0, 43.0, 35.0, 46.0, 31.0, 34.0, 38.0, 36.0, 24.0, 27.0, 26.0, 21.0, 25.0, 15.0, 16.0, 12.0, 18.0, 13.0, 6.0, 6.0, 8.0, 9.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.51362228393555, -47.64765930175781, -45.781700134277344, -43.91573715209961, -42.049774169921875, -40.183815002441406, -38.31785202026367, -36.45188903808594, -34.58592987060547, -32.719966888427734, -30.854007720947266, -28.98804473876953, -27.12208366394043, -25.256122589111328, -23.390159606933594, -21.524198532104492, -19.65823745727539, -17.79227638244629, -15.926314353942871, -14.060352325439453, -12.194391250610352, -10.32843017578125, -8.462468147277832, -6.596506118774414, -4.7305450439453125, -2.8645834922790527, -0.998621940612793, 0.8673396110534668, 2.7333011627197266, 4.599262237548828, 6.465224266052246, 8.331186294555664, 10.1971435546875, 12.063104629516602, 13.92906665802002, 15.795028686523438, 17.66098976135254, 19.52695083618164, 21.392913818359375, 23.258874893188477, 25.124835968017578, 26.99079704284668, 28.85675811767578, 30.722721099853516, 32.58868408203125, 34.45464324951172, 36.32060623168945, 38.18656921386719, 40.052528381347656, 41.91849136352539, 43.78445053100586, 45.650413513183594, 47.51637268066406, 49.3823356628418, 51.24829864501953, 53.1142578125, 54.980220794677734, 56.84618377685547, 58.71214294433594, 60.57810592651367, 62.444068908691406, 64.31002807617188, 66.17598724365234, 68.04195404052734, 69.90791320800781]}, "gradients/decoder.cls.predictions.transform.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 2.0, 2.0, 4.0, 8.0, 18.0, 34.0, 37.0, 66.0, 123.0, 171.0, 322.0, 458.0, 759.0, 1244.0, 1875.0, 3155.0, 4690.0, 7238.0, 10788.0, 15990.0, 23160.0, 32884.0, 44462.0, 58545.0, 74099.0, 89667.0, 107658.0, 129804.0, 100719.0, 85855.0, 69099.0, 53624.0, 40702.0, 29076.0, 20645.0, 14196.0, 9677.0, 6168.0, 4132.0, 2774.0, 1705.0, 1064.0, 714.0, 446.0, 272.0, 155.0, 104.0, 60.0, 60.0, 24.0, 14.0, 8.0, 5.0, 2.0, 3.0, 1.0], "bins": [-200.125, -194.462890625, -188.80078125, -183.138671875, -177.4765625, -171.814453125, -166.15234375, -160.490234375, -154.828125, -149.166015625, -143.50390625, -137.841796875, -132.1796875, -126.517578125, -120.85546875, -115.193359375, -109.53125, -103.869140625, -98.20703125, -92.544921875, -86.8828125, -81.220703125, -75.55859375, -69.896484375, -64.234375, -58.572265625, -52.91015625, -47.248046875, -41.5859375, -35.923828125, -30.26171875, -24.599609375, -18.9375, -13.275390625, -7.61328125, -1.951171875, 3.7109375, 9.373046875, 15.03515625, 20.697265625, 26.359375, 32.021484375, 37.68359375, 43.345703125, 49.0078125, 54.669921875, 60.33203125, 65.994140625, 71.65625, 77.318359375, 82.98046875, 88.642578125, 94.3046875, 99.966796875, 105.62890625, 111.291015625, 116.953125, 122.615234375, 128.27734375, 133.939453125, 139.6015625, 145.263671875, 150.92578125, 156.587890625, 162.25]}, "gradients/decoder.cls.predictions.transform.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 4.0, 3.0, 5.0, 4.0, 4.0, 8.0, 13.0, 7.0, 11.0, 13.0, 19.0, 23.0, 19.0, 17.0, 33.0, 31.0, 40.0, 48.0, 35.0, 33.0, 33.0, 58.0, 49.0, 58.0, 48.0, 39.0, 42.0, 35.0, 30.0, 36.0, 31.0, 29.0, 18.0, 15.0, 20.0, 16.0, 9.0, 14.0, 10.0, 11.0, 8.0, 4.0, 6.0, 2.0, 6.0, 5.0, 1.0, 4.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-78.375, -75.9140625, -73.453125, -70.9921875, -68.53125, -66.0703125, -63.609375, -61.1484375, -58.6875, -56.2265625, -53.765625, -51.3046875, -48.84375, -46.3828125, -43.921875, -41.4609375, -39.0, -36.5390625, -34.078125, -31.6171875, -29.15625, -26.6953125, -24.234375, -21.7734375, -19.3125, -16.8515625, -14.390625, -11.9296875, -9.46875, -7.0078125, -4.546875, -2.0859375, 0.375, 2.8359375, 5.296875, 7.7578125, 10.21875, 12.6796875, 15.140625, 17.6015625, 20.0625, 22.5234375, 24.984375, 27.4453125, 29.90625, 32.3671875, 34.828125, 37.2890625, 39.75, 42.2109375, 44.671875, 47.1328125, 49.59375, 52.0546875, 54.515625, 56.9765625, 59.4375, 61.8984375, 64.359375, 66.8203125, 69.28125, 71.7421875, 74.203125, 76.6640625, 79.125]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 4.0, 6.0, 5.0, 11.0, 8.0, 12.0, 23.0, 7.0, 27.0, 23.0, 29.0, 31.0, 29.0, 36.0, 35.0, 45.0, 63.0, 40.0, 53.0, 65.0, 51.0, 62.0, 46.0, 45.0, 42.0, 34.0, 24.0, 29.0, 24.0, 12.0, 21.0, 8.0, 9.0, 14.0, 14.0, 2.0, 4.0, 5.0, 3.0, 1.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.182701110839844, -55.2156982421875, -53.248695373535156, -51.28169250488281, -49.3146858215332, -47.34768295288086, -45.380680084228516, -43.41367721557617, -41.44667053222656, -39.47966766357422, -37.512664794921875, -35.54566192626953, -33.57865524291992, -31.611652374267578, -29.644649505615234, -27.67764663696289, -25.710643768310547, -23.743640899658203, -21.776636123657227, -19.809633255004883, -17.842628479003906, -15.875625610351562, -13.908622741699219, -11.941618919372559, -9.974615097045898, -8.007611274719238, -6.040607929229736, -4.073604583740234, -2.106600761413574, -0.13959693908691406, 1.8274059295654297, 3.79440975189209, 5.76141357421875, 7.72841739654541, 9.69542121887207, 11.662424087524414, 13.629427909851074, 15.596431732177734, 17.563434600830078, 19.530437469482422, 21.4974422454834, 23.464445114135742, 25.43144989013672, 27.398452758789062, 29.365455627441406, 31.332460403442383, 33.299461364746094, 35.2664680480957, 37.23347091674805, 39.20047378540039, 41.167476654052734, 43.134483337402344, 45.10148620605469, 47.06848907470703, 49.035491943359375, 51.00249481201172, 52.96949768066406, 54.936500549316406, 56.90350341796875, 58.870506286621094, 60.8375129699707, 62.80451583862305, 64.77151489257812, 66.738525390625, 68.70552825927734]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 8.0, 9.0, 10.0, 12.0, 10.0, 8.0, 20.0, 22.0, 31.0, 30.0, 42.0, 34.0, 34.0, 44.0, 48.0, 53.0, 47.0, 52.0, 49.0, 53.0, 47.0, 49.0, 32.0, 49.0, 39.0, 27.0, 29.0, 17.0, 14.0, 20.0, 13.0, 14.0, 4.0, 6.0, 4.0, 6.0, 4.0, 6.0, 2.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.51104736328125, -48.61479568481445, -46.71854019165039, -44.822288513183594, -42.92603302001953, -41.029781341552734, -39.13352584838867, -37.237274169921875, -35.34101867675781, -33.444766998291016, -31.548511505126953, -29.652257919311523, -27.756004333496094, -25.859752655029297, -23.963497161865234, -22.067245483398438, -20.170991897583008, -18.274738311767578, -16.37848472595215, -14.482231140136719, -12.585977554321289, -10.689724922180176, -8.793471336364746, -6.897217750549316, -5.000964164733887, -3.104710578918457, -1.2084572315216064, 0.6877961158752441, 2.584049701690674, 4.480302810668945, 6.376556396484375, 8.272809982299805, 10.169063568115234, 12.065317153930664, 13.961570739746094, 15.857824325561523, 17.754077911376953, 19.65032958984375, 21.546585083007812, 23.44283676147461, 25.339092254638672, 27.2353458404541, 29.13159942626953, 31.02785301208496, 32.92410659790039, 34.82035827636719, 36.71661376953125, 38.61286544799805, 40.509117126464844, 42.40536880493164, 44.3016242980957, 46.1978759765625, 48.09413146972656, 49.99038314819336, 51.88663864135742, 53.78289031982422, 55.67914581298828, 57.57539749145508, 59.47165298461914, 61.36790466308594, 63.26416015625, 65.16041564941406, 67.0566635131836, 68.95291900634766, 70.84917449951172]}, "gradients/decoder.bert.encoder.layer.23.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 7.0, 16.0, 21.0, 31.0, 55.0, 96.0, 151.0, 266.0, 434.0, 823.0, 1445.0, 2507.0, 4580.0, 8153.0, 14302.0, 25838.0, 46285.0, 82545.0, 147778.0, 259956.0, 440787.0, 686096.0, 819643.0, 663261.0, 421897.0, 246521.0, 140552.0, 78823.0, 43523.0, 24716.0, 13808.0, 7964.0, 4551.0, 2730.0, 1641.0, 944.0, 598.0, 339.0, 190.0, 141.0, 99.0, 61.0, 37.0, 27.0, 14.0, 10.0, 10.0, 4.0, 3.0, 5.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-63.53125, -61.21728515625, -58.9033203125, -56.58935546875, -54.275390625, -51.96142578125, -49.6474609375, -47.33349609375, -45.01953125, -42.70556640625, -40.3916015625, -38.07763671875, -35.763671875, -33.44970703125, -31.1357421875, -28.82177734375, -26.5078125, -24.19384765625, -21.8798828125, -19.56591796875, -17.251953125, -14.93798828125, -12.6240234375, -10.31005859375, -7.99609375, -5.68212890625, -3.3681640625, -1.05419921875, 1.259765625, 3.57373046875, 5.8876953125, 8.20166015625, 10.515625, 12.82958984375, 15.1435546875, 17.45751953125, 19.771484375, 22.08544921875, 24.3994140625, 26.71337890625, 29.02734375, 31.34130859375, 33.6552734375, 35.96923828125, 38.283203125, 40.59716796875, 42.9111328125, 45.22509765625, 47.5390625, 49.85302734375, 52.1669921875, 54.48095703125, 56.794921875, 59.10888671875, 61.4228515625, 63.73681640625, 66.05078125, 68.36474609375, 70.6787109375, 72.99267578125, 75.306640625, 77.62060546875, 79.9345703125, 82.24853515625, 84.5625]}, "gradients/decoder.bert.encoder.layer.23.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 7.0, 5.0, 10.0, 11.0, 14.0, 14.0, 16.0, 20.0, 23.0, 34.0, 29.0, 35.0, 35.0, 46.0, 47.0, 56.0, 45.0, 55.0, 54.0, 52.0, 45.0, 39.0, 52.0, 41.0, 37.0, 46.0, 31.0, 26.0, 14.0, 13.0, 4.0, 5.0, 9.0, 9.0, 10.0, 6.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.25, -41.75048828125, -40.2509765625, -38.75146484375, -37.251953125, -35.75244140625, -34.2529296875, -32.75341796875, -31.25390625, -29.75439453125, -28.2548828125, -26.75537109375, -25.255859375, -23.75634765625, -22.2568359375, -20.75732421875, -19.2578125, -17.75830078125, -16.2587890625, -14.75927734375, -13.259765625, -11.76025390625, -10.2607421875, -8.76123046875, -7.26171875, -5.76220703125, -4.2626953125, -2.76318359375, -1.263671875, 0.23583984375, 1.7353515625, 3.23486328125, 4.734375, 6.23388671875, 7.7333984375, 9.23291015625, 10.732421875, 12.23193359375, 13.7314453125, 15.23095703125, 16.73046875, 18.22998046875, 19.7294921875, 21.22900390625, 22.728515625, 24.22802734375, 25.7275390625, 27.22705078125, 28.7265625, 30.22607421875, 31.7255859375, 33.22509765625, 34.724609375, 36.22412109375, 37.7236328125, 39.22314453125, 40.72265625, 42.22216796875, 43.7216796875, 45.22119140625, 46.720703125, 48.22021484375, 49.7197265625, 51.21923828125, 52.71875]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 5.0, 10.0, 15.0, 20.0, 16.0, 38.0, 55.0, 98.0, 122.0, 230.0, 373.0, 528.0, 886.0, 1478.0, 2510.0, 4159.0, 6782.0, 11465.0, 18907.0, 31431.0, 51690.0, 84854.0, 135485.0, 212119.0, 318071.0, 444425.0, 561446.0, 601319.0, 530337.0, 404728.0, 282335.0, 185266.0, 117450.0, 73399.0, 44503.0, 26715.0, 16139.0, 9848.0, 5877.0, 3509.0, 2110.0, 1307.0, 825.0, 513.0, 318.0, 205.0, 136.0, 79.0, 63.0, 35.0, 21.0, 12.0, 9.0, 9.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-45.875, -44.36328125, -42.8515625, -41.33984375, -39.828125, -38.31640625, -36.8046875, -35.29296875, -33.78125, -32.26953125, -30.7578125, -29.24609375, -27.734375, -26.22265625, -24.7109375, -23.19921875, -21.6875, -20.17578125, -18.6640625, -17.15234375, -15.640625, -14.12890625, -12.6171875, -11.10546875, -9.59375, -8.08203125, -6.5703125, -5.05859375, -3.546875, -2.03515625, -0.5234375, 0.98828125, 2.5, 4.01171875, 5.5234375, 7.03515625, 8.546875, 10.05859375, 11.5703125, 13.08203125, 14.59375, 16.10546875, 17.6171875, 19.12890625, 20.640625, 22.15234375, 23.6640625, 25.17578125, 26.6875, 28.19921875, 29.7109375, 31.22265625, 32.734375, 34.24609375, 35.7578125, 37.26953125, 38.78125, 40.29296875, 41.8046875, 43.31640625, 44.828125, 46.33984375, 47.8515625, 49.36328125, 50.875]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 7.0, 5.0, 1.0, 7.0, 8.0, 9.0, 17.0, 29.0, 28.0, 28.0, 32.0, 62.0, 51.0, 68.0, 92.0, 97.0, 147.0, 152.0, 175.0, 192.0, 214.0, 227.0, 226.0, 231.0, 215.0, 240.0, 202.0, 176.0, 186.0, 153.0, 154.0, 128.0, 104.0, 76.0, 68.0, 68.0, 35.0, 43.0, 30.0, 32.0, 12.0, 15.0, 10.0, 11.0, 7.0, 6.0, 2.0, 5.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-22.140625, -21.50048828125, -20.8603515625, -20.22021484375, -19.580078125, -18.93994140625, -18.2998046875, -17.65966796875, -17.01953125, -16.37939453125, -15.7392578125, -15.09912109375, -14.458984375, -13.81884765625, -13.1787109375, -12.53857421875, -11.8984375, -11.25830078125, -10.6181640625, -9.97802734375, -9.337890625, -8.69775390625, -8.0576171875, -7.41748046875, -6.77734375, -6.13720703125, -5.4970703125, -4.85693359375, -4.216796875, -3.57666015625, -2.9365234375, -2.29638671875, -1.65625, -1.01611328125, -0.3759765625, 0.26416015625, 0.904296875, 1.54443359375, 2.1845703125, 2.82470703125, 3.46484375, 4.10498046875, 4.7451171875, 5.38525390625, 6.025390625, 6.66552734375, 7.3056640625, 7.94580078125, 8.5859375, 9.22607421875, 9.8662109375, 10.50634765625, 11.146484375, 11.78662109375, 12.4267578125, 13.06689453125, 13.70703125, 14.34716796875, 14.9873046875, 15.62744140625, 16.267578125, 16.90771484375, 17.5478515625, 18.18798828125, 18.828125]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 9.0, 7.0, 8.0, 11.0, 13.0, 18.0, 13.0, 23.0, 33.0, 36.0, 39.0, 45.0, 39.0, 46.0, 61.0, 63.0, 49.0, 67.0, 58.0, 59.0, 53.0, 31.0, 36.0, 35.0, 27.0, 27.0, 29.0, 15.0, 8.0, 15.0, 11.0, 3.0, 8.0, 6.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.269248962402344, -43.37336730957031, -41.47748947143555, -39.58161163330078, -37.68572998046875, -35.78984832763672, -33.89397048950195, -31.998090744018555, -30.102210998535156, -28.206331253051758, -26.31045150756836, -24.41457176208496, -22.518692016601562, -20.622812271118164, -18.726932525634766, -16.831052780151367, -14.935173034667969, -13.03929328918457, -11.143413543701172, -9.247533798217773, -7.351654052734375, -5.455774307250977, -3.559894561767578, -1.6640148162841797, 0.23186492919921875, 2.127744674682617, 4.023624420166016, 5.919504165649414, 7.8153839111328125, 9.711263656616211, 11.60714340209961, 13.503023147583008, 15.398902893066406, 17.294782638549805, 19.190662384033203, 21.0865421295166, 22.982421875, 24.8783016204834, 26.774181365966797, 28.670061111450195, 30.565940856933594, 32.461822509765625, 34.35770034790039, 36.253578186035156, 38.14945983886719, 40.04534149169922, 41.941219329833984, 43.83709716796875, 45.73297882080078, 47.62886047363281, 49.52473831176758, 51.420616149902344, 53.316497802734375, 55.212379455566406, 57.10825729370117, 59.00413513183594, 60.90001678466797, 62.7958984375, 64.6917724609375, 66.58765411376953, 68.48353576660156, 70.3794174194336, 72.27529907226562, 74.17117309570312, 76.06705474853516]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 5.0, 11.0, 4.0, 6.0, 7.0, 10.0, 7.0, 28.0, 20.0, 22.0, 36.0, 29.0, 30.0, 29.0, 28.0, 45.0, 29.0, 45.0, 48.0, 42.0, 52.0, 45.0, 48.0, 31.0, 44.0, 36.0, 29.0, 33.0, 32.0, 32.0, 19.0, 11.0, 14.0, 25.0, 13.0, 14.0, 5.0, 6.0, 6.0, 4.0, 7.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-48.849143981933594, -47.37669372558594, -45.90424346923828, -44.431793212890625, -42.95934295654297, -41.48689651489258, -40.01444625854492, -38.541996002197266, -37.06954574584961, -35.59709548950195, -34.1246452331543, -32.65219497680664, -31.179746627807617, -29.70729637145996, -28.234848022460938, -26.76239776611328, -25.289947509765625, -23.81749725341797, -22.345046997070312, -20.87259864807129, -19.400148391723633, -17.927698135375977, -16.455249786376953, -14.982799530029297, -13.51034927368164, -12.037899017333984, -10.565449714660645, -9.093000411987305, -7.620550155639648, -6.14810037612915, -4.675650596618652, -3.2032012939453125, -1.7307472229003906, -0.2582974433898926, 1.2141523361206055, 2.6866021156311035, 4.159051895141602, 5.6315016746521, 7.103951454162598, 8.576400756835938, 10.048851013183594, 11.52130126953125, 12.99375057220459, 14.46619987487793, 15.938650131225586, 17.411100387573242, 18.883548736572266, 20.355998992919922, 21.828449249267578, 23.300899505615234, 24.77334976196289, 26.245798110961914, 27.71824836730957, 29.190698623657227, 30.66314697265625, 32.135597229003906, 33.60804748535156, 35.08049774169922, 36.552947998046875, 38.02539825439453, 39.49784851074219, 40.97029495239258, 42.442745208740234, 43.91519546508789, 45.38764572143555]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 6.0, 4.0, 13.0, 11.0, 12.0, 26.0, 43.0, 65.0, 94.0, 135.0, 195.0, 284.0, 488.0, 747.0, 1136.0, 1742.0, 2637.0, 4138.0, 6570.0, 10245.0, 16094.0, 25837.0, 41213.0, 67497.0, 108350.0, 160409.0, 184000.0, 151532.0, 99920.0, 61648.0, 38228.0, 23792.0, 15055.0, 9291.0, 6188.0, 3783.0, 2534.0, 1592.0, 988.0, 697.0, 435.0, 301.0, 179.0, 122.0, 86.0, 66.0, 37.0, 25.0, 21.0, 20.0, 11.0, 4.0, 8.0, 2.0, 2.0, 5.0, 1.0, 3.0], "bins": [-73.5625, -71.29296875, -69.0234375, -66.75390625, -64.484375, -62.21484375, -59.9453125, -57.67578125, -55.40625, -53.13671875, -50.8671875, -48.59765625, -46.328125, -44.05859375, -41.7890625, -39.51953125, -37.25, -34.98046875, -32.7109375, -30.44140625, -28.171875, -25.90234375, -23.6328125, -21.36328125, -19.09375, -16.82421875, -14.5546875, -12.28515625, -10.015625, -7.74609375, -5.4765625, -3.20703125, -0.9375, 1.33203125, 3.6015625, 5.87109375, 8.140625, 10.41015625, 12.6796875, 14.94921875, 17.21875, 19.48828125, 21.7578125, 24.02734375, 26.296875, 28.56640625, 30.8359375, 33.10546875, 35.375, 37.64453125, 39.9140625, 42.18359375, 44.453125, 46.72265625, 48.9921875, 51.26171875, 53.53125, 55.80078125, 58.0703125, 60.33984375, 62.609375, 64.87890625, 67.1484375, 69.41796875, 71.6875]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 10.0, 7.0, 11.0, 10.0, 18.0, 17.0, 13.0, 24.0, 22.0, 24.0, 21.0, 31.0, 32.0, 48.0, 39.0, 41.0, 40.0, 48.0, 39.0, 48.0, 41.0, 59.0, 49.0, 45.0, 35.0, 19.0, 36.0, 21.0, 13.0, 30.0, 15.0, 21.0, 12.0, 14.0, 10.0, 11.0, 2.0, 5.0, 1.0, 2.0, 5.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-45.03125, -43.7021484375, -42.373046875, -41.0439453125, -39.71484375, -38.3857421875, -37.056640625, -35.7275390625, -34.3984375, -33.0693359375, -31.740234375, -30.4111328125, -29.08203125, -27.7529296875, -26.423828125, -25.0947265625, -23.765625, -22.4365234375, -21.107421875, -19.7783203125, -18.44921875, -17.1201171875, -15.791015625, -14.4619140625, -13.1328125, -11.8037109375, -10.474609375, -9.1455078125, -7.81640625, -6.4873046875, -5.158203125, -3.8291015625, -2.5, -1.1708984375, 0.158203125, 1.4873046875, 2.81640625, 4.1455078125, 5.474609375, 6.8037109375, 8.1328125, 9.4619140625, 10.791015625, 12.1201171875, 13.44921875, 14.7783203125, 16.107421875, 17.4365234375, 18.765625, 20.0947265625, 21.423828125, 22.7529296875, 24.08203125, 25.4111328125, 26.740234375, 28.0693359375, 29.3984375, 30.7275390625, 32.056640625, 33.3857421875, 34.71484375, 36.0439453125, 37.373046875, 38.7021484375, 40.03125]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 3.0, 4.0, 6.0, 4.0, 8.0, 9.0, 16.0, 27.0, 54.0, 104.0, 137.0, 228.0, 388.0, 591.0, 935.0, 1518.0, 2479.0, 4358.0, 7617.0, 13965.0, 26556.0, 55552.0, 126103.0, 271043.0, 280845.0, 134387.0, 59072.0, 28550.0, 14535.0, 8128.0, 4466.0, 2630.0, 1658.0, 1002.0, 622.0, 351.0, 255.0, 125.0, 75.0, 56.0, 30.0, 22.0, 15.0, 13.0, 6.0, 3.0, 3.0, 6.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-108.125, -104.75, -101.375, -98.0, -94.625, -91.25, -87.875, -84.5, -81.125, -77.75, -74.375, -71.0, -67.625, -64.25, -60.875, -57.5, -54.125, -50.75, -47.375, -44.0, -40.625, -37.25, -33.875, -30.5, -27.125, -23.75, -20.375, -17.0, -13.625, -10.25, -6.875, -3.5, -0.125, 3.25, 6.625, 10.0, 13.375, 16.75, 20.125, 23.5, 26.875, 30.25, 33.625, 37.0, 40.375, 43.75, 47.125, 50.5, 53.875, 57.25, 60.625, 64.0, 67.375, 70.75, 74.125, 77.5, 80.875, 84.25, 87.625, 91.0, 94.375, 97.75, 101.125, 104.5, 107.875]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 2.0, 7.0, 4.0, 4.0, 7.0, 5.0, 6.0, 9.0, 10.0, 11.0, 21.0, 20.0, 23.0, 18.0, 13.0, 18.0, 19.0, 17.0, 21.0, 37.0, 29.0, 25.0, 29.0, 27.0, 26.0, 29.0, 33.0, 36.0, 33.0, 42.0, 34.0, 29.0, 26.0, 37.0, 31.0, 31.0, 27.0, 20.0, 30.0, 19.0, 19.0, 17.0, 21.0, 8.0, 14.0, 11.0, 17.0, 8.0, 6.0, 7.0, 5.0, 2.0, 4.0, 3.0, 4.0, 0.0, 3.0, 2.0, 1.0, 2.0], "bins": [-23.34375, -22.622802734375, -21.90185546875, -21.180908203125, -20.4599609375, -19.739013671875, -19.01806640625, -18.297119140625, -17.576171875, -16.855224609375, -16.13427734375, -15.413330078125, -14.6923828125, -13.971435546875, -13.25048828125, -12.529541015625, -11.80859375, -11.087646484375, -10.36669921875, -9.645751953125, -8.9248046875, -8.203857421875, -7.48291015625, -6.761962890625, -6.041015625, -5.320068359375, -4.59912109375, -3.878173828125, -3.1572265625, -2.436279296875, -1.71533203125, -0.994384765625, -0.2734375, 0.447509765625, 1.16845703125, 1.889404296875, 2.6103515625, 3.331298828125, 4.05224609375, 4.773193359375, 5.494140625, 6.215087890625, 6.93603515625, 7.656982421875, 8.3779296875, 9.098876953125, 9.81982421875, 10.540771484375, 11.26171875, 11.982666015625, 12.70361328125, 13.424560546875, 14.1455078125, 14.866455078125, 15.58740234375, 16.308349609375, 17.029296875, 17.750244140625, 18.47119140625, 19.192138671875, 19.9130859375, 20.634033203125, 21.35498046875, 22.075927734375, 22.796875]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 6.0, 22.0, 21.0, 33.0, 52.0, 66.0, 97.0, 181.0, 277.0, 482.0, 684.0, 1171.0, 2097.0, 3694.0, 6525.0, 12418.0, 24696.0, 53254.0, 125378.0, 290463.0, 292903.0, 127251.0, 53853.0, 24975.0, 12446.0, 6581.0, 3646.0, 2060.0, 1225.0, 766.0, 436.0, 294.0, 182.0, 106.0, 78.0, 56.0, 28.0, 19.0, 13.0, 10.0, 10.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-44.34375, -42.91357421875, -41.4833984375, -40.05322265625, -38.623046875, -37.19287109375, -35.7626953125, -34.33251953125, -32.90234375, -31.47216796875, -30.0419921875, -28.61181640625, -27.181640625, -25.75146484375, -24.3212890625, -22.89111328125, -21.4609375, -20.03076171875, -18.6005859375, -17.17041015625, -15.740234375, -14.31005859375, -12.8798828125, -11.44970703125, -10.01953125, -8.58935546875, -7.1591796875, -5.72900390625, -4.298828125, -2.86865234375, -1.4384765625, -0.00830078125, 1.421875, 2.85205078125, 4.2822265625, 5.71240234375, 7.142578125, 8.57275390625, 10.0029296875, 11.43310546875, 12.86328125, 14.29345703125, 15.7236328125, 17.15380859375, 18.583984375, 20.01416015625, 21.4443359375, 22.87451171875, 24.3046875, 25.73486328125, 27.1650390625, 28.59521484375, 30.025390625, 31.45556640625, 32.8857421875, 34.31591796875, 35.74609375, 37.17626953125, 38.6064453125, 40.03662109375, 41.466796875, 42.89697265625, 44.3271484375, 45.75732421875, 47.1875]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 7.0, 3.0, 7.0, 14.0, 15.0, 26.0, 44.0, 46.0, 82.0, 99.0, 142.0, 142.0, 107.0, 83.0, 64.0, 38.0, 26.0, 12.0, 10.0, 5.0, 4.0, 4.0, 6.0, 4.0, 2.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004093170166015625, -0.0038986802101135254, -0.0037041902542114258, -0.003509700298309326, -0.0033152103424072266, -0.003120720386505127, -0.0029262304306030273, -0.0027317404747009277, -0.002537250518798828, -0.0023427605628967285, -0.002148270606994629, -0.0019537806510925293, -0.0017592906951904297, -0.00156480073928833, -0.0013703107833862305, -0.0011758208274841309, -0.0009813308715820312, -0.0007868409156799316, -0.000592350959777832, -0.0003978610038757324, -0.0002033710479736328, -8.881092071533203e-06, 0.0001856088638305664, 0.000380098819732666, 0.0005745887756347656, 0.0007690787315368652, 0.0009635686874389648, 0.0011580586433410645, 0.001352548599243164, 0.0015470385551452637, 0.0017415285110473633, 0.0019360184669494629, 0.0021305084228515625, 0.002324998378753662, 0.0025194883346557617, 0.0027139782905578613, 0.002908468246459961, 0.0031029582023620605, 0.00329744815826416, 0.0034919381141662598, 0.0036864280700683594, 0.003880918025970459, 0.004075407981872559, 0.004269897937774658, 0.004464387893676758, 0.004658877849578857, 0.004853367805480957, 0.005047857761383057, 0.005242347717285156, 0.005436837673187256, 0.0056313276290893555, 0.005825817584991455, 0.006020307540893555, 0.006214797496795654, 0.006409287452697754, 0.0066037774085998535, 0.006798267364501953, 0.006992757320404053, 0.007187247276306152, 0.007381737232208252, 0.0075762271881103516, 0.007770717144012451, 0.00796520709991455, 0.00815969705581665, 0.00835418701171875]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 4.0, 3.0, 9.0, 17.0, 15.0, 35.0, 48.0, 69.0, 118.0, 151.0, 251.0, 434.0, 666.0, 1071.0, 1743.0, 3012.0, 5466.0, 9968.0, 18609.0, 36455.0, 74564.0, 147109.0, 238121.0, 230525.0, 138255.0, 68785.0, 33875.0, 17439.0, 9256.0, 5013.0, 2956.0, 1734.0, 1019.0, 610.0, 408.0, 248.0, 170.0, 107.0, 72.0, 41.0, 44.0, 16.0, 12.0, 7.0, 10.0, 7.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.84375, -46.34619140625, -44.8486328125, -43.35107421875, -41.853515625, -40.35595703125, -38.8583984375, -37.36083984375, -35.86328125, -34.36572265625, -32.8681640625, -31.37060546875, -29.873046875, -28.37548828125, -26.8779296875, -25.38037109375, -23.8828125, -22.38525390625, -20.8876953125, -19.39013671875, -17.892578125, -16.39501953125, -14.8974609375, -13.39990234375, -11.90234375, -10.40478515625, -8.9072265625, -7.40966796875, -5.912109375, -4.41455078125, -2.9169921875, -1.41943359375, 0.078125, 1.57568359375, 3.0732421875, 4.57080078125, 6.068359375, 7.56591796875, 9.0634765625, 10.56103515625, 12.05859375, 13.55615234375, 15.0537109375, 16.55126953125, 18.048828125, 19.54638671875, 21.0439453125, 22.54150390625, 24.0390625, 25.53662109375, 27.0341796875, 28.53173828125, 30.029296875, 31.52685546875, 33.0244140625, 34.52197265625, 36.01953125, 37.51708984375, 39.0146484375, 40.51220703125, 42.009765625, 43.50732421875, 45.0048828125, 46.50244140625, 48.0]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 4.0, 3.0, 6.0, 1.0, 2.0, 7.0, 6.0, 9.0, 17.0, 11.0, 23.0, 21.0, 30.0, 29.0, 52.0, 37.0, 53.0, 71.0, 62.0, 61.0, 53.0, 73.0, 57.0, 36.0, 43.0, 44.0, 31.0, 37.0, 27.0, 24.0, 19.0, 9.0, 5.0, 12.0, 6.0, 6.0, 2.0, 0.0, 2.0, 7.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.890625, -10.50146484375, -10.1123046875, -9.72314453125, -9.333984375, -8.94482421875, -8.5556640625, -8.16650390625, -7.77734375, -7.38818359375, -6.9990234375, -6.60986328125, -6.220703125, -5.83154296875, -5.4423828125, -5.05322265625, -4.6640625, -4.27490234375, -3.8857421875, -3.49658203125, -3.107421875, -2.71826171875, -2.3291015625, -1.93994140625, -1.55078125, -1.16162109375, -0.7724609375, -0.38330078125, 0.005859375, 0.39501953125, 0.7841796875, 1.17333984375, 1.5625, 1.95166015625, 2.3408203125, 2.72998046875, 3.119140625, 3.50830078125, 3.8974609375, 4.28662109375, 4.67578125, 5.06494140625, 5.4541015625, 5.84326171875, 6.232421875, 6.62158203125, 7.0107421875, 7.39990234375, 7.7890625, 8.17822265625, 8.5673828125, 8.95654296875, 9.345703125, 9.73486328125, 10.1240234375, 10.51318359375, 10.90234375, 11.29150390625, 11.6806640625, 12.06982421875, 12.458984375, 12.84814453125, 13.2373046875, 13.62646484375, 14.015625]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 4.0, 6.0, 5.0, 5.0, 11.0, 7.0, 15.0, 17.0, 22.0, 34.0, 35.0, 38.0, 50.0, 58.0, 56.0, 58.0, 63.0, 71.0, 64.0, 57.0, 45.0, 47.0, 36.0, 29.0, 36.0, 32.0, 24.0, 22.0, 17.0, 16.0, 5.0, 10.0, 6.0, 8.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.69770431518555, -36.896141052246094, -35.09457778930664, -33.29301452636719, -31.4914493560791, -29.68988609313965, -27.888320922851562, -26.08675765991211, -24.285194396972656, -22.483631134033203, -20.68206787109375, -18.880502700805664, -17.07893943786621, -15.277376174926758, -13.475811958312988, -11.674247741699219, -9.872684478759766, -8.071121215820312, -6.269556999206543, -4.467993259429932, -2.6664295196533203, -0.8648662567138672, 0.9366979598999023, 2.738262176513672, 4.539825439453125, 6.341389179229736, 8.142952919006348, 9.944517135620117, 11.74608039855957, 13.547643661499023, 15.349207878112793, 17.150772094726562, 18.95233917236328, 20.753902435302734, 22.555465698242188, 24.357030868530273, 26.158594131469727, 27.96015739440918, 29.761722564697266, 31.56328582763672, 33.36484909057617, 35.166412353515625, 36.96797561645508, 38.76953887939453, 40.57110595703125, 42.37266540527344, 44.174232482910156, 45.97579574584961, 47.77735900878906, 49.578922271728516, 51.38048553466797, 53.18204879760742, 54.983612060546875, 56.785179138183594, 58.58674240112305, 60.3883056640625, 62.18986892700195, 63.991432189941406, 65.79299926757812, 67.59455871582031, 69.39612579345703, 71.19768524169922, 72.99925231933594, 74.80081176757812, 76.60237884521484]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 1.0, 1.0, 4.0, 4.0, 5.0, 5.0, 8.0, 9.0, 7.0, 8.0, 23.0, 17.0, 24.0, 31.0, 37.0, 19.0, 33.0, 28.0, 30.0, 38.0, 41.0, 37.0, 49.0, 30.0, 51.0, 38.0, 44.0, 39.0, 48.0, 33.0, 31.0, 26.0, 23.0, 26.0, 26.0, 22.0, 19.0, 16.0, 14.0, 11.0, 12.0, 10.0, 6.0, 6.0, 3.0, 4.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-40.85141372680664, -39.61397171020508, -38.37652587890625, -37.13908386230469, -35.90163803100586, -34.6641960144043, -33.42675018310547, -32.189308166503906, -30.95186424255371, -29.714420318603516, -28.47697639465332, -27.239532470703125, -26.002090454101562, -24.764644622802734, -23.527202606201172, -22.289758682250977, -21.05231475830078, -19.814870834350586, -18.57742691040039, -17.339982986450195, -16.1025390625, -14.865096092224121, -13.627653121948242, -12.390209197998047, -11.152765274047852, -9.915321350097656, -8.677877426147461, -7.440434455871582, -6.202990531921387, -4.965546607971191, -3.7281031608581543, -2.490659713745117, -1.2532196044921875, -0.01577591896057129, 1.221667766571045, 2.459111452102661, 3.6965551376342773, 4.933999061584473, 6.17144250869751, 7.408885955810547, 8.646329879760742, 9.883773803710938, 11.121217727661133, 12.358660697937012, 13.596104621887207, 14.833548545837402, 16.07099151611328, 17.308435440063477, 18.545879364013672, 19.783323287963867, 21.020767211914062, 22.258211135864258, 23.495655059814453, 24.733097076416016, 25.97054100036621, 27.207984924316406, 28.4454288482666, 29.682872772216797, 30.920316696166992, 32.15776062011719, 33.39520263671875, 34.63264846801758, 35.87009048461914, 37.10753631591797, 38.34497833251953]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 1.0, 6.0, 11.0, 10.0, 26.0, 32.0, 63.0, 110.0, 153.0, 254.0, 421.0, 703.0, 1027.0, 1736.0, 2770.0, 4502.0, 7022.0, 11031.0, 17251.0, 25875.0, 38091.0, 53853.0, 72079.0, 92027.0, 107990.0, 116802.0, 113589.0, 100501.0, 82478.0, 62547.0, 45448.0, 31491.0, 21086.0, 13741.0, 8895.0, 5672.0, 3508.0, 2174.0, 1408.0, 799.0, 509.0, 362.0, 201.0, 124.0, 75.0, 46.0, 29.0, 13.0, 10.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.71875, -42.2490234375, -40.779296875, -39.3095703125, -37.83984375, -36.3701171875, -34.900390625, -33.4306640625, -31.9609375, -30.4912109375, -29.021484375, -27.5517578125, -26.08203125, -24.6123046875, -23.142578125, -21.6728515625, -20.203125, -18.7333984375, -17.263671875, -15.7939453125, -14.32421875, -12.8544921875, -11.384765625, -9.9150390625, -8.4453125, -6.9755859375, -5.505859375, -4.0361328125, -2.56640625, -1.0966796875, 0.373046875, 1.8427734375, 3.3125, 4.7822265625, 6.251953125, 7.7216796875, 9.19140625, 10.6611328125, 12.130859375, 13.6005859375, 15.0703125, 16.5400390625, 18.009765625, 19.4794921875, 20.94921875, 22.4189453125, 23.888671875, 25.3583984375, 26.828125, 28.2978515625, 29.767578125, 31.2373046875, 32.70703125, 34.1767578125, 35.646484375, 37.1162109375, 38.5859375, 40.0556640625, 41.525390625, 42.9951171875, 44.46484375, 45.9345703125, 47.404296875, 48.8740234375, 50.34375]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 3.0, 5.0, 6.0, 6.0, 9.0, 16.0, 11.0, 15.0, 16.0, 25.0, 22.0, 23.0, 38.0, 27.0, 35.0, 27.0, 51.0, 45.0, 37.0, 37.0, 37.0, 48.0, 38.0, 50.0, 39.0, 28.0, 38.0, 39.0, 26.0, 25.0, 27.0, 22.0, 24.0, 16.0, 11.0, 22.0, 16.0, 7.0, 9.0, 4.0, 3.0, 4.0, 4.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-39.28125, -38.08642578125, -36.8916015625, -35.69677734375, -34.501953125, -33.30712890625, -32.1123046875, -30.91748046875, -29.72265625, -28.52783203125, -27.3330078125, -26.13818359375, -24.943359375, -23.74853515625, -22.5537109375, -21.35888671875, -20.1640625, -18.96923828125, -17.7744140625, -16.57958984375, -15.384765625, -14.18994140625, -12.9951171875, -11.80029296875, -10.60546875, -9.41064453125, -8.2158203125, -7.02099609375, -5.826171875, -4.63134765625, -3.4365234375, -2.24169921875, -1.046875, 0.14794921875, 1.3427734375, 2.53759765625, 3.732421875, 4.92724609375, 6.1220703125, 7.31689453125, 8.51171875, 9.70654296875, 10.9013671875, 12.09619140625, 13.291015625, 14.48583984375, 15.6806640625, 16.87548828125, 18.0703125, 19.26513671875, 20.4599609375, 21.65478515625, 22.849609375, 24.04443359375, 25.2392578125, 26.43408203125, 27.62890625, 28.82373046875, 30.0185546875, 31.21337890625, 32.408203125, 33.60302734375, 34.7978515625, 35.99267578125, 37.1875]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 3.0, 6.0, 4.0, 13.0, 11.0, 33.0, 39.0, 70.0, 112.0, 151.0, 276.0, 439.0, 667.0, 1081.0, 1836.0, 2959.0, 4610.0, 7555.0, 12106.0, 19502.0, 30831.0, 45638.0, 64786.0, 86369.0, 107231.0, 120021.0, 122455.0, 112400.0, 92799.0, 70961.0, 50805.0, 33913.0, 22165.0, 13952.0, 8784.0, 5448.0, 3234.0, 2054.0, 1162.0, 785.0, 450.0, 281.0, 210.0, 129.0, 75.0, 59.0, 40.0, 27.0, 10.0, 9.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-54.03125, -52.35009765625, -50.6689453125, -48.98779296875, -47.306640625, -45.62548828125, -43.9443359375, -42.26318359375, -40.58203125, -38.90087890625, -37.2197265625, -35.53857421875, -33.857421875, -32.17626953125, -30.4951171875, -28.81396484375, -27.1328125, -25.45166015625, -23.7705078125, -22.08935546875, -20.408203125, -18.72705078125, -17.0458984375, -15.36474609375, -13.68359375, -12.00244140625, -10.3212890625, -8.64013671875, -6.958984375, -5.27783203125, -3.5966796875, -1.91552734375, -0.234375, 1.44677734375, 3.1279296875, 4.80908203125, 6.490234375, 8.17138671875, 9.8525390625, 11.53369140625, 13.21484375, 14.89599609375, 16.5771484375, 18.25830078125, 19.939453125, 21.62060546875, 23.3017578125, 24.98291015625, 26.6640625, 28.34521484375, 30.0263671875, 31.70751953125, 33.388671875, 35.06982421875, 36.7509765625, 38.43212890625, 40.11328125, 41.79443359375, 43.4755859375, 45.15673828125, 46.837890625, 48.51904296875, 50.2001953125, 51.88134765625, 53.5625]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 6.0, 6.0, 8.0, 14.0, 7.0, 15.0, 9.0, 13.0, 19.0, 19.0, 20.0, 18.0, 28.0, 31.0, 31.0, 26.0, 34.0, 51.0, 36.0, 33.0, 35.0, 52.0, 46.0, 43.0, 40.0, 35.0, 33.0, 31.0, 37.0, 38.0, 25.0, 24.0, 21.0, 20.0, 19.0, 13.0, 14.0, 11.0, 9.0, 8.0, 6.0, 7.0, 5.0, 4.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.953125, -23.16748046875, -22.3818359375, -21.59619140625, -20.810546875, -20.02490234375, -19.2392578125, -18.45361328125, -17.66796875, -16.88232421875, -16.0966796875, -15.31103515625, -14.525390625, -13.73974609375, -12.9541015625, -12.16845703125, -11.3828125, -10.59716796875, -9.8115234375, -9.02587890625, -8.240234375, -7.45458984375, -6.6689453125, -5.88330078125, -5.09765625, -4.31201171875, -3.5263671875, -2.74072265625, -1.955078125, -1.16943359375, -0.3837890625, 0.40185546875, 1.1875, 1.97314453125, 2.7587890625, 3.54443359375, 4.330078125, 5.11572265625, 5.9013671875, 6.68701171875, 7.47265625, 8.25830078125, 9.0439453125, 9.82958984375, 10.615234375, 11.40087890625, 12.1865234375, 12.97216796875, 13.7578125, 14.54345703125, 15.3291015625, 16.11474609375, 16.900390625, 17.68603515625, 18.4716796875, 19.25732421875, 20.04296875, 20.82861328125, 21.6142578125, 22.39990234375, 23.185546875, 23.97119140625, 24.7568359375, 25.54248046875, 26.328125]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 5.0, 7.0, 11.0, 14.0, 21.0, 31.0, 46.0, 63.0, 105.0, 138.0, 212.0, 331.0, 442.0, 771.0, 1236.0, 2005.0, 3479.0, 6055.0, 10903.0, 20275.0, 38354.0, 71274.0, 125981.0, 185665.0, 203829.0, 160687.0, 98838.0, 53955.0, 28405.0, 15353.0, 8314.0, 4698.0, 2628.0, 1634.0, 986.0, 626.0, 395.0, 253.0, 177.0, 121.0, 75.0, 54.0, 37.0, 26.0, 22.0, 11.0, 10.0, 0.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.5, -21.780517578125, -21.06103515625, -20.341552734375, -19.6220703125, -18.902587890625, -18.18310546875, -17.463623046875, -16.744140625, -16.024658203125, -15.30517578125, -14.585693359375, -13.8662109375, -13.146728515625, -12.42724609375, -11.707763671875, -10.98828125, -10.268798828125, -9.54931640625, -8.829833984375, -8.1103515625, -7.390869140625, -6.67138671875, -5.951904296875, -5.232421875, -4.512939453125, -3.79345703125, -3.073974609375, -2.3544921875, -1.635009765625, -0.91552734375, -0.196044921875, 0.5234375, 1.242919921875, 1.96240234375, 2.681884765625, 3.4013671875, 4.120849609375, 4.84033203125, 5.559814453125, 6.279296875, 6.998779296875, 7.71826171875, 8.437744140625, 9.1572265625, 9.876708984375, 10.59619140625, 11.315673828125, 12.03515625, 12.754638671875, 13.47412109375, 14.193603515625, 14.9130859375, 15.632568359375, 16.35205078125, 17.071533203125, 17.791015625, 18.510498046875, 19.22998046875, 19.949462890625, 20.6689453125, 21.388427734375, 22.10791015625, 22.827392578125, 23.546875]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 0.0, 6.0, 4.0, 8.0, 5.0, 11.0, 8.0, 11.0, 18.0, 17.0, 15.0, 27.0, 29.0, 30.0, 38.0, 66.0, 47.0, 55.0, 64.0, 70.0, 67.0, 55.0, 43.0, 42.0, 40.0, 37.0, 34.0, 30.0, 28.0, 18.0, 13.0, 13.0, 12.0, 9.0, 8.0, 5.0, 4.0, 3.0, 7.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.0020751953125, -0.002010852098464966, -0.0019465088844299316, -0.0018821656703948975, -0.0018178224563598633, -0.001753479242324829, -0.001689136028289795, -0.0016247928142547607, -0.0015604496002197266, -0.0014961063861846924, -0.0014317631721496582, -0.001367419958114624, -0.0013030767440795898, -0.0012387335300445557, -0.0011743903160095215, -0.0011100471019744873, -0.0010457038879394531, -0.000981360673904419, -0.0009170174598693848, -0.0008526742458343506, -0.0007883310317993164, -0.0007239878177642822, -0.000659644603729248, -0.0005953013896942139, -0.0005309581756591797, -0.0004666149616241455, -0.00040227174758911133, -0.00033792853355407715, -0.00027358531951904297, -0.0002092421054840088, -0.0001448988914489746, -8.055567741394043e-05, -1.621246337890625e-05, 4.813075065612793e-05, 0.00011247396469116211, 0.0001768171787261963, 0.00024116039276123047, 0.00030550360679626465, 0.00036984682083129883, 0.000434190034866333, 0.0004985332489013672, 0.0005628764629364014, 0.0006272196769714355, 0.0006915628910064697, 0.0007559061050415039, 0.0008202493190765381, 0.0008845925331115723, 0.0009489357471466064, 0.0010132789611816406, 0.0010776221752166748, 0.001141965389251709, 0.0012063086032867432, 0.0012706518173217773, 0.0013349950313568115, 0.0013993382453918457, 0.0014636814594268799, 0.001528024673461914, 0.0015923678874969482, 0.0016567111015319824, 0.0017210543155670166, 0.0017853975296020508, 0.001849740743637085, 0.0019140839576721191, 0.0019784271717071533, 0.0020427703857421875]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 6.0, 2.0, 10.0, 15.0, 23.0, 28.0, 35.0, 50.0, 87.0, 112.0, 169.0, 274.0, 427.0, 722.0, 1253.0, 2121.0, 3827.0, 7307.0, 15171.0, 32942.0, 71392.0, 146080.0, 230943.0, 236857.0, 153859.0, 76115.0, 35063.0, 16371.0, 7906.0, 3912.0, 2123.0, 1273.0, 749.0, 457.0, 297.0, 196.0, 119.0, 88.0, 60.0, 36.0, 25.0, 13.0, 21.0, 7.0, 8.0, 4.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-27.875, -27.05615234375, -26.2373046875, -25.41845703125, -24.599609375, -23.78076171875, -22.9619140625, -22.14306640625, -21.32421875, -20.50537109375, -19.6865234375, -18.86767578125, -18.048828125, -17.22998046875, -16.4111328125, -15.59228515625, -14.7734375, -13.95458984375, -13.1357421875, -12.31689453125, -11.498046875, -10.67919921875, -9.8603515625, -9.04150390625, -8.22265625, -7.40380859375, -6.5849609375, -5.76611328125, -4.947265625, -4.12841796875, -3.3095703125, -2.49072265625, -1.671875, -0.85302734375, -0.0341796875, 0.78466796875, 1.603515625, 2.42236328125, 3.2412109375, 4.06005859375, 4.87890625, 5.69775390625, 6.5166015625, 7.33544921875, 8.154296875, 8.97314453125, 9.7919921875, 10.61083984375, 11.4296875, 12.24853515625, 13.0673828125, 13.88623046875, 14.705078125, 15.52392578125, 16.3427734375, 17.16162109375, 17.98046875, 18.79931640625, 19.6181640625, 20.43701171875, 21.255859375, 22.07470703125, 22.8935546875, 23.71240234375, 24.53125]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 6.0, 1.0, 7.0, 8.0, 9.0, 4.0, 8.0, 9.0, 12.0, 28.0, 8.0, 39.0, 27.0, 41.0, 41.0, 51.0, 40.0, 62.0, 53.0, 55.0, 54.0, 63.0, 40.0, 55.0, 41.0, 42.0, 42.0, 36.0, 20.0, 20.0, 20.0, 14.0, 14.0, 5.0, 5.0, 5.0, 5.0, 5.0, 5.0, 1.0, 6.0, 4.0], "bins": [-8.8203125, -8.60888671875, -8.3974609375, -8.18603515625, -7.974609375, -7.76318359375, -7.5517578125, -7.34033203125, -7.12890625, -6.91748046875, -6.7060546875, -6.49462890625, -6.283203125, -6.07177734375, -5.8603515625, -5.64892578125, -5.4375, -5.22607421875, -5.0146484375, -4.80322265625, -4.591796875, -4.38037109375, -4.1689453125, -3.95751953125, -3.74609375, -3.53466796875, -3.3232421875, -3.11181640625, -2.900390625, -2.68896484375, -2.4775390625, -2.26611328125, -2.0546875, -1.84326171875, -1.6318359375, -1.42041015625, -1.208984375, -0.99755859375, -0.7861328125, -0.57470703125, -0.36328125, -0.15185546875, 0.0595703125, 0.27099609375, 0.482421875, 0.69384765625, 0.9052734375, 1.11669921875, 1.328125, 1.53955078125, 1.7509765625, 1.96240234375, 2.173828125, 2.38525390625, 2.5966796875, 2.80810546875, 3.01953125, 3.23095703125, 3.4423828125, 3.65380859375, 3.865234375, 4.07666015625, 4.2880859375, 4.49951171875, 4.7109375]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 3.0, 5.0, 7.0, 11.0, 9.0, 15.0, 17.0, 25.0, 19.0, 28.0, 22.0, 51.0, 38.0, 45.0, 51.0, 56.0, 50.0, 63.0, 54.0, 44.0, 48.0, 55.0, 36.0, 38.0, 27.0, 31.0, 24.0, 29.0, 21.0, 13.0, 20.0, 9.0, 10.0, 4.0, 10.0, 4.0, 6.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.2425422668457, -38.69725799560547, -37.151973724365234, -35.606689453125, -34.061405181884766, -32.51612091064453, -30.970836639404297, -29.425552368164062, -27.880268096923828, -26.334983825683594, -24.78969955444336, -23.244415283203125, -21.69913101196289, -20.153846740722656, -18.608562469482422, -17.063278198242188, -15.517993927001953, -13.972709655761719, -12.427425384521484, -10.88214111328125, -9.336856842041016, -7.791572570800781, -6.246288299560547, -4.7010040283203125, -3.155719757080078, -1.6104354858398438, -0.06515121459960938, 1.480133056640625, 3.0254173278808594, 4.570701599121094, 6.115985870361328, 7.6612701416015625, 9.206554412841797, 10.751838684082031, 12.297122955322266, 13.8424072265625, 15.387691497802734, 16.93297576904297, 18.478260040283203, 20.023544311523438, 21.568828582763672, 23.114112854003906, 24.65939712524414, 26.204681396484375, 27.74996566772461, 29.295249938964844, 30.840534210205078, 32.38581848144531, 33.93110275268555, 35.47638702392578, 37.021671295166016, 38.56695556640625, 40.112239837646484, 41.65752410888672, 43.20280838012695, 44.74809265136719, 46.29337692260742, 47.838661193847656, 49.38394546508789, 50.929229736328125, 52.47451400756836, 54.019798278808594, 55.56508255004883, 57.11036682128906, 58.6556510925293]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 3.0, 4.0, 6.0, 4.0, 5.0, 11.0, 10.0, 9.0, 23.0, 24.0, 23.0, 22.0, 16.0, 33.0, 18.0, 26.0, 29.0, 40.0, 33.0, 41.0, 30.0, 44.0, 39.0, 38.0, 35.0, 34.0, 42.0, 27.0, 40.0, 28.0, 29.0, 19.0, 31.0, 23.0, 24.0, 26.0, 19.0, 18.0, 12.0, 15.0, 7.0, 12.0, 6.0, 4.0, 5.0, 7.0, 5.0, 1.0, 2.0, 3.0, 2.0, 4.0, 2.0], "bins": [-39.16324996948242, -38.02390670776367, -36.88456344604492, -35.74522018432617, -34.60587692260742, -33.46653366088867, -32.32719039916992, -31.187849044799805, -30.048505783081055, -28.909162521362305, -27.769819259643555, -26.630475997924805, -25.491134643554688, -24.351791381835938, -23.212448120117188, -22.073104858398438, -20.933761596679688, -19.794418334960938, -18.655075073242188, -17.515731811523438, -16.376388549804688, -15.237046241760254, -14.09770393371582, -12.95836067199707, -11.81901741027832, -10.67967414855957, -9.54033088684082, -8.400988578796387, -7.261645317077637, -6.122302055358887, -4.982959270477295, -3.843616485595703, -2.7042770385742188, -1.5649340152740479, -0.42559099197387695, 0.713752031326294, 1.8530950546264648, 2.992438316345215, 4.131781101226807, 5.271123886108398, 6.410467147827148, 7.549810409545898, 8.689153671264648, 9.828495979309082, 10.967839241027832, 12.107182502746582, 13.246524810791016, 14.385868072509766, 15.525211334228516, 16.664554595947266, 17.803897857666016, 18.943241119384766, 20.082584381103516, 21.221927642822266, 22.361268997192383, 23.500612258911133, 24.639955520629883, 25.779298782348633, 26.918642044067383, 28.057985305786133, 29.19732666015625, 30.336669921875, 31.47601318359375, 32.6153564453125, 33.75469970703125]}, "gradients/decoder.bert.encoder.layer.22.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 4.0, 10.0, 8.0, 17.0, 18.0, 29.0, 29.0, 49.0, 95.0, 154.0, 233.0, 369.0, 522.0, 937.0, 1538.0, 2374.0, 4017.0, 6590.0, 10693.0, 18018.0, 29717.0, 49750.0, 82474.0, 138150.0, 229933.0, 376963.0, 584537.0, 743443.0, 683460.0, 476570.0, 297640.0, 179686.0, 108872.0, 65449.0, 39826.0, 24227.0, 14580.0, 8886.0, 5424.0, 3373.0, 2175.0, 1286.0, 785.0, 517.0, 337.0, 182.0, 112.0, 92.0, 54.0, 29.0, 21.0, 15.0, 11.0, 7.0, 4.0, 1.0], "bins": [-53.125, -51.6396484375, -50.154296875, -48.6689453125, -47.18359375, -45.6982421875, -44.212890625, -42.7275390625, -41.2421875, -39.7568359375, -38.271484375, -36.7861328125, -35.30078125, -33.8154296875, -32.330078125, -30.8447265625, -29.359375, -27.8740234375, -26.388671875, -24.9033203125, -23.41796875, -21.9326171875, -20.447265625, -18.9619140625, -17.4765625, -15.9912109375, -14.505859375, -13.0205078125, -11.53515625, -10.0498046875, -8.564453125, -7.0791015625, -5.59375, -4.1083984375, -2.623046875, -1.1376953125, 0.34765625, 1.8330078125, 3.318359375, 4.8037109375, 6.2890625, 7.7744140625, 9.259765625, 10.7451171875, 12.23046875, 13.7158203125, 15.201171875, 16.6865234375, 18.171875, 19.6572265625, 21.142578125, 22.6279296875, 24.11328125, 25.5986328125, 27.083984375, 28.5693359375, 30.0546875, 31.5400390625, 33.025390625, 34.5107421875, 35.99609375, 37.4814453125, 38.966796875, 40.4521484375, 41.9375]}, "gradients/decoder.bert.encoder.layer.22.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 3.0, 1.0, 5.0, 4.0, 4.0, 4.0, 8.0, 16.0, 10.0, 8.0, 15.0, 17.0, 17.0, 33.0, 33.0, 31.0, 28.0, 34.0, 40.0, 32.0, 37.0, 29.0, 45.0, 41.0, 38.0, 35.0, 49.0, 55.0, 35.0, 31.0, 27.0, 26.0, 35.0, 24.0, 14.0, 22.0, 17.0, 20.0, 21.0, 14.0, 10.0, 8.0, 4.0, 8.0, 9.0, 6.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.671875, -23.80029296875, -22.9287109375, -22.05712890625, -21.185546875, -20.31396484375, -19.4423828125, -18.57080078125, -17.69921875, -16.82763671875, -15.9560546875, -15.08447265625, -14.212890625, -13.34130859375, -12.4697265625, -11.59814453125, -10.7265625, -9.85498046875, -8.9833984375, -8.11181640625, -7.240234375, -6.36865234375, -5.4970703125, -4.62548828125, -3.75390625, -2.88232421875, -2.0107421875, -1.13916015625, -0.267578125, 0.60400390625, 1.4755859375, 2.34716796875, 3.21875, 4.09033203125, 4.9619140625, 5.83349609375, 6.705078125, 7.57666015625, 8.4482421875, 9.31982421875, 10.19140625, 11.06298828125, 11.9345703125, 12.80615234375, 13.677734375, 14.54931640625, 15.4208984375, 16.29248046875, 17.1640625, 18.03564453125, 18.9072265625, 19.77880859375, 20.650390625, 21.52197265625, 22.3935546875, 23.26513671875, 24.13671875, 25.00830078125, 25.8798828125, 26.75146484375, 27.623046875, 28.49462890625, 29.3662109375, 30.23779296875, 31.109375]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 5.0, 2.0, 8.0, 9.0, 11.0, 22.0, 31.0, 49.0, 75.0, 120.0, 191.0, 291.0, 554.0, 794.0, 1246.0, 2182.0, 3563.0, 6066.0, 10119.0, 17313.0, 29372.0, 49018.0, 81839.0, 134211.0, 215313.0, 330361.0, 471421.0, 596000.0, 625062.0, 534853.0, 393463.0, 264514.0, 168139.0, 102836.0, 63005.0, 37220.0, 22253.0, 12952.0, 7832.0, 4569.0, 2877.0, 1749.0, 1051.0, 658.0, 401.0, 233.0, 165.0, 97.0, 64.0, 33.0, 30.0, 17.0, 10.0, 12.0, 7.0, 5.0, 2.0, 1.0, 2.0, 1.0], "bins": [-38.84375, -37.638671875, -36.43359375, -35.228515625, -34.0234375, -32.818359375, -31.61328125, -30.408203125, -29.203125, -27.998046875, -26.79296875, -25.587890625, -24.3828125, -23.177734375, -21.97265625, -20.767578125, -19.5625, -18.357421875, -17.15234375, -15.947265625, -14.7421875, -13.537109375, -12.33203125, -11.126953125, -9.921875, -8.716796875, -7.51171875, -6.306640625, -5.1015625, -3.896484375, -2.69140625, -1.486328125, -0.28125, 0.923828125, 2.12890625, 3.333984375, 4.5390625, 5.744140625, 6.94921875, 8.154296875, 9.359375, 10.564453125, 11.76953125, 12.974609375, 14.1796875, 15.384765625, 16.58984375, 17.794921875, 19.0, 20.205078125, 21.41015625, 22.615234375, 23.8203125, 25.025390625, 26.23046875, 27.435546875, 28.640625, 29.845703125, 31.05078125, 32.255859375, 33.4609375, 34.666015625, 35.87109375, 37.076171875, 38.28125]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 4.0, 5.0, 3.0, 6.0, 8.0, 9.0, 12.0, 25.0, 33.0, 33.0, 38.0, 46.0, 70.0, 91.0, 87.0, 98.0, 129.0, 146.0, 169.0, 198.0, 187.0, 193.0, 240.0, 220.0, 224.0, 214.0, 220.0, 181.0, 183.0, 165.0, 140.0, 132.0, 120.0, 92.0, 87.0, 62.0, 48.0, 34.0, 27.0, 21.0, 14.0, 12.0, 20.0, 10.0, 11.0, 4.0, 6.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.5, -15.0159912109375, -14.531982421875, -14.0479736328125, -13.56396484375, -13.0799560546875, -12.595947265625, -12.1119384765625, -11.6279296875, -11.1439208984375, -10.659912109375, -10.1759033203125, -9.69189453125, -9.2078857421875, -8.723876953125, -8.2398681640625, -7.755859375, -7.2718505859375, -6.787841796875, -6.3038330078125, -5.81982421875, -5.3358154296875, -4.851806640625, -4.3677978515625, -3.8837890625, -3.3997802734375, -2.915771484375, -2.4317626953125, -1.94775390625, -1.4637451171875, -0.979736328125, -0.4957275390625, -0.01171875, 0.4722900390625, 0.956298828125, 1.4403076171875, 1.92431640625, 2.4083251953125, 2.892333984375, 3.3763427734375, 3.8603515625, 4.3443603515625, 4.828369140625, 5.3123779296875, 5.79638671875, 6.2803955078125, 6.764404296875, 7.2484130859375, 7.732421875, 8.2164306640625, 8.700439453125, 9.1844482421875, 9.66845703125, 10.1524658203125, 10.636474609375, 11.1204833984375, 11.6044921875, 12.0885009765625, 12.572509765625, 13.0565185546875, 13.54052734375, 14.0245361328125, 14.508544921875, 14.9925537109375, 15.4765625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 4.0, 5.0, 3.0, 4.0, 6.0, 6.0, 7.0, 12.0, 16.0, 15.0, 18.0, 29.0, 37.0, 28.0, 36.0, 49.0, 47.0, 62.0, 44.0, 61.0, 50.0, 45.0, 54.0, 56.0, 44.0, 36.0, 36.0, 32.0, 36.0, 31.0, 18.0, 11.0, 11.0, 14.0, 9.0, 11.0, 5.0, 2.0, 1.0, 5.0, 5.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-44.19761657714844, -42.84590148925781, -41.49419021606445, -40.14247512817383, -38.79076385498047, -37.439048767089844, -36.08733367919922, -34.735618591308594, -33.383907318115234, -32.03219223022461, -30.68048095703125, -29.328765869140625, -27.977052688598633, -26.62533950805664, -25.273624420166016, -23.921911239624023, -22.57019805908203, -21.21848487854004, -19.866771697998047, -18.515056610107422, -17.16334342956543, -15.811630249023438, -14.459916114807129, -13.10820198059082, -11.756488800048828, -10.404775619506836, -9.053061485290527, -7.701347827911377, -6.349634170532227, -4.997920513153076, -3.646206855773926, -2.294492721557617, -0.9427833557128906, 0.40893030166625977, 1.7606439590454102, 3.1123576164245605, 4.464071273803711, 5.815784931182861, 7.167498588562012, 8.51921272277832, 9.870925903320312, 11.222639083862305, 12.574353218078613, 13.926067352294922, 15.277780532836914, 16.629493713378906, 17.98120880126953, 19.332921981811523, 20.684635162353516, 22.036348342895508, 23.3880615234375, 24.739776611328125, 26.091489791870117, 27.44320297241211, 28.794918060302734, 30.146631240844727, 31.49834442138672, 32.850059509277344, 34.2017707824707, 35.55348587036133, 36.90519714355469, 38.25691223144531, 39.60862731933594, 40.96034240722656, 42.31205368041992]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 0.0, 1.0, 3.0, 2.0, 5.0, 13.0, 11.0, 8.0, 6.0, 18.0, 10.0, 16.0, 20.0, 28.0, 21.0, 23.0, 22.0, 31.0, 38.0, 38.0, 42.0, 23.0, 41.0, 47.0, 40.0, 33.0, 39.0, 36.0, 38.0, 48.0, 34.0, 27.0, 33.0, 25.0, 27.0, 22.0, 25.0, 20.0, 25.0, 9.0, 11.0, 6.0, 9.0, 10.0, 10.0, 5.0, 2.0, 3.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-35.25787353515625, -34.21341323852539, -33.16895294189453, -32.12449264526367, -31.080034255981445, -30.035573959350586, -28.99111557006836, -27.9466552734375, -26.90219497680664, -25.85773468017578, -24.813274383544922, -23.768815994262695, -22.724355697631836, -21.679895401000977, -20.63543701171875, -19.59097671508789, -18.54651641845703, -17.502056121826172, -16.457595825195312, -15.413137435913086, -14.368677139282227, -13.324216842651367, -12.279757499694824, -11.235298156738281, -10.190837860107422, -9.146377563476562, -8.10191822052002, -7.057458400726318, -6.012998580932617, -4.968538761138916, -3.924078941345215, -2.8796191215515137, -1.8351593017578125, -0.7906994819641113, 0.25376033782958984, 1.298220157623291, 2.342679977416992, 3.3871397972106934, 4.4315996170043945, 5.476059436798096, 6.520519256591797, 7.564979076385498, 8.6094388961792, 9.653898239135742, 10.698358535766602, 11.742818832397461, 12.787278175354004, 13.831737518310547, 14.876197814941406, 15.920658111572266, 16.965118408203125, 18.00957679748535, 19.05403709411621, 20.09849739074707, 21.142955780029297, 22.187416076660156, 23.231876373291016, 24.276336669921875, 25.320796966552734, 26.36525535583496, 27.40971565246582, 28.45417594909668, 29.498634338378906, 30.543094635009766, 31.587554931640625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 4.0, 5.0, 14.0, 13.0, 30.0, 52.0, 68.0, 85.0, 143.0, 238.0, 355.0, 466.0, 785.0, 1150.0, 1768.0, 2655.0, 4059.0, 6180.0, 9615.0, 14611.0, 22241.0, 33387.0, 49401.0, 70292.0, 95107.0, 118437.0, 130538.0, 125372.0, 105755.0, 80689.0, 57347.0, 39870.0, 26658.0, 17447.0, 11528.0, 7599.0, 5095.0, 3307.0, 2118.0, 1374.0, 943.0, 581.0, 393.0, 267.0, 180.0, 116.0, 71.0, 59.0, 36.0, 23.0, 15.0, 8.0, 7.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-62.59375, -60.55615234375, -58.5185546875, -56.48095703125, -54.443359375, -52.40576171875, -50.3681640625, -48.33056640625, -46.29296875, -44.25537109375, -42.2177734375, -40.18017578125, -38.142578125, -36.10498046875, -34.0673828125, -32.02978515625, -29.9921875, -27.95458984375, -25.9169921875, -23.87939453125, -21.841796875, -19.80419921875, -17.7666015625, -15.72900390625, -13.69140625, -11.65380859375, -9.6162109375, -7.57861328125, -5.541015625, -3.50341796875, -1.4658203125, 0.57177734375, 2.609375, 4.64697265625, 6.6845703125, 8.72216796875, 10.759765625, 12.79736328125, 14.8349609375, 16.87255859375, 18.91015625, 20.94775390625, 22.9853515625, 25.02294921875, 27.060546875, 29.09814453125, 31.1357421875, 33.17333984375, 35.2109375, 37.24853515625, 39.2861328125, 41.32373046875, 43.361328125, 45.39892578125, 47.4365234375, 49.47412109375, 51.51171875, 53.54931640625, 55.5869140625, 57.62451171875, 59.662109375, 61.69970703125, 63.7373046875, 65.77490234375, 67.8125]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 7.0, 3.0, 1.0, 5.0, 13.0, 5.0, 5.0, 13.0, 12.0, 12.0, 22.0, 13.0, 22.0, 18.0, 17.0, 20.0, 28.0, 28.0, 28.0, 50.0, 37.0, 27.0, 36.0, 44.0, 41.0, 34.0, 36.0, 42.0, 27.0, 34.0, 43.0, 37.0, 28.0, 25.0, 27.0, 27.0, 28.0, 14.0, 14.0, 14.0, 11.0, 14.0, 9.0, 6.0, 7.0, 8.0, 5.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.015625, -23.2421875, -22.46875, -21.6953125, -20.921875, -20.1484375, -19.375, -18.6015625, -17.828125, -17.0546875, -16.28125, -15.5078125, -14.734375, -13.9609375, -13.1875, -12.4140625, -11.640625, -10.8671875, -10.09375, -9.3203125, -8.546875, -7.7734375, -7.0, -6.2265625, -5.453125, -4.6796875, -3.90625, -3.1328125, -2.359375, -1.5859375, -0.8125, -0.0390625, 0.734375, 1.5078125, 2.28125, 3.0546875, 3.828125, 4.6015625, 5.375, 6.1484375, 6.921875, 7.6953125, 8.46875, 9.2421875, 10.015625, 10.7890625, 11.5625, 12.3359375, 13.109375, 13.8828125, 14.65625, 15.4296875, 16.203125, 16.9765625, 17.75, 18.5234375, 19.296875, 20.0703125, 20.84375, 21.6171875, 22.390625, 23.1640625, 23.9375, 24.7109375, 25.484375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 9.0, 1.0, 4.0, 6.0, 15.0, 10.0, 29.0, 36.0, 51.0, 85.0, 101.0, 129.0, 197.0, 265.0, 448.0, 562.0, 856.0, 1235.0, 1790.0, 2504.0, 3836.0, 5453.0, 8406.0, 13010.0, 20724.0, 33507.0, 55878.0, 92689.0, 149256.0, 200862.0, 170976.0, 109864.0, 66409.0, 39760.0, 24399.0, 15124.0, 9876.0, 6473.0, 4339.0, 2925.0, 1989.0, 1376.0, 982.0, 640.0, 449.0, 309.0, 209.0, 155.0, 117.0, 70.0, 54.0, 34.0, 26.0, 14.0, 16.0, 9.0, 4.0, 4.0, 9.0, 1.0, 3.0], "bins": [-77.625, -75.2490234375, -72.873046875, -70.4970703125, -68.12109375, -65.7451171875, -63.369140625, -60.9931640625, -58.6171875, -56.2412109375, -53.865234375, -51.4892578125, -49.11328125, -46.7373046875, -44.361328125, -41.9853515625, -39.609375, -37.2333984375, -34.857421875, -32.4814453125, -30.10546875, -27.7294921875, -25.353515625, -22.9775390625, -20.6015625, -18.2255859375, -15.849609375, -13.4736328125, -11.09765625, -8.7216796875, -6.345703125, -3.9697265625, -1.59375, 0.7822265625, 3.158203125, 5.5341796875, 7.91015625, 10.2861328125, 12.662109375, 15.0380859375, 17.4140625, 19.7900390625, 22.166015625, 24.5419921875, 26.91796875, 29.2939453125, 31.669921875, 34.0458984375, 36.421875, 38.7978515625, 41.173828125, 43.5498046875, 45.92578125, 48.3017578125, 50.677734375, 53.0537109375, 55.4296875, 57.8056640625, 60.181640625, 62.5576171875, 64.93359375, 67.3095703125, 69.685546875, 72.0615234375, 74.4375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 2.0, 3.0, 5.0, 3.0, 9.0, 17.0, 12.0, 10.0, 12.0, 22.0, 21.0, 13.0, 33.0, 33.0, 36.0, 32.0, 25.0, 27.0, 34.0, 32.0, 46.0, 43.0, 34.0, 37.0, 41.0, 28.0, 31.0, 34.0, 39.0, 38.0, 26.0, 25.0, 24.0, 32.0, 24.0, 19.0, 18.0, 16.0, 12.0, 10.0, 11.0, 7.0, 3.0, 8.0, 2.0, 8.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-19.015625, -18.380859375, -17.74609375, -17.111328125, -16.4765625, -15.841796875, -15.20703125, -14.572265625, -13.9375, -13.302734375, -12.66796875, -12.033203125, -11.3984375, -10.763671875, -10.12890625, -9.494140625, -8.859375, -8.224609375, -7.58984375, -6.955078125, -6.3203125, -5.685546875, -5.05078125, -4.416015625, -3.78125, -3.146484375, -2.51171875, -1.876953125, -1.2421875, -0.607421875, 0.02734375, 0.662109375, 1.296875, 1.931640625, 2.56640625, 3.201171875, 3.8359375, 4.470703125, 5.10546875, 5.740234375, 6.375, 7.009765625, 7.64453125, 8.279296875, 8.9140625, 9.548828125, 10.18359375, 10.818359375, 11.453125, 12.087890625, 12.72265625, 13.357421875, 13.9921875, 14.626953125, 15.26171875, 15.896484375, 16.53125, 17.166015625, 17.80078125, 18.435546875, 19.0703125, 19.705078125, 20.33984375, 20.974609375, 21.609375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 6.0, 3.0, 3.0, 10.0, 16.0, 23.0, 42.0, 49.0, 105.0, 95.0, 124.0, 217.0, 309.0, 485.0, 722.0, 1074.0, 1623.0, 2639.0, 4273.0, 7547.0, 14599.0, 30592.0, 84489.0, 416019.0, 348289.0, 75031.0, 27975.0, 13552.0, 7252.0, 4155.0, 2591.0, 1527.0, 1044.0, 657.0, 467.0, 290.0, 212.0, 153.0, 83.0, 63.0, 44.0, 40.0, 22.0, 14.0, 14.0, 7.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-151.875, -147.12109375, -142.3671875, -137.61328125, -132.859375, -128.10546875, -123.3515625, -118.59765625, -113.84375, -109.08984375, -104.3359375, -99.58203125, -94.828125, -90.07421875, -85.3203125, -80.56640625, -75.8125, -71.05859375, -66.3046875, -61.55078125, -56.796875, -52.04296875, -47.2890625, -42.53515625, -37.78125, -33.02734375, -28.2734375, -23.51953125, -18.765625, -14.01171875, -9.2578125, -4.50390625, 0.25, 5.00390625, 9.7578125, 14.51171875, 19.265625, 24.01953125, 28.7734375, 33.52734375, 38.28125, 43.03515625, 47.7890625, 52.54296875, 57.296875, 62.05078125, 66.8046875, 71.55859375, 76.3125, 81.06640625, 85.8203125, 90.57421875, 95.328125, 100.08203125, 104.8359375, 109.58984375, 114.34375, 119.09765625, 123.8515625, 128.60546875, 133.359375, 138.11328125, 142.8671875, 147.62109375, 152.375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 1.0, 3.0, 2.0, 4.0, 8.0, 7.0, 9.0, 9.0, 16.0, 18.0, 31.0, 60.0, 120.0, 255.0, 197.0, 99.0, 52.0, 33.0, 15.0, 17.0, 11.0, 9.0, 6.0, 3.0, 2.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0195770263671875, -0.018816471099853516, -0.01805591583251953, -0.017295360565185547, -0.016534805297851562, -0.015774250030517578, -0.015013694763183594, -0.01425313949584961, -0.013492584228515625, -0.01273202896118164, -0.011971473693847656, -0.011210918426513672, -0.010450363159179688, -0.009689807891845703, -0.008929252624511719, -0.008168697357177734, -0.00740814208984375, -0.006647586822509766, -0.005887031555175781, -0.005126476287841797, -0.0043659210205078125, -0.003605365753173828, -0.0028448104858398438, -0.0020842552185058594, -0.001323699951171875, -0.0005631446838378906, 0.00019741058349609375, 0.0009579658508300781, 0.0017185211181640625, 0.002479076385498047, 0.0032396316528320312, 0.004000186920166016, 0.0047607421875, 0.005521297454833984, 0.006281852722167969, 0.007042407989501953, 0.0078029632568359375, 0.008563518524169922, 0.009324073791503906, 0.01008462905883789, 0.010845184326171875, 0.01160573959350586, 0.012366294860839844, 0.013126850128173828, 0.013887405395507812, 0.014647960662841797, 0.015408515930175781, 0.016169071197509766, 0.01692962646484375, 0.017690181732177734, 0.01845073699951172, 0.019211292266845703, 0.019971847534179688, 0.020732402801513672, 0.021492958068847656, 0.02225351333618164, 0.023014068603515625, 0.02377462387084961, 0.024535179138183594, 0.025295734405517578, 0.026056289672851562, 0.026816844940185547, 0.02757740020751953, 0.028337955474853516, 0.0290985107421875]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 6.0, 4.0, 4.0, 12.0, 13.0, 19.0, 20.0, 38.0, 53.0, 74.0, 101.0, 142.0, 185.0, 315.0, 415.0, 655.0, 990.0, 1549.0, 2548.0, 4335.0, 8141.0, 16760.0, 41404.0, 148888.0, 489880.0, 231220.0, 56102.0, 21568.0, 9814.0, 5100.0, 2948.0, 1790.0, 1128.0, 734.0, 505.0, 360.0, 240.0, 141.0, 107.0, 82.0, 51.0, 30.0, 30.0, 20.0, 9.0, 6.0, 8.0, 8.0, 4.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-123.5625, -119.8896484375, -116.216796875, -112.5439453125, -108.87109375, -105.1982421875, -101.525390625, -97.8525390625, -94.1796875, -90.5068359375, -86.833984375, -83.1611328125, -79.48828125, -75.8154296875, -72.142578125, -68.4697265625, -64.796875, -61.1240234375, -57.451171875, -53.7783203125, -50.10546875, -46.4326171875, -42.759765625, -39.0869140625, -35.4140625, -31.7412109375, -28.068359375, -24.3955078125, -20.72265625, -17.0498046875, -13.376953125, -9.7041015625, -6.03125, -2.3583984375, 1.314453125, 4.9873046875, 8.66015625, 12.3330078125, 16.005859375, 19.6787109375, 23.3515625, 27.0244140625, 30.697265625, 34.3701171875, 38.04296875, 41.7158203125, 45.388671875, 49.0615234375, 52.734375, 56.4072265625, 60.080078125, 63.7529296875, 67.42578125, 71.0986328125, 74.771484375, 78.4443359375, 82.1171875, 85.7900390625, 89.462890625, 93.1357421875, 96.80859375, 100.4814453125, 104.154296875, 107.8271484375, 111.5]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 3.0, 2.0, 5.0, 4.0, 9.0, 12.0, 14.0, 14.0, 21.0, 19.0, 25.0, 55.0, 68.0, 102.0, 94.0, 116.0, 106.0, 84.0, 78.0, 44.0, 28.0, 27.0, 13.0, 10.0, 12.0, 8.0, 10.0, 3.0, 2.0, 1.0, 3.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-30.65625, -29.768798828125, -28.88134765625, -27.993896484375, -27.1064453125, -26.218994140625, -25.33154296875, -24.444091796875, -23.556640625, -22.669189453125, -21.78173828125, -20.894287109375, -20.0068359375, -19.119384765625, -18.23193359375, -17.344482421875, -16.45703125, -15.569580078125, -14.68212890625, -13.794677734375, -12.9072265625, -12.019775390625, -11.13232421875, -10.244873046875, -9.357421875, -8.469970703125, -7.58251953125, -6.695068359375, -5.8076171875, -4.920166015625, -4.03271484375, -3.145263671875, -2.2578125, -1.370361328125, -0.48291015625, 0.404541015625, 1.2919921875, 2.179443359375, 3.06689453125, 3.954345703125, 4.841796875, 5.729248046875, 6.61669921875, 7.504150390625, 8.3916015625, 9.279052734375, 10.16650390625, 11.053955078125, 11.94140625, 12.828857421875, 13.71630859375, 14.603759765625, 15.4912109375, 16.378662109375, 17.26611328125, 18.153564453125, 19.041015625, 19.928466796875, 20.81591796875, 21.703369140625, 22.5908203125, 23.478271484375, 24.36572265625, 25.253173828125, 26.140625]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 3.0, 2.0, 3.0, 4.0, 7.0, 8.0, 8.0, 9.0, 9.0, 16.0, 24.0, 25.0, 24.0, 22.0, 30.0, 28.0, 41.0, 49.0, 45.0, 49.0, 52.0, 60.0, 55.0, 52.0, 46.0, 49.0, 45.0, 37.0, 30.0, 30.0, 17.0, 24.0, 18.0, 14.0, 16.0, 5.0, 11.0, 8.0, 8.0, 6.0, 2.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-39.827659606933594, -38.600399017333984, -37.37313461303711, -36.1458740234375, -34.91861343383789, -33.69135284423828, -32.464088439941406, -31.236827850341797, -30.009565353393555, -28.782302856445312, -27.555042266845703, -26.32777976989746, -25.10051727294922, -23.87325668334961, -22.645994186401367, -21.418731689453125, -20.191471099853516, -18.964208602905273, -17.736948013305664, -16.509685516357422, -15.282423973083496, -14.05516242980957, -12.827899932861328, -11.600638389587402, -10.373376846313477, -9.14611530303955, -7.918853282928467, -6.691591262817383, -5.464329719543457, -4.237068176269531, -3.0098061561584473, -1.7825441360473633, -0.5552825927734375, 0.6719791889190674, 1.8992409706115723, 3.126502752304077, 4.353764533996582, 5.581026077270508, 6.808288097381592, 8.035550117492676, 9.262811660766602, 10.490073204040527, 11.717334747314453, 12.944597244262695, 14.171858787536621, 15.399120330810547, 16.62638282775879, 17.85364532470703, 19.08090591430664, 20.308168411254883, 21.535429000854492, 22.762691497802734, 23.989952087402344, 25.217214584350586, 26.444477081298828, 27.671737670898438, 28.89900016784668, 30.126262664794922, 31.35352325439453, 32.58078384399414, 33.808048248291016, 35.035308837890625, 36.262569427490234, 37.48983383178711, 38.71709442138672]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 4.0, 3.0, 4.0, 2.0, 2.0, 3.0, 6.0, 3.0, 11.0, 12.0, 17.0, 15.0, 21.0, 20.0, 21.0, 24.0, 19.0, 21.0, 35.0, 41.0, 33.0, 43.0, 25.0, 29.0, 38.0, 34.0, 47.0, 46.0, 42.0, 37.0, 43.0, 34.0, 30.0, 30.0, 36.0, 27.0, 22.0, 24.0, 12.0, 22.0, 13.0, 9.0, 13.0, 5.0, 10.0, 10.0, 7.0, 0.0, 4.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-27.89644432067871, -26.964345932006836, -26.032249450683594, -25.10015106201172, -24.168052673339844, -23.2359561920166, -22.303857803344727, -21.371761322021484, -20.43966293334961, -19.507564544677734, -18.575468063354492, -17.643369674682617, -16.711273193359375, -15.7791748046875, -14.847076416015625, -13.914978981018066, -12.982881546020508, -12.05078411102295, -11.11868667602539, -10.186588287353516, -9.254490852355957, -8.322393417358398, -7.390295505523682, -6.458197593688965, -5.526100158691406, -4.594002723693848, -3.661904811859131, -2.729807138442993, -1.7977094650268555, -0.8656120300292969, 0.06648588180541992, 0.9985837936401367, 1.9306812286376953, 2.862778902053833, 3.7948765754699707, 4.7269744873046875, 5.659071922302246, 6.591169357299805, 7.5232672691345215, 8.455365180969238, 9.387462615966797, 10.319560050964355, 11.251657485961914, 12.183755874633789, 13.115853309631348, 14.047950744628906, 14.980049133300781, 15.91214656829834, 16.8442440032959, 17.776342391967773, 18.708438873291016, 19.64053726196289, 20.572635650634766, 21.504732131958008, 22.436830520629883, 23.368927001953125, 24.301025390625, 25.233123779296875, 26.165220260620117, 27.097318649291992, 28.029415130615234, 28.96151351928711, 29.893611907958984, 30.82571029663086, 31.7578067779541]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 9.0, 15.0, 23.0, 41.0, 57.0, 87.0, 148.0, 250.0, 359.0, 631.0, 970.0, 1481.0, 2499.0, 3759.0, 6172.0, 9731.0, 15526.0, 25069.0, 38944.0, 58360.0, 84413.0, 113926.0, 135581.0, 140281.0, 123280.0, 95068.0, 67366.0, 45274.0, 29106.0, 18570.0, 11722.0, 7312.0, 4631.0, 2937.0, 1854.0, 1129.0, 762.0, 462.0, 263.0, 191.0, 119.0, 72.0, 40.0, 29.0, 18.0, 9.0, 6.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-44.125, -42.75390625, -41.3828125, -40.01171875, -38.640625, -37.26953125, -35.8984375, -34.52734375, -33.15625, -31.78515625, -30.4140625, -29.04296875, -27.671875, -26.30078125, -24.9296875, -23.55859375, -22.1875, -20.81640625, -19.4453125, -18.07421875, -16.703125, -15.33203125, -13.9609375, -12.58984375, -11.21875, -9.84765625, -8.4765625, -7.10546875, -5.734375, -4.36328125, -2.9921875, -1.62109375, -0.25, 1.12109375, 2.4921875, 3.86328125, 5.234375, 6.60546875, 7.9765625, 9.34765625, 10.71875, 12.08984375, 13.4609375, 14.83203125, 16.203125, 17.57421875, 18.9453125, 20.31640625, 21.6875, 23.05859375, 24.4296875, 25.80078125, 27.171875, 28.54296875, 29.9140625, 31.28515625, 32.65625, 34.02734375, 35.3984375, 36.76953125, 38.140625, 39.51171875, 40.8828125, 42.25390625, 43.625]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 4.0, 1.0, 3.0, 2.0, 2.0, 7.0, 6.0, 3.0, 5.0, 11.0, 16.0, 12.0, 18.0, 23.0, 20.0, 17.0, 23.0, 26.0, 33.0, 30.0, 25.0, 28.0, 40.0, 32.0, 30.0, 42.0, 41.0, 36.0, 49.0, 36.0, 42.0, 34.0, 31.0, 33.0, 27.0, 40.0, 28.0, 22.0, 27.0, 16.0, 14.0, 7.0, 12.0, 13.0, 11.0, 11.0, 6.0, 3.0, 4.0, 3.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-24.296875, -23.481201171875, -22.66552734375, -21.849853515625, -21.0341796875, -20.218505859375, -19.40283203125, -18.587158203125, -17.771484375, -16.955810546875, -16.14013671875, -15.324462890625, -14.5087890625, -13.693115234375, -12.87744140625, -12.061767578125, -11.24609375, -10.430419921875, -9.61474609375, -8.799072265625, -7.9833984375, -7.167724609375, -6.35205078125, -5.536376953125, -4.720703125, -3.905029296875, -3.08935546875, -2.273681640625, -1.4580078125, -0.642333984375, 0.17333984375, 0.989013671875, 1.8046875, 2.620361328125, 3.43603515625, 4.251708984375, 5.0673828125, 5.883056640625, 6.69873046875, 7.514404296875, 8.330078125, 9.145751953125, 9.96142578125, 10.777099609375, 11.5927734375, 12.408447265625, 13.22412109375, 14.039794921875, 14.85546875, 15.671142578125, 16.48681640625, 17.302490234375, 18.1181640625, 18.933837890625, 19.74951171875, 20.565185546875, 21.380859375, 22.196533203125, 23.01220703125, 23.827880859375, 24.6435546875, 25.459228515625, 26.27490234375, 27.090576171875, 27.90625]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 4.0, 8.0, 17.0, 21.0, 27.0, 40.0, 62.0, 99.0, 148.0, 220.0, 355.0, 497.0, 801.0, 1180.0, 1693.0, 2550.0, 3917.0, 6234.0, 9123.0, 14076.0, 20698.0, 31184.0, 45645.0, 65069.0, 88437.0, 111231.0, 125804.0, 125228.0, 109567.0, 86687.0, 63401.0, 44619.0, 30325.0, 20136.0, 13456.0, 8742.0, 5722.0, 4017.0, 2516.0, 1645.0, 1108.0, 770.0, 498.0, 330.0, 247.0, 149.0, 87.0, 54.0, 29.0, 36.0, 27.0, 15.0, 5.0, 6.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-37.65625, -36.3994140625, -35.142578125, -33.8857421875, -32.62890625, -31.3720703125, -30.115234375, -28.8583984375, -27.6015625, -26.3447265625, -25.087890625, -23.8310546875, -22.57421875, -21.3173828125, -20.060546875, -18.8037109375, -17.546875, -16.2900390625, -15.033203125, -13.7763671875, -12.51953125, -11.2626953125, -10.005859375, -8.7490234375, -7.4921875, -6.2353515625, -4.978515625, -3.7216796875, -2.46484375, -1.2080078125, 0.048828125, 1.3056640625, 2.5625, 3.8193359375, 5.076171875, 6.3330078125, 7.58984375, 8.8466796875, 10.103515625, 11.3603515625, 12.6171875, 13.8740234375, 15.130859375, 16.3876953125, 17.64453125, 18.9013671875, 20.158203125, 21.4150390625, 22.671875, 23.9287109375, 25.185546875, 26.4423828125, 27.69921875, 28.9560546875, 30.212890625, 31.4697265625, 32.7265625, 33.9833984375, 35.240234375, 36.4970703125, 37.75390625, 39.0107421875, 40.267578125, 41.5244140625, 42.78125]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 1.0, 3.0, 6.0, 9.0, 9.0, 6.0, 7.0, 9.0, 12.0, 9.0, 15.0, 14.0, 21.0, 23.0, 24.0, 23.0, 38.0, 42.0, 44.0, 26.0, 33.0, 33.0, 40.0, 42.0, 29.0, 41.0, 44.0, 43.0, 41.0, 38.0, 41.0, 27.0, 22.0, 20.0, 27.0, 26.0, 17.0, 17.0, 18.0, 16.0, 9.0, 8.0, 11.0, 5.0, 7.0, 4.0, 1.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.75, -19.142822265625, -18.53564453125, -17.928466796875, -17.3212890625, -16.714111328125, -16.10693359375, -15.499755859375, -14.892578125, -14.285400390625, -13.67822265625, -13.071044921875, -12.4638671875, -11.856689453125, -11.24951171875, -10.642333984375, -10.03515625, -9.427978515625, -8.82080078125, -8.213623046875, -7.6064453125, -6.999267578125, -6.39208984375, -5.784912109375, -5.177734375, -4.570556640625, -3.96337890625, -3.356201171875, -2.7490234375, -2.141845703125, -1.53466796875, -0.927490234375, -0.3203125, 0.286865234375, 0.89404296875, 1.501220703125, 2.1083984375, 2.715576171875, 3.32275390625, 3.929931640625, 4.537109375, 5.144287109375, 5.75146484375, 6.358642578125, 6.9658203125, 7.572998046875, 8.18017578125, 8.787353515625, 9.39453125, 10.001708984375, 10.60888671875, 11.216064453125, 11.8232421875, 12.430419921875, 13.03759765625, 13.644775390625, 14.251953125, 14.859130859375, 15.46630859375, 16.073486328125, 16.6806640625, 17.287841796875, 17.89501953125, 18.502197265625, 19.109375]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 5.0, 1.0, 3.0, 5.0, 6.0, 8.0, 18.0, 20.0, 29.0, 25.0, 64.0, 100.0, 123.0, 230.0, 331.0, 473.0, 684.0, 1178.0, 1923.0, 3178.0, 5587.0, 10124.0, 18653.0, 36793.0, 73576.0, 142034.0, 222746.0, 226179.0, 146242.0, 75858.0, 38006.0, 19645.0, 10344.0, 5825.0, 3221.0, 1938.0, 1193.0, 757.0, 484.0, 333.0, 212.0, 142.0, 89.0, 57.0, 41.0, 18.0, 21.0, 16.0, 17.0, 4.0, 3.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.78125, -37.53125, -36.28125, -35.03125, -33.78125, -32.53125, -31.28125, -30.03125, -28.78125, -27.53125, -26.28125, -25.03125, -23.78125, -22.53125, -21.28125, -20.03125, -18.78125, -17.53125, -16.28125, -15.03125, -13.78125, -12.53125, -11.28125, -10.03125, -8.78125, -7.53125, -6.28125, -5.03125, -3.78125, -2.53125, -1.28125, -0.03125, 1.21875, 2.46875, 3.71875, 4.96875, 6.21875, 7.46875, 8.71875, 9.96875, 11.21875, 12.46875, 13.71875, 14.96875, 16.21875, 17.46875, 18.71875, 19.96875, 21.21875, 22.46875, 23.71875, 24.96875, 26.21875, 27.46875, 28.71875, 29.96875, 31.21875, 32.46875, 33.71875, 34.96875, 36.21875, 37.46875, 38.71875, 39.96875, 41.21875]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 3.0, 2.0, 7.0, 5.0, 3.0, 15.0, 11.0, 16.0, 19.0, 31.0, 20.0, 46.0, 51.0, 60.0, 54.0, 68.0, 83.0, 59.0, 48.0, 62.0, 59.0, 49.0, 42.0, 46.0, 26.0, 14.0, 21.0, 17.0, 15.0, 6.0, 12.0, 4.0, 11.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0036468505859375, -0.0035337507724761963, -0.0034206509590148926, -0.003307551145553589, -0.003194451332092285, -0.0030813515186309814, -0.0029682517051696777, -0.002855151891708374, -0.0027420520782470703, -0.0026289522647857666, -0.002515852451324463, -0.002402752637863159, -0.0022896528244018555, -0.0021765530109405518, -0.002063453197479248, -0.0019503533840179443, -0.0018372535705566406, -0.001724153757095337, -0.0016110539436340332, -0.0014979541301727295, -0.0013848543167114258, -0.001271754503250122, -0.0011586546897888184, -0.0010455548763275146, -0.0009324550628662109, -0.0008193552494049072, -0.0007062554359436035, -0.0005931556224822998, -0.0004800558090209961, -0.0003669559955596924, -0.00025385618209838867, -0.00014075636863708496, -2.765655517578125e-05, 8.544325828552246e-05, 0.00019854307174682617, 0.0003116428852081299, 0.0004247426986694336, 0.0005378425121307373, 0.000650942325592041, 0.0007640421390533447, 0.0008771419525146484, 0.0009902417659759521, 0.0011033415794372559, 0.0012164413928985596, 0.0013295412063598633, 0.001442641019821167, 0.0015557408332824707, 0.0016688406467437744, 0.0017819404602050781, 0.0018950402736663818, 0.0020081400871276855, 0.0021212399005889893, 0.002234339714050293, 0.0023474395275115967, 0.0024605393409729004, 0.002573639154434204, 0.002686738967895508, 0.0027998387813568115, 0.0029129385948181152, 0.003026038408279419, 0.0031391382217407227, 0.0032522380352020264, 0.00336533784866333, 0.003478437662124634, 0.0035915374755859375]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 12.0, 16.0, 16.0, 24.0, 32.0, 56.0, 68.0, 104.0, 154.0, 218.0, 343.0, 480.0, 729.0, 1087.0, 1633.0, 2571.0, 3980.0, 6749.0, 11463.0, 19655.0, 35476.0, 64590.0, 114992.0, 180562.0, 208947.0, 164940.0, 100583.0, 55352.0, 30313.0, 16957.0, 10054.0, 5958.0, 3636.0, 2327.0, 1534.0, 971.0, 627.0, 428.0, 295.0, 211.0, 125.0, 93.0, 68.0, 41.0, 29.0, 24.0, 9.0, 13.0, 8.0, 8.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-30.9375, -29.9189453125, -28.900390625, -27.8818359375, -26.86328125, -25.8447265625, -24.826171875, -23.8076171875, -22.7890625, -21.7705078125, -20.751953125, -19.7333984375, -18.71484375, -17.6962890625, -16.677734375, -15.6591796875, -14.640625, -13.6220703125, -12.603515625, -11.5849609375, -10.56640625, -9.5478515625, -8.529296875, -7.5107421875, -6.4921875, -5.4736328125, -4.455078125, -3.4365234375, -2.41796875, -1.3994140625, -0.380859375, 0.6376953125, 1.65625, 2.6748046875, 3.693359375, 4.7119140625, 5.73046875, 6.7490234375, 7.767578125, 8.7861328125, 9.8046875, 10.8232421875, 11.841796875, 12.8603515625, 13.87890625, 14.8974609375, 15.916015625, 16.9345703125, 17.953125, 18.9716796875, 19.990234375, 21.0087890625, 22.02734375, 23.0458984375, 24.064453125, 25.0830078125, 26.1015625, 27.1201171875, 28.138671875, 29.1572265625, 30.17578125, 31.1943359375, 32.212890625, 33.2314453125, 34.25]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 5.0, 6.0, 10.0, 9.0, 11.0, 21.0, 16.0, 28.0, 29.0, 44.0, 59.0, 69.0, 66.0, 83.0, 77.0, 80.0, 63.0, 73.0, 49.0, 42.0, 27.0, 32.0, 21.0, 15.0, 7.0, 14.0, 9.0, 6.0, 10.0, 7.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.953125, -10.5537109375, -10.154296875, -9.7548828125, -9.35546875, -8.9560546875, -8.556640625, -8.1572265625, -7.7578125, -7.3583984375, -6.958984375, -6.5595703125, -6.16015625, -5.7607421875, -5.361328125, -4.9619140625, -4.5625, -4.1630859375, -3.763671875, -3.3642578125, -2.96484375, -2.5654296875, -2.166015625, -1.7666015625, -1.3671875, -0.9677734375, -0.568359375, -0.1689453125, 0.23046875, 0.6298828125, 1.029296875, 1.4287109375, 1.828125, 2.2275390625, 2.626953125, 3.0263671875, 3.42578125, 3.8251953125, 4.224609375, 4.6240234375, 5.0234375, 5.4228515625, 5.822265625, 6.2216796875, 6.62109375, 7.0205078125, 7.419921875, 7.8193359375, 8.21875, 8.6181640625, 9.017578125, 9.4169921875, 9.81640625, 10.2158203125, 10.615234375, 11.0146484375, 11.4140625, 11.8134765625, 12.212890625, 12.6123046875, 13.01171875, 13.4111328125, 13.810546875, 14.2099609375, 14.609375]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 6.0, 9.0, 11.0, 6.0, 11.0, 9.0, 9.0, 16.0, 11.0, 17.0, 40.0, 22.0, 23.0, 34.0, 34.0, 44.0, 52.0, 53.0, 46.0, 54.0, 49.0, 47.0, 44.0, 38.0, 31.0, 35.0, 38.0, 32.0, 29.0, 34.0, 21.0, 19.0, 11.0, 15.0, 6.0, 7.0, 9.0, 4.0, 6.0, 5.0, 2.0, 1.0, 0.0, 1.0, 5.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-33.787757873535156, -32.69562530517578, -31.60348892211914, -30.511354446411133, -29.419219970703125, -28.32708740234375, -27.234952926635742, -26.142818450927734, -25.050683975219727, -23.95854949951172, -22.86641502380371, -21.774280548095703, -20.682147979736328, -19.590011596679688, -18.497879028320312, -17.405744552612305, -16.313610076904297, -15.221475601196289, -14.129341125488281, -13.03720760345459, -11.945073127746582, -10.852938652038574, -9.760805130004883, -8.668670654296875, -7.576536178588867, -6.484401702880859, -5.39226770401001, -4.30013370513916, -3.2079992294311523, -2.1158647537231445, -1.023730754852295, 0.06840324401855469, 1.1605415344238281, 2.252675771713257, 3.3448100090026855, 4.436944007873535, 5.529078483581543, 6.621212959289551, 7.7133469581604, 8.80548095703125, 9.897615432739258, 10.989749908447266, 12.081884384155273, 13.174017906188965, 14.266152381896973, 15.35828685760498, 16.450420379638672, 17.54255485534668, 18.634689331054688, 19.726823806762695, 20.818958282470703, 21.91109275817871, 23.00322723388672, 24.095359802246094, 25.1874942779541, 26.27962875366211, 27.371763229370117, 28.463897705078125, 29.556032180786133, 30.64816665649414, 31.740299224853516, 32.832435607910156, 33.92456817626953, 35.016700744628906, 36.10883712768555]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 5.0, 11.0, 7.0, 11.0, 10.0, 15.0, 17.0, 13.0, 25.0, 31.0, 29.0, 34.0, 32.0, 54.0, 56.0, 46.0, 56.0, 50.0, 48.0, 45.0, 57.0, 40.0, 39.0, 41.0, 33.0, 33.0, 34.0, 24.0, 15.0, 27.0, 13.0, 17.0, 9.0, 5.0, 6.0, 5.0, 5.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.968156814575195, -30.830211639404297, -29.6922664642334, -28.5543212890625, -27.4163761138916, -26.278430938720703, -25.140485763549805, -24.002540588378906, -22.864595413208008, -21.72665023803711, -20.58870506286621, -19.450759887695312, -18.312814712524414, -17.174869537353516, -16.036924362182617, -14.898979187011719, -13.76103401184082, -12.623088836669922, -11.485143661499023, -10.347198486328125, -9.209253311157227, -8.071308135986328, -6.93336296081543, -5.795417785644531, -4.657472610473633, -3.5195274353027344, -2.381582260131836, -1.2436370849609375, -0.10569190979003906, 1.0322532653808594, 2.170198440551758, 3.3081436157226562, 4.4460906982421875, 5.584035873413086, 6.721981048583984, 7.859926223754883, 8.997871398925781, 10.13581657409668, 11.273761749267578, 12.411706924438477, 13.549652099609375, 14.687597274780273, 15.825542449951172, 16.96348762512207, 18.10143280029297, 19.239377975463867, 20.377323150634766, 21.515268325805664, 22.653213500976562, 23.79115867614746, 24.92910385131836, 26.067049026489258, 27.204994201660156, 28.342939376831055, 29.480884552001953, 30.61882972717285, 31.75677490234375, 32.89472198486328, 34.03266525268555, 35.17060852050781, 36.308555603027344, 37.446502685546875, 38.58444595336914, 39.722389221191406, 40.86033630371094]}, "gradients/decoder.bert.encoder.layer.21.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 1.0, 3.0, 4.0, 3.0, 12.0, 17.0, 26.0, 52.0, 77.0, 95.0, 161.0, 254.0, 395.0, 669.0, 971.0, 1638.0, 2573.0, 4082.0, 6746.0, 10943.0, 18431.0, 30587.0, 52133.0, 90454.0, 159476.0, 286359.0, 509986.0, 779319.0, 836852.0, 601227.0, 346018.0, 192161.0, 108311.0, 62337.0, 36288.0, 21576.0, 13070.0, 7890.0, 4912.0, 3022.0, 1875.0, 1204.0, 735.0, 511.0, 302.0, 209.0, 114.0, 76.0, 53.0, 24.0, 20.0, 19.0, 9.0, 8.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0], "bins": [-33.3125, -32.27685546875, -31.2412109375, -30.20556640625, -29.169921875, -28.13427734375, -27.0986328125, -26.06298828125, -25.02734375, -23.99169921875, -22.9560546875, -21.92041015625, -20.884765625, -19.84912109375, -18.8134765625, -17.77783203125, -16.7421875, -15.70654296875, -14.6708984375, -13.63525390625, -12.599609375, -11.56396484375, -10.5283203125, -9.49267578125, -8.45703125, -7.42138671875, -6.3857421875, -5.35009765625, -4.314453125, -3.27880859375, -2.2431640625, -1.20751953125, -0.171875, 0.86376953125, 1.8994140625, 2.93505859375, 3.970703125, 5.00634765625, 6.0419921875, 7.07763671875, 8.11328125, 9.14892578125, 10.1845703125, 11.22021484375, 12.255859375, 13.29150390625, 14.3271484375, 15.36279296875, 16.3984375, 17.43408203125, 18.4697265625, 19.50537109375, 20.541015625, 21.57666015625, 22.6123046875, 23.64794921875, 24.68359375, 25.71923828125, 26.7548828125, 27.79052734375, 28.826171875, 29.86181640625, 30.8974609375, 31.93310546875, 32.96875]}, "gradients/decoder.bert.encoder.layer.21.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 3.0, 7.0, 4.0, 5.0, 10.0, 14.0, 13.0, 25.0, 26.0, 25.0, 29.0, 35.0, 27.0, 25.0, 48.0, 49.0, 51.0, 45.0, 55.0, 57.0, 59.0, 53.0, 46.0, 33.0, 31.0, 33.0, 29.0, 30.0, 39.0, 21.0, 21.0, 17.0, 10.0, 5.0, 11.0, 5.0, 3.0, 4.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.046875, -21.20263671875, -20.3583984375, -19.51416015625, -18.669921875, -17.82568359375, -16.9814453125, -16.13720703125, -15.29296875, -14.44873046875, -13.6044921875, -12.76025390625, -11.916015625, -11.07177734375, -10.2275390625, -9.38330078125, -8.5390625, -7.69482421875, -6.8505859375, -6.00634765625, -5.162109375, -4.31787109375, -3.4736328125, -2.62939453125, -1.78515625, -0.94091796875, -0.0966796875, 0.74755859375, 1.591796875, 2.43603515625, 3.2802734375, 4.12451171875, 4.96875, 5.81298828125, 6.6572265625, 7.50146484375, 8.345703125, 9.18994140625, 10.0341796875, 10.87841796875, 11.72265625, 12.56689453125, 13.4111328125, 14.25537109375, 15.099609375, 15.94384765625, 16.7880859375, 17.63232421875, 18.4765625, 19.32080078125, 20.1650390625, 21.00927734375, 21.853515625, 22.69775390625, 23.5419921875, 24.38623046875, 25.23046875, 26.07470703125, 26.9189453125, 27.76318359375, 28.607421875, 29.45166015625, 30.2958984375, 31.14013671875, 31.984375]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 8.0, 6.0, 18.0, 21.0, 44.0, 61.0, 100.0, 123.0, 209.0, 311.0, 462.0, 733.0, 1165.0, 1777.0, 2879.0, 4483.0, 7245.0, 11346.0, 18661.0, 29685.0, 48420.0, 78305.0, 127232.0, 205277.0, 324112.0, 489041.0, 655704.0, 684850.0, 535081.0, 361712.0, 230201.0, 143491.0, 87573.0, 54148.0, 33682.0, 20776.0, 12851.0, 8244.0, 5230.0, 3256.0, 2030.0, 1360.0, 815.0, 521.0, 372.0, 230.0, 175.0, 90.0, 69.0, 38.0, 30.0, 15.0, 7.0, 14.0, 3.0, 4.0, 1.0], "bins": [-32.5, -31.547607421875, -30.59521484375, -29.642822265625, -28.6904296875, -27.738037109375, -26.78564453125, -25.833251953125, -24.880859375, -23.928466796875, -22.97607421875, -22.023681640625, -21.0712890625, -20.118896484375, -19.16650390625, -18.214111328125, -17.26171875, -16.309326171875, -15.35693359375, -14.404541015625, -13.4521484375, -12.499755859375, -11.54736328125, -10.594970703125, -9.642578125, -8.690185546875, -7.73779296875, -6.785400390625, -5.8330078125, -4.880615234375, -3.92822265625, -2.975830078125, -2.0234375, -1.071044921875, -0.11865234375, 0.833740234375, 1.7861328125, 2.738525390625, 3.69091796875, 4.643310546875, 5.595703125, 6.548095703125, 7.50048828125, 8.452880859375, 9.4052734375, 10.357666015625, 11.31005859375, 12.262451171875, 13.21484375, 14.167236328125, 15.11962890625, 16.072021484375, 17.0244140625, 17.976806640625, 18.92919921875, 19.881591796875, 20.833984375, 21.786376953125, 22.73876953125, 23.691162109375, 24.6435546875, 25.595947265625, 26.54833984375, 27.500732421875, 28.453125]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 5.0, 7.0, 5.0, 8.0, 13.0, 21.0, 20.0, 28.0, 22.0, 38.0, 50.0, 63.0, 92.0, 98.0, 109.0, 123.0, 144.0, 176.0, 186.0, 211.0, 216.0, 255.0, 228.0, 212.0, 235.0, 206.0, 169.0, 184.0, 165.0, 119.0, 101.0, 104.0, 72.0, 81.0, 74.0, 58.0, 37.0, 39.0, 25.0, 11.0, 17.0, 16.0, 13.0, 6.0, 5.0, 7.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.53125, -10.1593017578125, -9.787353515625, -9.4154052734375, -9.04345703125, -8.6715087890625, -8.299560546875, -7.9276123046875, -7.5556640625, -7.1837158203125, -6.811767578125, -6.4398193359375, -6.06787109375, -5.6959228515625, -5.323974609375, -4.9520263671875, -4.580078125, -4.2081298828125, -3.836181640625, -3.4642333984375, -3.09228515625, -2.7203369140625, -2.348388671875, -1.9764404296875, -1.6044921875, -1.2325439453125, -0.860595703125, -0.4886474609375, -0.11669921875, 0.2552490234375, 0.627197265625, 0.9991455078125, 1.37109375, 1.7430419921875, 2.114990234375, 2.4869384765625, 2.85888671875, 3.2308349609375, 3.602783203125, 3.9747314453125, 4.3466796875, 4.7186279296875, 5.090576171875, 5.4625244140625, 5.83447265625, 6.2064208984375, 6.578369140625, 6.9503173828125, 7.322265625, 7.6942138671875, 8.066162109375, 8.4381103515625, 8.81005859375, 9.1820068359375, 9.553955078125, 9.9259033203125, 10.2978515625, 10.6697998046875, 11.041748046875, 11.4136962890625, 11.78564453125, 12.1575927734375, 12.529541015625, 12.9014892578125, 13.2734375]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 7.0, 9.0, 5.0, 10.0, 14.0, 13.0, 16.0, 15.0, 14.0, 21.0, 34.0, 26.0, 35.0, 49.0, 32.0, 44.0, 56.0, 52.0, 48.0, 51.0, 42.0, 38.0, 48.0, 39.0, 50.0, 35.0, 38.0, 24.0, 29.0, 16.0, 23.0, 15.0, 13.0, 5.0, 8.0, 7.0, 6.0, 5.0, 1.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-34.612056732177734, -33.548973083496094, -32.48588943481445, -31.422807693481445, -30.359725952148438, -29.296642303466797, -28.233558654785156, -27.170475006103516, -26.107393264770508, -25.044309616088867, -23.98122787475586, -22.91814422607422, -21.855060577392578, -20.79197883605957, -19.72889518737793, -18.665813446044922, -17.60272979736328, -16.53964614868164, -15.476564407348633, -14.413480758666992, -13.350398063659668, -12.287315368652344, -11.224231719970703, -10.161149024963379, -9.098066329956055, -8.03498363494873, -6.971900463104248, -5.908817291259766, -4.845734596252441, -3.782651901245117, -2.7195687294006348, -1.6564855575561523, -0.5934066772460938, 0.46967625617980957, 1.532759189605713, 2.595842123031616, 3.6589250564575195, 4.722007751464844, 5.785090923309326, 6.848174095153809, 7.911256790161133, 8.974339485168457, 10.037422180175781, 11.100505828857422, 12.163588523864746, 13.22667121887207, 14.289754867553711, 15.352837562561035, 16.41592025756836, 17.47900390625, 18.542085647583008, 19.60516929626465, 20.668251037597656, 21.731334686279297, 22.794418334960938, 23.857501983642578, 24.920583724975586, 25.983667373657227, 27.046749114990234, 28.109832763671875, 29.172916412353516, 30.235998153686523, 31.299081802368164, 32.36216354370117, 33.42524719238281]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 4.0, 5.0, 7.0, 6.0, 8.0, 8.0, 22.0, 14.0, 18.0, 22.0, 23.0, 25.0, 30.0, 24.0, 28.0, 38.0, 43.0, 26.0, 37.0, 36.0, 49.0, 48.0, 44.0, 38.0, 31.0, 43.0, 23.0, 31.0, 33.0, 28.0, 37.0, 31.0, 21.0, 18.0, 19.0, 20.0, 11.0, 10.0, 7.0, 8.0, 10.0, 3.0, 3.0, 5.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-27.538476943969727, -26.691091537475586, -25.843708038330078, -24.996322631835938, -24.14893913269043, -23.30155372619629, -22.45417022705078, -21.60678482055664, -20.7593994140625, -19.91201400756836, -19.06463050842285, -18.21724510192871, -17.369861602783203, -16.522476196289062, -15.675091743469238, -14.827707290649414, -13.980323791503906, -13.132939338684082, -12.285554885864258, -11.438169479370117, -10.59078598022461, -9.743400573730469, -8.896016120910645, -8.04863166809082, -7.201247215270996, -6.353862762451172, -5.506478309631348, -4.659093379974365, -3.811708927154541, -2.964324474334717, -2.1169395446777344, -1.2695550918579102, -0.42217254638671875, 0.425212025642395, 1.2725965976715088, 2.119981288909912, 2.9673657417297363, 3.8147501945495605, 4.662135124206543, 5.509519577026367, 6.356904029846191, 7.204288482666016, 8.05167293548584, 8.899057388305664, 9.746442794799805, 10.593826293945312, 11.441211700439453, 12.288596153259277, 13.135980606079102, 13.983365058898926, 14.83074951171875, 15.67813491821289, 16.5255184173584, 17.37290382385254, 18.220287322998047, 19.067672729492188, 19.915058135986328, 20.76244354248047, 21.609827041625977, 22.457212448120117, 23.304595947265625, 24.151981353759766, 24.999366760253906, 25.846750259399414, 26.694133758544922]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 2.0, 5.0, 7.0, 7.0, 20.0, 9.0, 30.0, 26.0, 48.0, 81.0, 114.0, 181.0, 253.0, 380.0, 549.0, 820.0, 1283.0, 1896.0, 2997.0, 4818.0, 7873.0, 12666.0, 21286.0, 36502.0, 61695.0, 103255.0, 159695.0, 196084.0, 165530.0, 108256.0, 64892.0, 38710.0, 22810.0, 13456.0, 8252.0, 4936.0, 3211.0, 2003.0, 1330.0, 841.0, 589.0, 361.0, 266.0, 176.0, 99.0, 87.0, 55.0, 39.0, 24.0, 21.0, 11.0, 11.0, 8.0, 6.0, 1.0, 6.0, 0.0, 1.0, 0.0, 2.0], "bins": [-79.0, -76.49609375, -73.9921875, -71.48828125, -68.984375, -66.48046875, -63.9765625, -61.47265625, -58.96875, -56.46484375, -53.9609375, -51.45703125, -48.953125, -46.44921875, -43.9453125, -41.44140625, -38.9375, -36.43359375, -33.9296875, -31.42578125, -28.921875, -26.41796875, -23.9140625, -21.41015625, -18.90625, -16.40234375, -13.8984375, -11.39453125, -8.890625, -6.38671875, -3.8828125, -1.37890625, 1.125, 3.62890625, 6.1328125, 8.63671875, 11.140625, 13.64453125, 16.1484375, 18.65234375, 21.15625, 23.66015625, 26.1640625, 28.66796875, 31.171875, 33.67578125, 36.1796875, 38.68359375, 41.1875, 43.69140625, 46.1953125, 48.69921875, 51.203125, 53.70703125, 56.2109375, 58.71484375, 61.21875, 63.72265625, 66.2265625, 68.73046875, 71.234375, 73.73828125, 76.2421875, 78.74609375, 81.25]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 6.0, 6.0, 8.0, 9.0, 10.0, 6.0, 16.0, 20.0, 20.0, 27.0, 20.0, 21.0, 30.0, 35.0, 32.0, 34.0, 30.0, 37.0, 46.0, 37.0, 66.0, 49.0, 42.0, 39.0, 45.0, 27.0, 41.0, 32.0, 28.0, 27.0, 16.0, 25.0, 16.0, 26.0, 22.0, 12.0, 14.0, 8.0, 8.0, 6.0, 1.0, 1.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-28.078125, -27.2275390625, -26.376953125, -25.5263671875, -24.67578125, -23.8251953125, -22.974609375, -22.1240234375, -21.2734375, -20.4228515625, -19.572265625, -18.7216796875, -17.87109375, -17.0205078125, -16.169921875, -15.3193359375, -14.46875, -13.6181640625, -12.767578125, -11.9169921875, -11.06640625, -10.2158203125, -9.365234375, -8.5146484375, -7.6640625, -6.8134765625, -5.962890625, -5.1123046875, -4.26171875, -3.4111328125, -2.560546875, -1.7099609375, -0.859375, -0.0087890625, 0.841796875, 1.6923828125, 2.54296875, 3.3935546875, 4.244140625, 5.0947265625, 5.9453125, 6.7958984375, 7.646484375, 8.4970703125, 9.34765625, 10.1982421875, 11.048828125, 11.8994140625, 12.75, 13.6005859375, 14.451171875, 15.3017578125, 16.15234375, 17.0029296875, 17.853515625, 18.7041015625, 19.5546875, 20.4052734375, 21.255859375, 22.1064453125, 22.95703125, 23.8076171875, 24.658203125, 25.5087890625, 26.359375]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 4.0, 7.0, 14.0, 20.0, 28.0, 43.0, 73.0, 86.0, 167.0, 198.0, 298.0, 483.0, 659.0, 1043.0, 1682.0, 2660.0, 4420.0, 7454.0, 13150.0, 24861.0, 48597.0, 104016.0, 223955.0, 296027.0, 162721.0, 74891.0, 36202.0, 18989.0, 10283.0, 5901.0, 3512.0, 2151.0, 1347.0, 858.0, 574.0, 357.0, 288.0, 169.0, 112.0, 91.0, 52.0, 38.0, 27.0, 10.0, 15.0, 9.0, 4.0, 5.0, 1.0, 5.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-98.6875, -95.630859375, -92.57421875, -89.517578125, -86.4609375, -83.404296875, -80.34765625, -77.291015625, -74.234375, -71.177734375, -68.12109375, -65.064453125, -62.0078125, -58.951171875, -55.89453125, -52.837890625, -49.78125, -46.724609375, -43.66796875, -40.611328125, -37.5546875, -34.498046875, -31.44140625, -28.384765625, -25.328125, -22.271484375, -19.21484375, -16.158203125, -13.1015625, -10.044921875, -6.98828125, -3.931640625, -0.875, 2.181640625, 5.23828125, 8.294921875, 11.3515625, 14.408203125, 17.46484375, 20.521484375, 23.578125, 26.634765625, 29.69140625, 32.748046875, 35.8046875, 38.861328125, 41.91796875, 44.974609375, 48.03125, 51.087890625, 54.14453125, 57.201171875, 60.2578125, 63.314453125, 66.37109375, 69.427734375, 72.484375, 75.541015625, 78.59765625, 81.654296875, 84.7109375, 87.767578125, 90.82421875, 93.880859375, 96.9375]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 2.0, 5.0, 5.0, 5.0, 13.0, 11.0, 6.0, 15.0, 13.0, 25.0, 16.0, 27.0, 29.0, 36.0, 40.0, 40.0, 42.0, 43.0, 58.0, 36.0, 37.0, 42.0, 37.0, 46.0, 42.0, 39.0, 41.0, 20.0, 28.0, 26.0, 37.0, 24.0, 24.0, 24.0, 10.0, 11.0, 8.0, 11.0, 6.0, 4.0, 7.0, 8.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.203125, -20.549072265625, -19.89501953125, -19.240966796875, -18.5869140625, -17.932861328125, -17.27880859375, -16.624755859375, -15.970703125, -15.316650390625, -14.66259765625, -14.008544921875, -13.3544921875, -12.700439453125, -12.04638671875, -11.392333984375, -10.73828125, -10.084228515625, -9.43017578125, -8.776123046875, -8.1220703125, -7.468017578125, -6.81396484375, -6.159912109375, -5.505859375, -4.851806640625, -4.19775390625, -3.543701171875, -2.8896484375, -2.235595703125, -1.58154296875, -0.927490234375, -0.2734375, 0.380615234375, 1.03466796875, 1.688720703125, 2.3427734375, 2.996826171875, 3.65087890625, 4.304931640625, 4.958984375, 5.613037109375, 6.26708984375, 6.921142578125, 7.5751953125, 8.229248046875, 8.88330078125, 9.537353515625, 10.19140625, 10.845458984375, 11.49951171875, 12.153564453125, 12.8076171875, 13.461669921875, 14.11572265625, 14.769775390625, 15.423828125, 16.077880859375, 16.73193359375, 17.385986328125, 18.0400390625, 18.694091796875, 19.34814453125, 20.002197265625, 20.65625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 10.0, 11.0, 13.0, 18.0, 30.0, 24.0, 55.0, 75.0, 105.0, 145.0, 192.0, 309.0, 427.0, 616.0, 890.0, 1311.0, 2111.0, 3067.0, 4977.0, 8340.0, 15298.0, 32662.0, 109764.0, 596876.0, 184312.0, 42774.0, 18195.0, 9619.0, 5746.0, 3529.0, 2301.0, 1421.0, 990.0, 651.0, 499.0, 370.0, 251.0, 170.0, 122.0, 82.0, 62.0, 53.0, 27.0, 14.0, 17.0, 9.0, 8.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-152.375, -147.845703125, -143.31640625, -138.787109375, -134.2578125, -129.728515625, -125.19921875, -120.669921875, -116.140625, -111.611328125, -107.08203125, -102.552734375, -98.0234375, -93.494140625, -88.96484375, -84.435546875, -79.90625, -75.376953125, -70.84765625, -66.318359375, -61.7890625, -57.259765625, -52.73046875, -48.201171875, -43.671875, -39.142578125, -34.61328125, -30.083984375, -25.5546875, -21.025390625, -16.49609375, -11.966796875, -7.4375, -2.908203125, 1.62109375, 6.150390625, 10.6796875, 15.208984375, 19.73828125, 24.267578125, 28.796875, 33.326171875, 37.85546875, 42.384765625, 46.9140625, 51.443359375, 55.97265625, 60.501953125, 65.03125, 69.560546875, 74.08984375, 78.619140625, 83.1484375, 87.677734375, 92.20703125, 96.736328125, 101.265625, 105.794921875, 110.32421875, 114.853515625, 119.3828125, 123.912109375, 128.44140625, 132.970703125, 137.5]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 5.0, 4.0, 3.0, 4.0, 9.0, 8.0, 11.0, 13.0, 16.0, 25.0, 36.0, 95.0, 274.0, 269.0, 76.0, 42.0, 20.0, 19.0, 7.0, 8.0, 13.0, 2.0, 5.0, 3.0, 3.0, 6.0, 7.0, 3.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0185546875, -0.01789093017578125, -0.0172271728515625, -0.01656341552734375, -0.015899658203125, -0.01523590087890625, -0.0145721435546875, -0.01390838623046875, -0.01324462890625, -0.01258087158203125, -0.0119171142578125, -0.01125335693359375, -0.010589599609375, -0.00992584228515625, -0.0092620849609375, -0.00859832763671875, -0.0079345703125, -0.00727081298828125, -0.0066070556640625, -0.00594329833984375, -0.005279541015625, -0.00461578369140625, -0.0039520263671875, -0.00328826904296875, -0.00262451171875, -0.00196075439453125, -0.0012969970703125, -0.00063323974609375, 3.0517578125e-05, 0.00069427490234375, 0.0013580322265625, 0.00202178955078125, 0.002685546875, 0.00334930419921875, 0.0040130615234375, 0.00467681884765625, 0.005340576171875, 0.00600433349609375, 0.0066680908203125, 0.00733184814453125, 0.00799560546875, 0.00865936279296875, 0.0093231201171875, 0.00998687744140625, 0.010650634765625, 0.01131439208984375, 0.0119781494140625, 0.01264190673828125, 0.0133056640625, 0.01396942138671875, 0.0146331787109375, 0.01529693603515625, 0.015960693359375, 0.01662445068359375, 0.0172882080078125, 0.01795196533203125, 0.01861572265625, 0.01927947998046875, 0.0199432373046875, 0.02060699462890625, 0.021270751953125, 0.02193450927734375, 0.0225982666015625, 0.02326202392578125, 0.02392578125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 6.0, 9.0, 16.0, 23.0, 37.0, 46.0, 50.0, 72.0, 102.0, 162.0, 238.0, 344.0, 557.0, 813.0, 1285.0, 2061.0, 3373.0, 5559.0, 9355.0, 17526.0, 38478.0, 117393.0, 421733.0, 291464.0, 75171.0, 28342.0, 13998.0, 7888.0, 4624.0, 2910.0, 1717.0, 1024.0, 788.0, 475.0, 291.0, 197.0, 127.0, 84.0, 70.0, 47.0, 21.0, 18.0, 13.0, 8.0, 9.0, 13.0, 8.0, 3.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-95.0, -91.91796875, -88.8359375, -85.75390625, -82.671875, -79.58984375, -76.5078125, -73.42578125, -70.34375, -67.26171875, -64.1796875, -61.09765625, -58.015625, -54.93359375, -51.8515625, -48.76953125, -45.6875, -42.60546875, -39.5234375, -36.44140625, -33.359375, -30.27734375, -27.1953125, -24.11328125, -21.03125, -17.94921875, -14.8671875, -11.78515625, -8.703125, -5.62109375, -2.5390625, 0.54296875, 3.625, 6.70703125, 9.7890625, 12.87109375, 15.953125, 19.03515625, 22.1171875, 25.19921875, 28.28125, 31.36328125, 34.4453125, 37.52734375, 40.609375, 43.69140625, 46.7734375, 49.85546875, 52.9375, 56.01953125, 59.1015625, 62.18359375, 65.265625, 68.34765625, 71.4296875, 74.51171875, 77.59375, 80.67578125, 83.7578125, 86.83984375, 89.921875, 93.00390625, 96.0859375, 99.16796875, 102.25]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 7.0, 9.0, 5.0, 10.0, 5.0, 6.0, 6.0, 12.0, 13.0, 21.0, 18.0, 24.0, 29.0, 55.0, 64.0, 87.0, 102.0, 106.0, 91.0, 69.0, 67.0, 37.0, 39.0, 20.0, 17.0, 15.0, 16.0, 9.0, 5.0, 6.0, 5.0, 4.0, 7.0, 3.0, 2.0, 1.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-24.59375, -23.880859375, -23.16796875, -22.455078125, -21.7421875, -21.029296875, -20.31640625, -19.603515625, -18.890625, -18.177734375, -17.46484375, -16.751953125, -16.0390625, -15.326171875, -14.61328125, -13.900390625, -13.1875, -12.474609375, -11.76171875, -11.048828125, -10.3359375, -9.623046875, -8.91015625, -8.197265625, -7.484375, -6.771484375, -6.05859375, -5.345703125, -4.6328125, -3.919921875, -3.20703125, -2.494140625, -1.78125, -1.068359375, -0.35546875, 0.357421875, 1.0703125, 1.783203125, 2.49609375, 3.208984375, 3.921875, 4.634765625, 5.34765625, 6.060546875, 6.7734375, 7.486328125, 8.19921875, 8.912109375, 9.625, 10.337890625, 11.05078125, 11.763671875, 12.4765625, 13.189453125, 13.90234375, 14.615234375, 15.328125, 16.041015625, 16.75390625, 17.466796875, 18.1796875, 18.892578125, 19.60546875, 20.318359375, 21.03125]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 10.0, 5.0, 14.0, 8.0, 16.0, 16.0, 25.0, 34.0, 33.0, 35.0, 52.0, 47.0, 55.0, 66.0, 65.0, 60.0, 55.0, 59.0, 45.0, 32.0, 42.0, 38.0, 33.0, 24.0, 21.0, 19.0, 25.0, 11.0, 9.0, 11.0, 11.0, 5.0, 3.0, 8.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-45.637935638427734, -44.28535079956055, -42.93276596069336, -41.580177307128906, -40.22759246826172, -38.87500762939453, -37.522422790527344, -36.169837951660156, -34.81725311279297, -33.46466827392578, -32.112083435058594, -30.759496688842773, -29.406909942626953, -28.054325103759766, -26.701740264892578, -25.34915542602539, -23.996566772460938, -22.64398193359375, -21.29139518737793, -19.938810348510742, -18.586223602294922, -17.233638763427734, -15.881053924560547, -14.528468132019043, -13.175882339477539, -11.823296546936035, -10.470710754394531, -9.118125915527344, -7.76554012298584, -6.412954330444336, -5.060369491577148, -3.7077836990356445, -2.3552017211914062, -1.0026161670684814, 0.34996938705444336, 1.702554702758789, 3.055140495300293, 4.407726287841797, 5.760311126708984, 7.112896919250488, 8.465482711791992, 9.818068504333496, 11.170654296875, 12.523239135742188, 13.875824928283691, 15.228410720825195, 16.580995559692383, 17.933582305908203, 19.28616714477539, 20.638751983642578, 21.9913387298584, 23.343923568725586, 24.696510314941406, 26.049095153808594, 27.40167999267578, 28.75426483154297, 30.10685157775879, 31.459436416625977, 32.8120231628418, 34.164608001708984, 35.51719284057617, 36.869781494140625, 38.22236633300781, 39.574951171875, 40.92753601074219]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 4.0, 4.0, 6.0, 8.0, 6.0, 10.0, 14.0, 16.0, 16.0, 20.0, 23.0, 29.0, 27.0, 32.0, 43.0, 36.0, 32.0, 38.0, 41.0, 46.0, 38.0, 47.0, 47.0, 43.0, 62.0, 32.0, 35.0, 36.0, 27.0, 25.0, 25.0, 23.0, 21.0, 17.0, 20.0, 14.0, 8.0, 9.0, 5.0, 9.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-39.595787048339844, -38.51987075805664, -37.44395446777344, -36.368038177490234, -35.29212188720703, -34.21620178222656, -33.14028549194336, -32.064369201660156, -30.988452911376953, -29.91253662109375, -28.836620330810547, -27.76070213317871, -26.684785842895508, -25.608869552612305, -24.53295135498047, -23.457035064697266, -22.381118774414062, -21.30520248413086, -20.229286193847656, -19.15336799621582, -18.077451705932617, -17.001535415649414, -15.925618171691895, -14.849700927734375, -13.773784637451172, -12.697868347167969, -11.62195110321045, -10.54603385925293, -9.470117568969727, -8.394201278686523, -7.318284034729004, -6.242367267608643, -5.166454315185547, -4.0905375480651855, -3.014620780944824, -1.938704013824463, -0.8627872467041016, 0.21312952041625977, 1.289046287536621, 2.3649630546569824, 3.4408798217773438, 4.516796588897705, 5.592713356018066, 6.668630123138428, 7.744546890258789, 8.820463180541992, 9.896380424499512, 10.972297668457031, 12.048213958740234, 13.124130249023438, 14.200047492980957, 15.275964736938477, 16.35188102722168, 17.427797317504883, 18.50371551513672, 19.579631805419922, 20.655548095703125, 21.731464385986328, 22.80738067626953, 23.883298873901367, 24.95921516418457, 26.035131454467773, 27.11104965209961, 28.186965942382812, 29.262882232666016]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.weight": {"_type": "histogram", "values": [6.0, 5.0, 9.0, 7.0, 15.0, 13.0, 33.0, 40.0, 47.0, 88.0, 115.0, 203.0, 281.0, 459.0, 731.0, 1130.0, 1688.0, 2607.0, 3929.0, 6137.0, 9498.0, 14248.0, 21715.0, 32473.0, 48252.0, 70061.0, 97450.0, 126277.0, 140873.0, 131171.0, 104490.0, 76280.0, 53360.0, 35864.0, 24035.0, 15502.0, 10347.0, 6799.0, 4300.0, 2815.0, 1815.0, 1201.0, 744.0, 511.0, 342.0, 215.0, 142.0, 81.0, 55.0, 29.0, 24.0, 23.0, 18.0, 4.0, 3.0, 7.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.53125, -36.2197265625, -34.908203125, -33.5966796875, -32.28515625, -30.9736328125, -29.662109375, -28.3505859375, -27.0390625, -25.7275390625, -24.416015625, -23.1044921875, -21.79296875, -20.4814453125, -19.169921875, -17.8583984375, -16.546875, -15.2353515625, -13.923828125, -12.6123046875, -11.30078125, -9.9892578125, -8.677734375, -7.3662109375, -6.0546875, -4.7431640625, -3.431640625, -2.1201171875, -0.80859375, 0.5029296875, 1.814453125, 3.1259765625, 4.4375, 5.7490234375, 7.060546875, 8.3720703125, 9.68359375, 10.9951171875, 12.306640625, 13.6181640625, 14.9296875, 16.2412109375, 17.552734375, 18.8642578125, 20.17578125, 21.4873046875, 22.798828125, 24.1103515625, 25.421875, 26.7333984375, 28.044921875, 29.3564453125, 30.66796875, 31.9794921875, 33.291015625, 34.6025390625, 35.9140625, 37.2255859375, 38.537109375, 39.8486328125, 41.16015625, 42.4716796875, 43.783203125, 45.0947265625, 46.40625]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 6.0, 3.0, 5.0, 10.0, 5.0, 13.0, 13.0, 22.0, 20.0, 21.0, 22.0, 23.0, 30.0, 31.0, 24.0, 37.0, 44.0, 46.0, 40.0, 44.0, 47.0, 48.0, 52.0, 37.0, 55.0, 37.0, 39.0, 32.0, 27.0, 28.0, 26.0, 22.0, 22.0, 14.0, 12.0, 10.0, 7.0, 4.0, 9.0, 4.0, 4.0, 8.0, 3.0, 3.0, 1.0, 2.0], "bins": [-37.46875, -36.496826171875, -35.52490234375, -34.552978515625, -33.5810546875, -32.609130859375, -31.63720703125, -30.665283203125, -29.693359375, -28.721435546875, -27.74951171875, -26.777587890625, -25.8056640625, -24.833740234375, -23.86181640625, -22.889892578125, -21.91796875, -20.946044921875, -19.97412109375, -19.002197265625, -18.0302734375, -17.058349609375, -16.08642578125, -15.114501953125, -14.142578125, -13.170654296875, -12.19873046875, -11.226806640625, -10.2548828125, -9.282958984375, -8.31103515625, -7.339111328125, -6.3671875, -5.395263671875, -4.42333984375, -3.451416015625, -2.4794921875, -1.507568359375, -0.53564453125, 0.436279296875, 1.408203125, 2.380126953125, 3.35205078125, 4.323974609375, 5.2958984375, 6.267822265625, 7.23974609375, 8.211669921875, 9.18359375, 10.155517578125, 11.12744140625, 12.099365234375, 13.0712890625, 14.043212890625, 15.01513671875, 15.987060546875, 16.958984375, 17.930908203125, 18.90283203125, 19.874755859375, 20.8466796875, 21.818603515625, 22.79052734375, 23.762451171875, 24.734375]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.weight": {"_type": "histogram", "values": [4.0, 3.0, 6.0, 2.0, 7.0, 14.0, 13.0, 26.0, 37.0, 57.0, 76.0, 140.0, 191.0, 283.0, 438.0, 597.0, 930.0, 1404.0, 2122.0, 3163.0, 4835.0, 7439.0, 11390.0, 17023.0, 26123.0, 38746.0, 56874.0, 80550.0, 107483.0, 129412.0, 134885.0, 119646.0, 94251.0, 68688.0, 47649.0, 31730.0, 21249.0, 13945.0, 9156.0, 6016.0, 4072.0, 2640.0, 1739.0, 1165.0, 840.0, 526.0, 327.0, 235.0, 154.0, 94.0, 53.0, 36.0, 29.0, 15.0, 14.0, 15.0, 8.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0], "bins": [-35.0, -33.84326171875, -32.6865234375, -31.52978515625, -30.373046875, -29.21630859375, -28.0595703125, -26.90283203125, -25.74609375, -24.58935546875, -23.4326171875, -22.27587890625, -21.119140625, -19.96240234375, -18.8056640625, -17.64892578125, -16.4921875, -15.33544921875, -14.1787109375, -13.02197265625, -11.865234375, -10.70849609375, -9.5517578125, -8.39501953125, -7.23828125, -6.08154296875, -4.9248046875, -3.76806640625, -2.611328125, -1.45458984375, -0.2978515625, 0.85888671875, 2.015625, 3.17236328125, 4.3291015625, 5.48583984375, 6.642578125, 7.79931640625, 8.9560546875, 10.11279296875, 11.26953125, 12.42626953125, 13.5830078125, 14.73974609375, 15.896484375, 17.05322265625, 18.2099609375, 19.36669921875, 20.5234375, 21.68017578125, 22.8369140625, 23.99365234375, 25.150390625, 26.30712890625, 27.4638671875, 28.62060546875, 29.77734375, 30.93408203125, 32.0908203125, 33.24755859375, 34.404296875, 35.56103515625, 36.7177734375, 37.87451171875, 39.03125]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 5.0, 2.0, 6.0, 8.0, 8.0, 14.0, 17.0, 16.0, 21.0, 23.0, 23.0, 22.0, 33.0, 29.0, 31.0, 49.0, 28.0, 36.0, 34.0, 35.0, 47.0, 51.0, 30.0, 44.0, 37.0, 43.0, 40.0, 35.0, 21.0, 34.0, 23.0, 30.0, 25.0, 19.0, 13.0, 12.0, 13.0, 10.0, 12.0, 6.0, 10.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-20.265625, -19.647705078125, -19.02978515625, -18.411865234375, -17.7939453125, -17.176025390625, -16.55810546875, -15.940185546875, -15.322265625, -14.704345703125, -14.08642578125, -13.468505859375, -12.8505859375, -12.232666015625, -11.61474609375, -10.996826171875, -10.37890625, -9.760986328125, -9.14306640625, -8.525146484375, -7.9072265625, -7.289306640625, -6.67138671875, -6.053466796875, -5.435546875, -4.817626953125, -4.19970703125, -3.581787109375, -2.9638671875, -2.345947265625, -1.72802734375, -1.110107421875, -0.4921875, 0.125732421875, 0.74365234375, 1.361572265625, 1.9794921875, 2.597412109375, 3.21533203125, 3.833251953125, 4.451171875, 5.069091796875, 5.68701171875, 6.304931640625, 6.9228515625, 7.540771484375, 8.15869140625, 8.776611328125, 9.39453125, 10.012451171875, 10.63037109375, 11.248291015625, 11.8662109375, 12.484130859375, 13.10205078125, 13.719970703125, 14.337890625, 14.955810546875, 15.57373046875, 16.191650390625, 16.8095703125, 17.427490234375, 18.04541015625, 18.663330078125, 19.28125]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 4.0, 8.0, 7.0, 9.0, 17.0, 33.0, 43.0, 54.0, 90.0, 135.0, 209.0, 285.0, 448.0, 707.0, 1080.0, 1896.0, 3032.0, 5143.0, 9103.0, 16372.0, 31125.0, 61358.0, 123914.0, 223624.0, 250382.0, 154832.0, 78180.0, 39308.0, 20326.0, 11189.0, 6207.0, 3626.0, 2092.0, 1374.0, 842.0, 557.0, 303.0, 228.0, 139.0, 102.0, 53.0, 39.0, 27.0, 18.0, 13.0, 12.0, 6.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-47.125, -45.66015625, -44.1953125, -42.73046875, -41.265625, -39.80078125, -38.3359375, -36.87109375, -35.40625, -33.94140625, -32.4765625, -31.01171875, -29.546875, -28.08203125, -26.6171875, -25.15234375, -23.6875, -22.22265625, -20.7578125, -19.29296875, -17.828125, -16.36328125, -14.8984375, -13.43359375, -11.96875, -10.50390625, -9.0390625, -7.57421875, -6.109375, -4.64453125, -3.1796875, -1.71484375, -0.25, 1.21484375, 2.6796875, 4.14453125, 5.609375, 7.07421875, 8.5390625, 10.00390625, 11.46875, 12.93359375, 14.3984375, 15.86328125, 17.328125, 18.79296875, 20.2578125, 21.72265625, 23.1875, 24.65234375, 26.1171875, 27.58203125, 29.046875, 30.51171875, 31.9765625, 33.44140625, 34.90625, 36.37109375, 37.8359375, 39.30078125, 40.765625, 42.23046875, 43.6953125, 45.16015625, 46.625]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 3.0, 5.0, 1.0, 4.0, 6.0, 0.0, 6.0, 7.0, 12.0, 8.0, 11.0, 15.0, 11.0, 26.0, 33.0, 34.0, 37.0, 47.0, 61.0, 61.0, 51.0, 57.0, 64.0, 58.0, 59.0, 48.0, 46.0, 29.0, 33.0, 36.0, 29.0, 23.0, 18.0, 15.0, 11.0, 10.0, 11.0, 3.0, 7.0, 7.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0034732818603515625, -0.0033621788024902344, -0.0032510757446289062, -0.003139972686767578, -0.00302886962890625, -0.002917766571044922, -0.0028066635131835938, -0.0026955604553222656, -0.0025844573974609375, -0.0024733543395996094, -0.0023622512817382812, -0.002251148223876953, -0.002140045166015625, -0.002028942108154297, -0.0019178390502929688, -0.0018067359924316406, -0.0016956329345703125, -0.0015845298767089844, -0.0014734268188476562, -0.0013623237609863281, -0.001251220703125, -0.0011401176452636719, -0.0010290145874023438, -0.0009179115295410156, -0.0008068084716796875, -0.0006957054138183594, -0.0005846023559570312, -0.0004734992980957031, -0.000362396240234375, -0.0002512931823730469, -0.00014019012451171875, -2.9087066650390625e-05, 8.20159912109375e-05, 0.00019311904907226562, 0.00030422210693359375, 0.0004153251647949219, 0.00052642822265625, 0.0006375312805175781, 0.0007486343383789062, 0.0008597373962402344, 0.0009708404541015625, 0.0010819435119628906, 0.0011930465698242188, 0.0013041496276855469, 0.001415252685546875, 0.0015263557434082031, 0.0016374588012695312, 0.0017485618591308594, 0.0018596649169921875, 0.0019707679748535156, 0.0020818710327148438, 0.002192974090576172, 0.0023040771484375, 0.002415180206298828, 0.0025262832641601562, 0.0026373863220214844, 0.0027484893798828125, 0.0028595924377441406, 0.0029706954956054688, 0.003081798553466797, 0.003192901611328125, 0.003304004669189453, 0.0034151077270507812, 0.0035262107849121094, 0.0036373138427734375]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 2.0, 7.0, 11.0, 8.0, 17.0, 31.0, 35.0, 39.0, 78.0, 120.0, 160.0, 236.0, 332.0, 512.0, 781.0, 1132.0, 1726.0, 2714.0, 4193.0, 6529.0, 10633.0, 17356.0, 29805.0, 51521.0, 91241.0, 157171.0, 219909.0, 185428.0, 111903.0, 63240.0, 35918.0, 21156.0, 12641.0, 7891.0, 4928.0, 3121.0, 2042.0, 1289.0, 861.0, 593.0, 410.0, 271.0, 174.0, 121.0, 105.0, 58.0, 47.0, 28.0, 14.0, 9.0, 3.0, 6.0, 4.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-38.125, -36.88232421875, -35.6396484375, -34.39697265625, -33.154296875, -31.91162109375, -30.6689453125, -29.42626953125, -28.18359375, -26.94091796875, -25.6982421875, -24.45556640625, -23.212890625, -21.97021484375, -20.7275390625, -19.48486328125, -18.2421875, -16.99951171875, -15.7568359375, -14.51416015625, -13.271484375, -12.02880859375, -10.7861328125, -9.54345703125, -8.30078125, -7.05810546875, -5.8154296875, -4.57275390625, -3.330078125, -2.08740234375, -0.8447265625, 0.39794921875, 1.640625, 2.88330078125, 4.1259765625, 5.36865234375, 6.611328125, 7.85400390625, 9.0966796875, 10.33935546875, 11.58203125, 12.82470703125, 14.0673828125, 15.31005859375, 16.552734375, 17.79541015625, 19.0380859375, 20.28076171875, 21.5234375, 22.76611328125, 24.0087890625, 25.25146484375, 26.494140625, 27.73681640625, 28.9794921875, 30.22216796875, 31.46484375, 32.70751953125, 33.9501953125, 35.19287109375, 36.435546875, 37.67822265625, 38.9208984375, 40.16357421875, 41.40625]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 3.0, 5.0, 5.0, 7.0, 5.0, 7.0, 11.0, 14.0, 22.0, 14.0, 20.0, 25.0, 35.0, 36.0, 35.0, 45.0, 58.0, 73.0, 71.0, 62.0, 58.0, 56.0, 56.0, 49.0, 38.0, 28.0, 31.0, 19.0, 22.0, 15.0, 12.0, 9.0, 19.0, 6.0, 9.0, 5.0, 4.0, 3.0, 6.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-13.2265625, -12.818603515625, -12.41064453125, -12.002685546875, -11.5947265625, -11.186767578125, -10.77880859375, -10.370849609375, -9.962890625, -9.554931640625, -9.14697265625, -8.739013671875, -8.3310546875, -7.923095703125, -7.51513671875, -7.107177734375, -6.69921875, -6.291259765625, -5.88330078125, -5.475341796875, -5.0673828125, -4.659423828125, -4.25146484375, -3.843505859375, -3.435546875, -3.027587890625, -2.61962890625, -2.211669921875, -1.8037109375, -1.395751953125, -0.98779296875, -0.579833984375, -0.171875, 0.236083984375, 0.64404296875, 1.052001953125, 1.4599609375, 1.867919921875, 2.27587890625, 2.683837890625, 3.091796875, 3.499755859375, 3.90771484375, 4.315673828125, 4.7236328125, 5.131591796875, 5.53955078125, 5.947509765625, 6.35546875, 6.763427734375, 7.17138671875, 7.579345703125, 7.9873046875, 8.395263671875, 8.80322265625, 9.211181640625, 9.619140625, 10.027099609375, 10.43505859375, 10.843017578125, 11.2509765625, 11.658935546875, 12.06689453125, 12.474853515625, 12.8828125]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 7.0, 10.0, 12.0, 13.0, 8.0, 14.0, 20.0, 20.0, 27.0, 42.0, 40.0, 49.0, 65.0, 51.0, 58.0, 55.0, 52.0, 49.0, 62.0, 47.0, 49.0, 36.0, 35.0, 39.0, 24.0, 23.0, 17.0, 14.0, 18.0, 10.0, 8.0, 5.0, 5.0, 3.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-40.51506423950195, -39.29050827026367, -38.065956115722656, -36.841400146484375, -35.616844177246094, -34.39228820800781, -33.16773223876953, -31.943180084228516, -30.718624114990234, -29.494068145751953, -28.269514083862305, -27.044960021972656, -25.820404052734375, -24.595848083496094, -23.371294021606445, -22.146739959716797, -20.922183990478516, -19.697628021240234, -18.473073959350586, -17.248519897460938, -16.023963928222656, -14.799408912658691, -13.574853897094727, -12.350298881530762, -11.125743865966797, -9.901188850402832, -8.676633834838867, -7.452078819274902, -6.2275238037109375, -5.002968788146973, -3.778413772583008, -2.553858757019043, -1.3293075561523438, -0.1047525405883789, 1.119802474975586, 2.344357490539551, 3.5689125061035156, 4.7934675216674805, 6.018022537231445, 7.24257755279541, 8.467132568359375, 9.69168758392334, 10.916242599487305, 12.14079761505127, 13.365352630615234, 14.5899076461792, 15.814462661743164, 17.039016723632812, 18.263572692871094, 19.488128662109375, 20.712682723999023, 21.937236785888672, 23.161792755126953, 24.386348724365234, 25.610902786254883, 26.83545684814453, 28.060012817382812, 29.284568786621094, 30.509122848510742, 31.73367691040039, 32.95823287963867, 34.18278884887695, 35.40734100341797, 36.63189697265625, 37.85645294189453]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 3.0, 6.0, 6.0, 6.0, 9.0, 13.0, 15.0, 16.0, 22.0, 21.0, 24.0, 28.0, 26.0, 25.0, 38.0, 34.0, 36.0, 37.0, 29.0, 38.0, 44.0, 38.0, 55.0, 41.0, 33.0, 45.0, 36.0, 29.0, 33.0, 35.0, 27.0, 20.0, 23.0, 15.0, 20.0, 17.0, 14.0, 11.0, 5.0, 10.0, 8.0, 6.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-36.519691467285156, -35.51594924926758, -34.51220703125, -33.50846481323242, -32.504722595214844, -31.500980377197266, -30.497238159179688, -29.49349594116211, -28.48975372314453, -27.486011505126953, -26.482269287109375, -25.478527069091797, -24.47478485107422, -23.47104263305664, -22.467300415039062, -21.463558197021484, -20.459814071655273, -19.456071853637695, -18.452329635620117, -17.44858741760254, -16.44484519958496, -15.441102981567383, -14.437359809875488, -13.43361759185791, -12.429875373840332, -11.426133155822754, -10.422390937805176, -9.418647766113281, -8.414905548095703, -7.411163806915283, -6.407421112060547, -5.403678894042969, -4.399938583374023, -3.3961963653564453, -2.392453908920288, -1.3887114524841309, -0.38496923446655273, 0.6187729835510254, 1.6225156784057617, 2.62625789642334, 3.630000114440918, 4.633742332458496, 5.637484550476074, 6.6412272453308105, 7.644969463348389, 8.648712158203125, 9.652454376220703, 10.656196594238281, 11.65993881225586, 12.663681030273438, 13.667423248291016, 14.671165466308594, 15.674907684326172, 16.67864990234375, 17.682392120361328, 18.686134338378906, 19.689876556396484, 20.693618774414062, 21.69736099243164, 22.70110321044922, 23.704845428466797, 24.708587646484375, 25.712329864501953, 26.71607208251953, 27.719816207885742]}, "gradients/decoder.bert.encoder.layer.20.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 7.0, 10.0, 14.0, 21.0, 33.0, 59.0, 99.0, 137.0, 191.0, 320.0, 511.0, 854.0, 1313.0, 2147.0, 3508.0, 5504.0, 8579.0, 14706.0, 24391.0, 42282.0, 75697.0, 140901.0, 280759.0, 587076.0, 982941.0, 939322.0, 535048.0, 254687.0, 128304.0, 69311.0, 38612.0, 22349.0, 13485.0, 8205.0, 4786.0, 2991.0, 1909.0, 1282.0, 755.0, 445.0, 289.0, 171.0, 112.0, 69.0, 35.0, 26.0, 14.0, 14.0, 3.0, 4.0, 1.0, 0.0, 2.0], "bins": [-38.59375, -37.51953125, -36.4453125, -35.37109375, -34.296875, -33.22265625, -32.1484375, -31.07421875, -30.0, -28.92578125, -27.8515625, -26.77734375, -25.703125, -24.62890625, -23.5546875, -22.48046875, -21.40625, -20.33203125, -19.2578125, -18.18359375, -17.109375, -16.03515625, -14.9609375, -13.88671875, -12.8125, -11.73828125, -10.6640625, -9.58984375, -8.515625, -7.44140625, -6.3671875, -5.29296875, -4.21875, -3.14453125, -2.0703125, -0.99609375, 0.078125, 1.15234375, 2.2265625, 3.30078125, 4.375, 5.44921875, 6.5234375, 7.59765625, 8.671875, 9.74609375, 10.8203125, 11.89453125, 12.96875, 14.04296875, 15.1171875, 16.19140625, 17.265625, 18.33984375, 19.4140625, 20.48828125, 21.5625, 22.63671875, 23.7109375, 24.78515625, 25.859375, 26.93359375, 28.0078125, 29.08203125, 30.15625]}, "gradients/decoder.bert.encoder.layer.20.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 1.0, 9.0, 6.0, 11.0, 12.0, 11.0, 19.0, 11.0, 26.0, 14.0, 27.0, 23.0, 31.0, 28.0, 32.0, 32.0, 35.0, 32.0, 48.0, 32.0, 35.0, 36.0, 41.0, 35.0, 39.0, 46.0, 31.0, 38.0, 34.0, 28.0, 38.0, 27.0, 18.0, 22.0, 18.0, 18.0, 8.0, 12.0, 13.0, 7.0, 2.0, 7.0, 3.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-24.234375, -23.551025390625, -22.86767578125, -22.184326171875, -21.5009765625, -20.817626953125, -20.13427734375, -19.450927734375, -18.767578125, -18.084228515625, -17.40087890625, -16.717529296875, -16.0341796875, -15.350830078125, -14.66748046875, -13.984130859375, -13.30078125, -12.617431640625, -11.93408203125, -11.250732421875, -10.5673828125, -9.884033203125, -9.20068359375, -8.517333984375, -7.833984375, -7.150634765625, -6.46728515625, -5.783935546875, -5.1005859375, -4.417236328125, -3.73388671875, -3.050537109375, -2.3671875, -1.683837890625, -1.00048828125, -0.317138671875, 0.3662109375, 1.049560546875, 1.73291015625, 2.416259765625, 3.099609375, 3.782958984375, 4.46630859375, 5.149658203125, 5.8330078125, 6.516357421875, 7.19970703125, 7.883056640625, 8.56640625, 9.249755859375, 9.93310546875, 10.616455078125, 11.2998046875, 11.983154296875, 12.66650390625, 13.349853515625, 14.033203125, 14.716552734375, 15.39990234375, 16.083251953125, 16.7666015625, 17.449951171875, 18.13330078125, 18.816650390625, 19.5]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 3.0, 9.0, 7.0, 11.0, 30.0, 38.0, 70.0, 89.0, 124.0, 201.0, 325.0, 484.0, 804.0, 1177.0, 2106.0, 3283.0, 5291.0, 8904.0, 14671.0, 25677.0, 44909.0, 79651.0, 145315.0, 270014.0, 501757.0, 852290.0, 926745.0, 595443.0, 322807.0, 172219.0, 93901.0, 52435.0, 29862.0, 17075.0, 10211.0, 6169.0, 3887.0, 2285.0, 1445.0, 932.0, 579.0, 376.0, 258.0, 140.0, 94.0, 66.0, 46.0, 29.0, 17.0, 11.0, 9.0, 6.0, 4.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-33.9375, -32.8115234375, -31.685546875, -30.5595703125, -29.43359375, -28.3076171875, -27.181640625, -26.0556640625, -24.9296875, -23.8037109375, -22.677734375, -21.5517578125, -20.42578125, -19.2998046875, -18.173828125, -17.0478515625, -15.921875, -14.7958984375, -13.669921875, -12.5439453125, -11.41796875, -10.2919921875, -9.166015625, -8.0400390625, -6.9140625, -5.7880859375, -4.662109375, -3.5361328125, -2.41015625, -1.2841796875, -0.158203125, 0.9677734375, 2.09375, 3.2197265625, 4.345703125, 5.4716796875, 6.59765625, 7.7236328125, 8.849609375, 9.9755859375, 11.1015625, 12.2275390625, 13.353515625, 14.4794921875, 15.60546875, 16.7314453125, 17.857421875, 18.9833984375, 20.109375, 21.2353515625, 22.361328125, 23.4873046875, 24.61328125, 25.7392578125, 26.865234375, 27.9912109375, 29.1171875, 30.2431640625, 31.369140625, 32.4951171875, 33.62109375, 34.7470703125, 35.873046875, 36.9990234375, 38.125]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 8.0, 6.0, 18.0, 10.0, 15.0, 20.0, 38.0, 28.0, 49.0, 53.0, 56.0, 84.0, 97.0, 125.0, 144.0, 182.0, 206.0, 226.0, 264.0, 273.0, 303.0, 264.0, 252.0, 216.0, 165.0, 181.0, 140.0, 122.0, 111.0, 86.0, 71.0, 48.0, 48.0, 39.0, 31.0, 15.0, 11.0, 20.0, 11.0, 11.0, 11.0, 4.0, 6.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.234375, -11.8409423828125, -11.447509765625, -11.0540771484375, -10.66064453125, -10.2672119140625, -9.873779296875, -9.4803466796875, -9.0869140625, -8.6934814453125, -8.300048828125, -7.9066162109375, -7.51318359375, -7.1197509765625, -6.726318359375, -6.3328857421875, -5.939453125, -5.5460205078125, -5.152587890625, -4.7591552734375, -4.36572265625, -3.9722900390625, -3.578857421875, -3.1854248046875, -2.7919921875, -2.3985595703125, -2.005126953125, -1.6116943359375, -1.21826171875, -0.8248291015625, -0.431396484375, -0.0379638671875, 0.35546875, 0.7489013671875, 1.142333984375, 1.5357666015625, 1.92919921875, 2.3226318359375, 2.716064453125, 3.1094970703125, 3.5029296875, 3.8963623046875, 4.289794921875, 4.6832275390625, 5.07666015625, 5.4700927734375, 5.863525390625, 6.2569580078125, 6.650390625, 7.0438232421875, 7.437255859375, 7.8306884765625, 8.22412109375, 8.6175537109375, 9.010986328125, 9.4044189453125, 9.7978515625, 10.1912841796875, 10.584716796875, 10.9781494140625, 11.37158203125, 11.7650146484375, 12.158447265625, 12.5518798828125, 12.9453125]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 4.0, 2.0, 5.0, 4.0, 9.0, 7.0, 13.0, 19.0, 14.0, 16.0, 25.0, 20.0, 33.0, 43.0, 45.0, 57.0, 78.0, 54.0, 61.0, 81.0, 53.0, 65.0, 43.0, 44.0, 29.0, 41.0, 31.0, 27.0, 16.0, 12.0, 19.0, 9.0, 9.0, 4.0, 8.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.2911491394043, -36.08531951904297, -34.87948989868164, -33.67366027832031, -32.46782684326172, -31.26199722290039, -30.056167602539062, -28.850337982177734, -27.644508361816406, -26.438678741455078, -25.232847213745117, -24.02701759338379, -22.82118797302246, -21.6153564453125, -20.409526824951172, -19.203697204589844, -17.997865676879883, -16.792036056518555, -15.58620548248291, -14.380374908447266, -13.174545288085938, -11.968714714050293, -10.762884140014648, -9.55705451965332, -8.351223945617676, -7.1453938484191895, -5.939563751220703, -4.733733177185059, -3.5279030799865723, -2.322072982788086, -1.1162424087524414, 0.08958721160888672, 1.2954177856445312, 2.5012478828430176, 3.707078218460083, 4.912908554077148, 6.118738651275635, 7.324568748474121, 8.530399322509766, 9.736228942871094, 10.942059516906738, 12.147890090942383, 13.353719711303711, 14.559550285339355, 15.765380859375, 16.971210479736328, 18.177040100097656, 19.382869720458984, 20.588701248168945, 21.794530868530273, 23.000362396240234, 24.206192016601562, 25.41202163696289, 26.61785125732422, 27.82368278503418, 29.029512405395508, 30.23534393310547, 31.441173553466797, 32.647003173828125, 33.85283660888672, 35.05866622924805, 36.264495849609375, 37.4703254699707, 38.67615509033203, 39.88198471069336]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 3.0, 4.0, 7.0, 6.0, 9.0, 14.0, 12.0, 24.0, 15.0, 18.0, 25.0, 22.0, 22.0, 26.0, 34.0, 36.0, 39.0, 37.0, 43.0, 54.0, 49.0, 49.0, 48.0, 31.0, 49.0, 32.0, 46.0, 35.0, 34.0, 29.0, 18.0, 12.0, 21.0, 16.0, 13.0, 16.0, 14.0, 7.0, 9.0, 3.0, 5.0, 7.0, 6.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-33.34120559692383, -32.357147216796875, -31.373088836669922, -30.38903045654297, -29.404972076416016, -28.420913696289062, -27.436853408813477, -26.452795028686523, -25.46873664855957, -24.484678268432617, -23.500619888305664, -22.51656150817871, -21.532501220703125, -20.548442840576172, -19.56438446044922, -18.580326080322266, -17.596267700195312, -16.61220932006836, -15.628150939941406, -14.644091606140137, -13.660033226013184, -12.67597484588623, -11.691915512084961, -10.707857131958008, -9.723798751831055, -8.739740371704102, -7.75568151473999, -6.771622657775879, -5.787564277648926, -4.803505897521973, -3.8194470405578613, -2.83538818359375, -1.8513317108154297, -0.8672730922698975, 0.11678552627563477, 1.100844144821167, 2.084902763366699, 3.0689611434936523, 4.053020000457764, 5.037078857421875, 6.021137237548828, 7.005195617675781, 7.989254474639893, 8.973313331604004, 9.957371711730957, 10.94143009185791, 11.92548942565918, 12.909547805786133, 13.893606185913086, 14.877664566040039, 15.861722946166992, 16.845781326293945, 17.82984161376953, 18.813899993896484, 19.797958374023438, 20.78201675415039, 21.766075134277344, 22.750133514404297, 23.73419189453125, 24.718250274658203, 25.702308654785156, 26.68636703491211, 27.670427322387695, 28.65448570251465, 29.6385440826416]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 5.0, 3.0, 3.0, 9.0, 7.0, 10.0, 25.0, 33.0, 46.0, 53.0, 69.0, 100.0, 146.0, 222.0, 295.0, 408.0, 681.0, 984.0, 1401.0, 2304.0, 3941.0, 6564.0, 12318.0, 25783.0, 62724.0, 173512.0, 379890.0, 228695.0, 81377.0, 32166.0, 14897.0, 7704.0, 4450.0, 2662.0, 1728.0, 1093.0, 676.0, 468.0, 325.0, 230.0, 166.0, 106.0, 77.0, 59.0, 61.0, 31.0, 19.0, 17.0, 4.0, 4.0, 3.0, 5.0, 2.0, 0.0, 5.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-100.875, -97.58203125, -94.2890625, -90.99609375, -87.703125, -84.41015625, -81.1171875, -77.82421875, -74.53125, -71.23828125, -67.9453125, -64.65234375, -61.359375, -58.06640625, -54.7734375, -51.48046875, -48.1875, -44.89453125, -41.6015625, -38.30859375, -35.015625, -31.72265625, -28.4296875, -25.13671875, -21.84375, -18.55078125, -15.2578125, -11.96484375, -8.671875, -5.37890625, -2.0859375, 1.20703125, 4.5, 7.79296875, 11.0859375, 14.37890625, 17.671875, 20.96484375, 24.2578125, 27.55078125, 30.84375, 34.13671875, 37.4296875, 40.72265625, 44.015625, 47.30859375, 50.6015625, 53.89453125, 57.1875, 60.48046875, 63.7734375, 67.06640625, 70.359375, 73.65234375, 76.9453125, 80.23828125, 83.53125, 86.82421875, 90.1171875, 93.41015625, 96.703125, 99.99609375, 103.2890625, 106.58203125, 109.875]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 3.0, 9.0, 7.0, 6.0, 15.0, 8.0, 18.0, 19.0, 20.0, 31.0, 25.0, 29.0, 28.0, 25.0, 46.0, 60.0, 51.0, 51.0, 43.0, 53.0, 45.0, 43.0, 46.0, 36.0, 46.0, 41.0, 42.0, 29.0, 12.0, 21.0, 17.0, 14.0, 7.0, 12.0, 12.0, 9.0, 4.0, 7.0, 6.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-34.71875, -33.695556640625, -32.67236328125, -31.649169921875, -30.6259765625, -29.602783203125, -28.57958984375, -27.556396484375, -26.533203125, -25.510009765625, -24.48681640625, -23.463623046875, -22.4404296875, -21.417236328125, -20.39404296875, -19.370849609375, -18.34765625, -17.324462890625, -16.30126953125, -15.278076171875, -14.2548828125, -13.231689453125, -12.20849609375, -11.185302734375, -10.162109375, -9.138916015625, -8.11572265625, -7.092529296875, -6.0693359375, -5.046142578125, -4.02294921875, -2.999755859375, -1.9765625, -0.953369140625, 0.06982421875, 1.093017578125, 2.1162109375, 3.139404296875, 4.16259765625, 5.185791015625, 6.208984375, 7.232177734375, 8.25537109375, 9.278564453125, 10.3017578125, 11.324951171875, 12.34814453125, 13.371337890625, 14.39453125, 15.417724609375, 16.44091796875, 17.464111328125, 18.4873046875, 19.510498046875, 20.53369140625, 21.556884765625, 22.580078125, 23.603271484375, 24.62646484375, 25.649658203125, 26.6728515625, 27.696044921875, 28.71923828125, 29.742431640625, 30.765625]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 4.0, 4.0, 6.0, 11.0, 11.0, 30.0, 27.0, 32.0, 77.0, 93.0, 153.0, 210.0, 311.0, 495.0, 726.0, 1094.0, 1823.0, 2958.0, 5358.0, 10496.0, 21978.0, 54372.0, 165032.0, 437918.0, 221991.0, 68901.0, 26761.0, 12339.0, 6274.0, 3382.0, 2046.0, 1253.0, 789.0, 563.0, 351.0, 228.0, 162.0, 90.0, 65.0, 45.0, 33.0, 24.0, 17.0, 6.0, 10.0, 5.0, 3.0, 4.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-95.5, -92.4794921875, -89.458984375, -86.4384765625, -83.41796875, -80.3974609375, -77.376953125, -74.3564453125, -71.3359375, -68.3154296875, -65.294921875, -62.2744140625, -59.25390625, -56.2333984375, -53.212890625, -50.1923828125, -47.171875, -44.1513671875, -41.130859375, -38.1103515625, -35.08984375, -32.0693359375, -29.048828125, -26.0283203125, -23.0078125, -19.9873046875, -16.966796875, -13.9462890625, -10.92578125, -7.9052734375, -4.884765625, -1.8642578125, 1.15625, 4.1767578125, 7.197265625, 10.2177734375, 13.23828125, 16.2587890625, 19.279296875, 22.2998046875, 25.3203125, 28.3408203125, 31.361328125, 34.3818359375, 37.40234375, 40.4228515625, 43.443359375, 46.4638671875, 49.484375, 52.5048828125, 55.525390625, 58.5458984375, 61.56640625, 64.5869140625, 67.607421875, 70.6279296875, 73.6484375, 76.6689453125, 79.689453125, 82.7099609375, 85.73046875, 88.7509765625, 91.771484375, 94.7919921875, 97.8125]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 7.0, 8.0, 9.0, 6.0, 16.0, 13.0, 13.0, 23.0, 23.0, 29.0, 30.0, 31.0, 39.0, 40.0, 44.0, 40.0, 54.0, 46.0, 52.0, 57.0, 42.0, 45.0, 33.0, 41.0, 35.0, 31.0, 31.0, 31.0, 24.0, 28.0, 11.0, 13.0, 7.0, 9.0, 9.0, 5.0, 10.0, 4.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.375, -18.74267578125, -18.1103515625, -17.47802734375, -16.845703125, -16.21337890625, -15.5810546875, -14.94873046875, -14.31640625, -13.68408203125, -13.0517578125, -12.41943359375, -11.787109375, -11.15478515625, -10.5224609375, -9.89013671875, -9.2578125, -8.62548828125, -7.9931640625, -7.36083984375, -6.728515625, -6.09619140625, -5.4638671875, -4.83154296875, -4.19921875, -3.56689453125, -2.9345703125, -2.30224609375, -1.669921875, -1.03759765625, -0.4052734375, 0.22705078125, 0.859375, 1.49169921875, 2.1240234375, 2.75634765625, 3.388671875, 4.02099609375, 4.6533203125, 5.28564453125, 5.91796875, 6.55029296875, 7.1826171875, 7.81494140625, 8.447265625, 9.07958984375, 9.7119140625, 10.34423828125, 10.9765625, 11.60888671875, 12.2412109375, 12.87353515625, 13.505859375, 14.13818359375, 14.7705078125, 15.40283203125, 16.03515625, 16.66748046875, 17.2998046875, 17.93212890625, 18.564453125, 19.19677734375, 19.8291015625, 20.46142578125, 21.09375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 4.0, 7.0, 6.0, 6.0, 9.0, 8.0, 11.0, 19.0, 28.0, 33.0, 49.0, 74.0, 107.0, 161.0, 213.0, 312.0, 402.0, 655.0, 901.0, 1253.0, 1954.0, 3145.0, 4936.0, 8708.0, 18372.0, 45134.0, 158957.0, 499271.0, 202486.0, 55154.0, 20727.0, 10085.0, 5526.0, 3310.0, 2162.0, 1323.0, 912.0, 635.0, 434.0, 306.0, 227.0, 162.0, 120.0, 77.0, 52.0, 39.0, 39.0, 15.0, 13.0, 7.0, 9.0, 6.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-44.90625, -43.43798828125, -41.9697265625, -40.50146484375, -39.033203125, -37.56494140625, -36.0966796875, -34.62841796875, -33.16015625, -31.69189453125, -30.2236328125, -28.75537109375, -27.287109375, -25.81884765625, -24.3505859375, -22.88232421875, -21.4140625, -19.94580078125, -18.4775390625, -17.00927734375, -15.541015625, -14.07275390625, -12.6044921875, -11.13623046875, -9.66796875, -8.19970703125, -6.7314453125, -5.26318359375, -3.794921875, -2.32666015625, -0.8583984375, 0.60986328125, 2.078125, 3.54638671875, 5.0146484375, 6.48291015625, 7.951171875, 9.41943359375, 10.8876953125, 12.35595703125, 13.82421875, 15.29248046875, 16.7607421875, 18.22900390625, 19.697265625, 21.16552734375, 22.6337890625, 24.10205078125, 25.5703125, 27.03857421875, 28.5068359375, 29.97509765625, 31.443359375, 32.91162109375, 34.3798828125, 35.84814453125, 37.31640625, 38.78466796875, 40.2529296875, 41.72119140625, 43.189453125, 44.65771484375, 46.1259765625, 47.59423828125, 49.0625]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 2.0, 9.0, 6.0, 2.0, 9.0, 8.0, 15.0, 20.0, 26.0, 51.0, 73.0, 110.0, 155.0, 132.0, 120.0, 82.0, 48.0, 31.0, 21.0, 16.0, 7.0, 7.0, 4.0, 8.0, 3.0, 3.0, 4.0, 3.0, 3.0, 1.0, 0.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.004055023193359375, -0.003932058811187744, -0.0038090944290161133, -0.0036861300468444824, -0.0035631656646728516, -0.0034402012825012207, -0.00331723690032959, -0.003194272518157959, -0.003071308135986328, -0.0029483437538146973, -0.0028253793716430664, -0.0027024149894714355, -0.0025794506072998047, -0.002456486225128174, -0.002333521842956543, -0.002210557460784912, -0.0020875930786132812, -0.0019646286964416504, -0.0018416643142700195, -0.0017186999320983887, -0.0015957355499267578, -0.001472771167755127, -0.001349806785583496, -0.0012268424034118652, -0.0011038780212402344, -0.0009809136390686035, -0.0008579492568969727, -0.0007349848747253418, -0.0006120204925537109, -0.0004890561103820801, -0.0003660917282104492, -0.00024312734603881836, -0.0001201629638671875, 2.8014183044433594e-06, 0.00012576580047607422, 0.0002487301826477051, 0.00037169456481933594, 0.0004946589469909668, 0.0006176233291625977, 0.0007405877113342285, 0.0008635520935058594, 0.0009865164756774902, 0.001109480857849121, 0.001232445240020752, 0.0013554096221923828, 0.0014783740043640137, 0.0016013383865356445, 0.0017243027687072754, 0.0018472671508789062, 0.001970231533050537, 0.002093195915222168, 0.002216160297393799, 0.0023391246795654297, 0.0024620890617370605, 0.0025850534439086914, 0.0027080178260803223, 0.002830982208251953, 0.002953946590423584, 0.003076910972595215, 0.0031998753547668457, 0.0033228397369384766, 0.0034458041191101074, 0.0035687685012817383, 0.003691732883453369, 0.003814697265625]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 4.0, 7.0, 6.0, 9.0, 6.0, 20.0, 26.0, 53.0, 76.0, 126.0, 210.0, 350.0, 603.0, 1074.0, 1806.0, 3358.0, 6389.0, 13971.0, 36775.0, 115577.0, 333728.0, 344638.0, 122126.0, 38570.0, 14410.0, 6621.0, 3498.0, 1881.0, 1135.0, 614.0, 343.0, 225.0, 112.0, 71.0, 50.0, 30.0, 20.0, 15.0, 8.0, 5.0, 6.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.5625, -42.2021484375, -40.841796875, -39.4814453125, -38.12109375, -36.7607421875, -35.400390625, -34.0400390625, -32.6796875, -31.3193359375, -29.958984375, -28.5986328125, -27.23828125, -25.8779296875, -24.517578125, -23.1572265625, -21.796875, -20.4365234375, -19.076171875, -17.7158203125, -16.35546875, -14.9951171875, -13.634765625, -12.2744140625, -10.9140625, -9.5537109375, -8.193359375, -6.8330078125, -5.47265625, -4.1123046875, -2.751953125, -1.3916015625, -0.03125, 1.3291015625, 2.689453125, 4.0498046875, 5.41015625, 6.7705078125, 8.130859375, 9.4912109375, 10.8515625, 12.2119140625, 13.572265625, 14.9326171875, 16.29296875, 17.6533203125, 19.013671875, 20.3740234375, 21.734375, 23.0947265625, 24.455078125, 25.8154296875, 27.17578125, 28.5361328125, 29.896484375, 31.2568359375, 32.6171875, 33.9775390625, 35.337890625, 36.6982421875, 38.05859375, 39.4189453125, 40.779296875, 42.1396484375, 43.5]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 4.0, 10.0, 2.0, 11.0, 12.0, 14.0, 11.0, 20.0, 27.0, 28.0, 48.0, 52.0, 81.0, 103.0, 86.0, 92.0, 77.0, 74.0, 62.0, 46.0, 47.0, 22.0, 17.0, 17.0, 11.0, 7.0, 5.0, 7.0, 4.0, 5.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.8828125, -8.5389404296875, -8.195068359375, -7.8511962890625, -7.50732421875, -7.1634521484375, -6.819580078125, -6.4757080078125, -6.1318359375, -5.7879638671875, -5.444091796875, -5.1002197265625, -4.75634765625, -4.4124755859375, -4.068603515625, -3.7247314453125, -3.380859375, -3.0369873046875, -2.693115234375, -2.3492431640625, -2.00537109375, -1.6614990234375, -1.317626953125, -0.9737548828125, -0.6298828125, -0.2860107421875, 0.057861328125, 0.4017333984375, 0.74560546875, 1.0894775390625, 1.433349609375, 1.7772216796875, 2.12109375, 2.4649658203125, 2.808837890625, 3.1527099609375, 3.49658203125, 3.8404541015625, 4.184326171875, 4.5281982421875, 4.8720703125, 5.2159423828125, 5.559814453125, 5.9036865234375, 6.24755859375, 6.5914306640625, 6.935302734375, 7.2791748046875, 7.623046875, 7.9669189453125, 8.310791015625, 8.6546630859375, 8.99853515625, 9.3424072265625, 9.686279296875, 10.0301513671875, 10.3740234375, 10.7178955078125, 11.061767578125, 11.4056396484375, 11.74951171875, 12.0933837890625, 12.437255859375, 12.7811279296875, 13.125]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 5.0, 5.0, 8.0, 3.0, 9.0, 10.0, 8.0, 10.0, 21.0, 25.0, 38.0, 36.0, 39.0, 45.0, 45.0, 54.0, 62.0, 60.0, 72.0, 57.0, 63.0, 66.0, 49.0, 42.0, 36.0, 20.0, 24.0, 22.0, 22.0, 16.0, 7.0, 5.0, 7.0, 4.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.1842155456543, -35.0134162902832, -33.84261703491211, -32.67182159423828, -31.501022338867188, -30.330223083496094, -29.159423828125, -27.988624572753906, -26.817827224731445, -25.64702796936035, -24.47623062133789, -23.305431365966797, -22.134632110595703, -20.963834762573242, -19.79303550720215, -18.622238159179688, -17.451438903808594, -16.2806396484375, -15.109842300415039, -13.939043045043945, -12.768244743347168, -11.59744644165039, -10.426647186279297, -9.25584888458252, -8.085050582885742, -6.914252281188965, -5.743453502655029, -4.572654724121094, -3.4018564224243164, -2.231058120727539, -1.0602593421936035, 0.11053943634033203, 1.2813339233398438, 2.4521324634552, 3.6229310035705566, 4.793729782104492, 5.9645280838012695, 7.135326385498047, 8.30612564086914, 9.476923942565918, 10.647722244262695, 11.818520545959473, 12.98931884765625, 14.160118103027344, 15.330916404724121, 16.5017147064209, 17.672513961791992, 18.843311309814453, 20.014110565185547, 21.18490982055664, 22.3557071685791, 23.526506423950195, 24.697303771972656, 25.86810302734375, 27.038902282714844, 28.209701538085938, 29.3804988861084, 30.551298141479492, 31.722095489501953, 32.89289474487305, 34.06369400024414, 35.23448944091797, 36.40528869628906, 37.576087951660156, 38.74688720703125]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 5.0, 2.0, 4.0, 2.0, 3.0, 12.0, 10.0, 11.0, 12.0, 11.0, 18.0, 24.0, 18.0, 12.0, 19.0, 32.0, 28.0, 33.0, 41.0, 29.0, 38.0, 36.0, 45.0, 41.0, 47.0, 60.0, 35.0, 34.0, 33.0, 34.0, 43.0, 28.0, 30.0, 27.0, 23.0, 13.0, 13.0, 19.0, 9.0, 21.0, 6.0, 10.0, 14.0, 7.0, 4.0, 2.0, 2.0, 7.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-30.263290405273438, -29.37462043762207, -28.485952377319336, -27.59728240966797, -26.708614349365234, -25.819944381713867, -24.931276321411133, -24.042606353759766, -23.15393829345703, -22.265268325805664, -21.37660026550293, -20.487930297851562, -19.599262237548828, -18.71059226989746, -17.821924209594727, -16.93325424194336, -16.044586181640625, -15.155917167663574, -14.267248153686523, -13.378579139709473, -12.489910125732422, -11.601240158081055, -10.71257209777832, -9.823902130126953, -8.935232162475586, -8.046563148498535, -7.157894134521484, -6.269225120544434, -5.380556106567383, -4.491886615753174, -3.603217601776123, -2.7145485877990723, -1.8258800506591797, -0.9372109770774841, -0.048541903495788574, 0.8401272296905518, 1.7287962436676025, 2.6174654960632324, 3.506134510040283, 4.394803524017334, 5.283472537994385, 6.1721415519714355, 7.060810565948486, 7.949480056762695, 8.838149070739746, 9.726818084716797, 10.615487098693848, 11.504156112670898, 12.39282512664795, 13.281494140625, 14.17016315460205, 15.058832168579102, 15.947501182556152, 16.836170196533203, 17.72484016418457, 18.613508224487305, 19.502178192138672, 20.39084815979004, 21.279516220092773, 22.16818618774414, 23.056854248046875, 23.945524215698242, 24.834192276000977, 25.722862243652344, 26.611530303955078]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 10.0, 12.0, 17.0, 34.0, 44.0, 53.0, 109.0, 148.0, 246.0, 385.0, 629.0, 1233.0, 2072.0, 3737.0, 6860.0, 12526.0, 22583.0, 42165.0, 77115.0, 132199.0, 196563.0, 205253.0, 148819.0, 88658.0, 48857.0, 26171.0, 14276.0, 7855.0, 4309.0, 2354.0, 1369.0, 759.0, 469.0, 251.0, 143.0, 102.0, 55.0, 30.0, 29.0, 30.0, 14.0, 14.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.75, -49.119140625, -47.48828125, -45.857421875, -44.2265625, -42.595703125, -40.96484375, -39.333984375, -37.703125, -36.072265625, -34.44140625, -32.810546875, -31.1796875, -29.548828125, -27.91796875, -26.287109375, -24.65625, -23.025390625, -21.39453125, -19.763671875, -18.1328125, -16.501953125, -14.87109375, -13.240234375, -11.609375, -9.978515625, -8.34765625, -6.716796875, -5.0859375, -3.455078125, -1.82421875, -0.193359375, 1.4375, 3.068359375, 4.69921875, 6.330078125, 7.9609375, 9.591796875, 11.22265625, 12.853515625, 14.484375, 16.115234375, 17.74609375, 19.376953125, 21.0078125, 22.638671875, 24.26953125, 25.900390625, 27.53125, 29.162109375, 30.79296875, 32.423828125, 34.0546875, 35.685546875, 37.31640625, 38.947265625, 40.578125, 42.208984375, 43.83984375, 45.470703125, 47.1015625, 48.732421875, 50.36328125, 51.994140625, 53.625]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 3.0, 4.0, 4.0, 9.0, 10.0, 10.0, 10.0, 9.0, 13.0, 23.0, 12.0, 18.0, 25.0, 18.0, 27.0, 36.0, 40.0, 45.0, 39.0, 39.0, 50.0, 44.0, 47.0, 40.0, 42.0, 33.0, 32.0, 37.0, 37.0, 37.0, 28.0, 23.0, 15.0, 28.0, 18.0, 13.0, 10.0, 15.0, 10.0, 12.0, 13.0, 7.0, 5.0, 4.0, 1.0, 5.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.90625, -23.09521484375, -22.2841796875, -21.47314453125, -20.662109375, -19.85107421875, -19.0400390625, -18.22900390625, -17.41796875, -16.60693359375, -15.7958984375, -14.98486328125, -14.173828125, -13.36279296875, -12.5517578125, -11.74072265625, -10.9296875, -10.11865234375, -9.3076171875, -8.49658203125, -7.685546875, -6.87451171875, -6.0634765625, -5.25244140625, -4.44140625, -3.63037109375, -2.8193359375, -2.00830078125, -1.197265625, -0.38623046875, 0.4248046875, 1.23583984375, 2.046875, 2.85791015625, 3.6689453125, 4.47998046875, 5.291015625, 6.10205078125, 6.9130859375, 7.72412109375, 8.53515625, 9.34619140625, 10.1572265625, 10.96826171875, 11.779296875, 12.59033203125, 13.4013671875, 14.21240234375, 15.0234375, 15.83447265625, 16.6455078125, 17.45654296875, 18.267578125, 19.07861328125, 19.8896484375, 20.70068359375, 21.51171875, 22.32275390625, 23.1337890625, 23.94482421875, 24.755859375, 25.56689453125, 26.3779296875, 27.18896484375, 28.0]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 4.0, 9.0, 11.0, 14.0, 26.0, 43.0, 50.0, 65.0, 113.0, 182.0, 240.0, 383.0, 525.0, 830.0, 1275.0, 1849.0, 2827.0, 4277.0, 6741.0, 10153.0, 15625.0, 24287.0, 36858.0, 56354.0, 82826.0, 115327.0, 142103.0, 146501.0, 124229.0, 91796.0, 63134.0, 41867.0, 27285.0, 17552.0, 11273.0, 7538.0, 4844.0, 3155.0, 2112.0, 1343.0, 976.0, 668.0, 451.0, 286.0, 184.0, 130.0, 76.0, 39.0, 46.0, 33.0, 18.0, 15.0, 8.0, 3.0, 0.0, 3.0, 1.0, 5.0], "bins": [-33.375, -32.367919921875, -31.36083984375, -30.353759765625, -29.3466796875, -28.339599609375, -27.33251953125, -26.325439453125, -25.318359375, -24.311279296875, -23.30419921875, -22.297119140625, -21.2900390625, -20.282958984375, -19.27587890625, -18.268798828125, -17.26171875, -16.254638671875, -15.24755859375, -14.240478515625, -13.2333984375, -12.226318359375, -11.21923828125, -10.212158203125, -9.205078125, -8.197998046875, -7.19091796875, -6.183837890625, -5.1767578125, -4.169677734375, -3.16259765625, -2.155517578125, -1.1484375, -0.141357421875, 0.86572265625, 1.872802734375, 2.8798828125, 3.886962890625, 4.89404296875, 5.901123046875, 6.908203125, 7.915283203125, 8.92236328125, 9.929443359375, 10.9365234375, 11.943603515625, 12.95068359375, 13.957763671875, 14.96484375, 15.971923828125, 16.97900390625, 17.986083984375, 18.9931640625, 20.000244140625, 21.00732421875, 22.014404296875, 23.021484375, 24.028564453125, 25.03564453125, 26.042724609375, 27.0498046875, 28.056884765625, 29.06396484375, 30.071044921875, 31.078125]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 2.0, 6.0, 6.0, 9.0, 9.0, 13.0, 10.0, 18.0, 23.0, 26.0, 30.0, 25.0, 32.0, 29.0, 33.0, 41.0, 32.0, 46.0, 53.0, 51.0, 49.0, 45.0, 30.0, 37.0, 42.0, 50.0, 36.0, 40.0, 34.0, 21.0, 19.0, 15.0, 15.0, 18.0, 9.0, 15.0, 9.0, 5.0, 11.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-19.25, -18.64208984375, -18.0341796875, -17.42626953125, -16.818359375, -16.21044921875, -15.6025390625, -14.99462890625, -14.38671875, -13.77880859375, -13.1708984375, -12.56298828125, -11.955078125, -11.34716796875, -10.7392578125, -10.13134765625, -9.5234375, -8.91552734375, -8.3076171875, -7.69970703125, -7.091796875, -6.48388671875, -5.8759765625, -5.26806640625, -4.66015625, -4.05224609375, -3.4443359375, -2.83642578125, -2.228515625, -1.62060546875, -1.0126953125, -0.40478515625, 0.203125, 0.81103515625, 1.4189453125, 2.02685546875, 2.634765625, 3.24267578125, 3.8505859375, 4.45849609375, 5.06640625, 5.67431640625, 6.2822265625, 6.89013671875, 7.498046875, 8.10595703125, 8.7138671875, 9.32177734375, 9.9296875, 10.53759765625, 11.1455078125, 11.75341796875, 12.361328125, 12.96923828125, 13.5771484375, 14.18505859375, 14.79296875, 15.40087890625, 16.0087890625, 16.61669921875, 17.224609375, 17.83251953125, 18.4404296875, 19.04833984375, 19.65625]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 8.0, 10.0, 30.0, 29.0, 58.0, 70.0, 110.0, 165.0, 260.0, 406.0, 590.0, 864.0, 1496.0, 2345.0, 3779.0, 6262.0, 10702.0, 19060.0, 34165.0, 65331.0, 128135.0, 227584.0, 241200.0, 143637.0, 73256.0, 38184.0, 20859.0, 11842.0, 6944.0, 4199.0, 2573.0, 1573.0, 1019.0, 632.0, 405.0, 245.0, 172.0, 105.0, 78.0, 60.0, 32.0, 23.0, 23.0, 8.0, 10.0, 7.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-31.609375, -30.624267578125, -29.63916015625, -28.654052734375, -27.6689453125, -26.683837890625, -25.69873046875, -24.713623046875, -23.728515625, -22.743408203125, -21.75830078125, -20.773193359375, -19.7880859375, -18.802978515625, -17.81787109375, -16.832763671875, -15.84765625, -14.862548828125, -13.87744140625, -12.892333984375, -11.9072265625, -10.922119140625, -9.93701171875, -8.951904296875, -7.966796875, -6.981689453125, -5.99658203125, -5.011474609375, -4.0263671875, -3.041259765625, -2.05615234375, -1.071044921875, -0.0859375, 0.899169921875, 1.88427734375, 2.869384765625, 3.8544921875, 4.839599609375, 5.82470703125, 6.809814453125, 7.794921875, 8.780029296875, 9.76513671875, 10.750244140625, 11.7353515625, 12.720458984375, 13.70556640625, 14.690673828125, 15.67578125, 16.660888671875, 17.64599609375, 18.631103515625, 19.6162109375, 20.601318359375, 21.58642578125, 22.571533203125, 23.556640625, 24.541748046875, 25.52685546875, 26.511962890625, 27.4970703125, 28.482177734375, 29.46728515625, 30.452392578125, 31.4375]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 4.0, 5.0, 4.0, 6.0, 10.0, 7.0, 12.0, 17.0, 15.0, 17.0, 23.0, 39.0, 40.0, 46.0, 65.0, 71.0, 65.0, 71.0, 70.0, 73.0, 73.0, 49.0, 49.0, 38.0, 24.0, 23.0, 9.0, 19.0, 13.0, 10.0, 11.0, 7.0, 4.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.002910614013671875, -0.002819061279296875, -0.002727508544921875, -0.002635955810546875, -0.002544403076171875, -0.002452850341796875, -0.002361297607421875, -0.002269744873046875, -0.002178192138671875, -0.002086639404296875, -0.001995086669921875, -0.001903533935546875, -0.001811981201171875, -0.001720428466796875, -0.001628875732421875, -0.001537322998046875, -0.001445770263671875, -0.001354217529296875, -0.001262664794921875, -0.001171112060546875, -0.001079559326171875, -0.000988006591796875, -0.000896453857421875, -0.000804901123046875, -0.000713348388671875, -0.000621795654296875, -0.000530242919921875, -0.000438690185546875, -0.000347137451171875, -0.000255584716796875, -0.000164031982421875, -7.2479248046875e-05, 1.9073486328125e-05, 0.000110626220703125, 0.000202178955078125, 0.000293731689453125, 0.000385284423828125, 0.000476837158203125, 0.000568389892578125, 0.000659942626953125, 0.000751495361328125, 0.000843048095703125, 0.000934600830078125, 0.001026153564453125, 0.001117706298828125, 0.001209259033203125, 0.001300811767578125, 0.001392364501953125, 0.001483917236328125, 0.001575469970703125, 0.001667022705078125, 0.001758575439453125, 0.001850128173828125, 0.001941680908203125, 0.002033233642578125, 0.002124786376953125, 0.002216339111328125, 0.002307891845703125, 0.002399444580078125, 0.002490997314453125, 0.002582550048828125, 0.002674102783203125, 0.002765655517578125, 0.002857208251953125, 0.002948760986328125]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 4.0, 3.0, 7.0, 11.0, 25.0, 25.0, 30.0, 45.0, 55.0, 89.0, 156.0, 216.0, 296.0, 476.0, 751.0, 1073.0, 1798.0, 3001.0, 4828.0, 8299.0, 15280.0, 29221.0, 59803.0, 125905.0, 241303.0, 263066.0, 147400.0, 70518.0, 33623.0, 17496.0, 9493.0, 5405.0, 3328.0, 1963.0, 1244.0, 743.0, 541.0, 338.0, 220.0, 159.0, 117.0, 81.0, 44.0, 21.0, 22.0, 9.0, 10.0, 4.0, 4.0, 11.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.953125, -28.887451171875, -27.82177734375, -26.756103515625, -25.6904296875, -24.624755859375, -23.55908203125, -22.493408203125, -21.427734375, -20.362060546875, -19.29638671875, -18.230712890625, -17.1650390625, -16.099365234375, -15.03369140625, -13.968017578125, -12.90234375, -11.836669921875, -10.77099609375, -9.705322265625, -8.6396484375, -7.573974609375, -6.50830078125, -5.442626953125, -4.376953125, -3.311279296875, -2.24560546875, -1.179931640625, -0.1142578125, 0.951416015625, 2.01708984375, 3.082763671875, 4.1484375, 5.214111328125, 6.27978515625, 7.345458984375, 8.4111328125, 9.476806640625, 10.54248046875, 11.608154296875, 12.673828125, 13.739501953125, 14.80517578125, 15.870849609375, 16.9365234375, 18.002197265625, 19.06787109375, 20.133544921875, 21.19921875, 22.264892578125, 23.33056640625, 24.396240234375, 25.4619140625, 26.527587890625, 27.59326171875, 28.658935546875, 29.724609375, 30.790283203125, 31.85595703125, 32.921630859375, 33.9873046875, 35.052978515625, 36.11865234375, 37.184326171875, 38.25]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 7.0, 4.0, 7.0, 7.0, 6.0, 9.0, 22.0, 14.0, 43.0, 50.0, 60.0, 75.0, 101.0, 120.0, 97.0, 84.0, 76.0, 57.0, 45.0, 37.0, 18.0, 21.0, 19.0, 7.0, 7.0, 4.0, 6.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.4375, -15.982177734375, -15.52685546875, -15.071533203125, -14.6162109375, -14.160888671875, -13.70556640625, -13.250244140625, -12.794921875, -12.339599609375, -11.88427734375, -11.428955078125, -10.9736328125, -10.518310546875, -10.06298828125, -9.607666015625, -9.15234375, -8.697021484375, -8.24169921875, -7.786376953125, -7.3310546875, -6.875732421875, -6.42041015625, -5.965087890625, -5.509765625, -5.054443359375, -4.59912109375, -4.143798828125, -3.6884765625, -3.233154296875, -2.77783203125, -2.322509765625, -1.8671875, -1.411865234375, -0.95654296875, -0.501220703125, -0.0458984375, 0.409423828125, 0.86474609375, 1.320068359375, 1.775390625, 2.230712890625, 2.68603515625, 3.141357421875, 3.5966796875, 4.052001953125, 4.50732421875, 4.962646484375, 5.41796875, 5.873291015625, 6.32861328125, 6.783935546875, 7.2392578125, 7.694580078125, 8.14990234375, 8.605224609375, 9.060546875, 9.515869140625, 9.97119140625, 10.426513671875, 10.8818359375, 11.337158203125, 11.79248046875, 12.247802734375, 12.703125]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 3.0, 5.0, 13.0, 7.0, 6.0, 10.0, 20.0, 17.0, 28.0, 28.0, 29.0, 35.0, 32.0, 32.0, 47.0, 54.0, 53.0, 56.0, 59.0, 46.0, 58.0, 54.0, 41.0, 39.0, 48.0, 30.0, 22.0, 22.0, 15.0, 18.0, 13.0, 5.0, 10.0, 10.0, 8.0, 4.0, 4.0, 5.0, 4.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-28.695228576660156, -27.745759963989258, -26.796293258666992, -25.846824645996094, -24.897357940673828, -23.94788932800293, -22.998422622680664, -22.048954010009766, -21.0994873046875, -20.1500186920166, -19.200551986694336, -18.251083374023438, -17.301616668701172, -16.352148056030273, -15.402681350708008, -14.45321273803711, -13.503745079040527, -12.554277420043945, -11.604809761047363, -10.655342102050781, -9.7058744430542, -8.756406784057617, -7.806938648223877, -6.857470989227295, -5.908003330230713, -4.958535671234131, -4.009068012237549, -3.0596001148223877, -2.1101324558258057, -1.1606645584106445, -0.2111968994140625, 0.7382707595825195, 1.6877384185791016, 2.6372060775756836, 3.5866737365722656, 4.536141395568848, 5.48560905456543, 6.43507719039917, 7.384544849395752, 8.334012985229492, 9.283479690551758, 10.23294734954834, 11.182415008544922, 12.131882667541504, 13.081350326538086, 14.030818939208984, 14.98028564453125, 15.929754257202148, 16.879222869873047, 17.828691482543945, 18.77815818786621, 19.72762680053711, 20.677093505859375, 21.626562118530273, 22.57602882385254, 23.525497436523438, 24.474964141845703, 25.4244327545166, 26.373899459838867, 27.323368072509766, 28.27283477783203, 29.22230339050293, 30.171770095825195, 31.121238708496094, 32.07070541381836]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 5.0, 6.0, 3.0, 8.0, 7.0, 11.0, 12.0, 18.0, 7.0, 21.0, 28.0, 24.0, 28.0, 29.0, 31.0, 36.0, 38.0, 23.0, 34.0, 42.0, 36.0, 31.0, 43.0, 34.0, 50.0, 33.0, 46.0, 41.0, 27.0, 29.0, 42.0, 28.0, 25.0, 17.0, 19.0, 18.0, 16.0, 14.0, 10.0, 3.0, 8.0, 6.0, 3.0, 6.0, 5.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.04069709777832, -26.171142578125, -25.30158805847168, -24.43203353881836, -23.562477111816406, -22.69292449951172, -21.823368072509766, -20.953813552856445, -20.084259033203125, -19.214704513549805, -18.345149993896484, -17.475595474243164, -16.606040954589844, -15.736485481262207, -14.86693000793457, -13.99737548828125, -13.12782096862793, -12.25826644897461, -11.388711929321289, -10.519156455993652, -9.649601936340332, -8.780047416687012, -7.910492420196533, -7.040937423706055, -6.171382904052734, -5.301828384399414, -4.4322733879089355, -3.562718629837036, -2.6931638717651367, -1.8236093521118164, -0.9540543556213379, -0.08449935913085938, 0.7850532531738281, 1.6546080112457275, 2.524162769317627, 3.3937175273895264, 4.263272285461426, 5.132826805114746, 6.002381801605225, 6.871936798095703, 7.741491317749023, 8.611045837402344, 9.480600357055664, 10.3501558303833, 11.219710350036621, 12.089264869689941, 12.958820343017578, 13.828374862670898, 14.697929382324219, 15.567483901977539, 16.43703842163086, 17.30659294128418, 18.1761474609375, 19.045703887939453, 19.915258407592773, 20.784812927246094, 21.654367446899414, 22.523921966552734, 23.393476486206055, 24.263031005859375, 25.132587432861328, 26.002140045166016, 26.87169647216797, 27.74125099182129, 28.61080551147461]}, "gradients/decoder.bert.encoder.layer.19.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 9.0, 7.0, 13.0, 23.0, 43.0, 62.0, 59.0, 132.0, 158.0, 244.0, 368.0, 502.0, 779.0, 1131.0, 1789.0, 2623.0, 4073.0, 6447.0, 10273.0, 16601.0, 27857.0, 48004.0, 86112.0, 166367.0, 353826.0, 760560.0, 1105716.0, 817969.0, 389793.0, 179536.0, 90582.0, 49403.0, 28314.0, 16822.0, 10228.0, 6476.0, 4001.0, 2612.0, 1592.0, 1040.0, 770.0, 434.0, 344.0, 197.0, 122.0, 102.0, 68.0, 42.0, 30.0, 17.0, 10.0, 6.0, 5.0, 0.0, 4.0], "bins": [-33.78125, -32.8310546875, -31.880859375, -30.9306640625, -29.98046875, -29.0302734375, -28.080078125, -27.1298828125, -26.1796875, -25.2294921875, -24.279296875, -23.3291015625, -22.37890625, -21.4287109375, -20.478515625, -19.5283203125, -18.578125, -17.6279296875, -16.677734375, -15.7275390625, -14.77734375, -13.8271484375, -12.876953125, -11.9267578125, -10.9765625, -10.0263671875, -9.076171875, -8.1259765625, -7.17578125, -6.2255859375, -5.275390625, -4.3251953125, -3.375, -2.4248046875, -1.474609375, -0.5244140625, 0.42578125, 1.3759765625, 2.326171875, 3.2763671875, 4.2265625, 5.1767578125, 6.126953125, 7.0771484375, 8.02734375, 8.9775390625, 9.927734375, 10.8779296875, 11.828125, 12.7783203125, 13.728515625, 14.6787109375, 15.62890625, 16.5791015625, 17.529296875, 18.4794921875, 19.4296875, 20.3798828125, 21.330078125, 22.2802734375, 23.23046875, 24.1806640625, 25.130859375, 26.0810546875, 27.03125]}, "gradients/decoder.bert.encoder.layer.19.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 4.0, 3.0, 8.0, 8.0, 17.0, 21.0, 18.0, 11.0, 22.0, 25.0, 19.0, 20.0, 36.0, 37.0, 37.0, 42.0, 37.0, 32.0, 39.0, 47.0, 37.0, 35.0, 58.0, 39.0, 42.0, 33.0, 29.0, 33.0, 27.0, 36.0, 24.0, 19.0, 14.0, 19.0, 9.0, 17.0, 8.0, 7.0, 6.0, 9.0, 4.0, 6.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.984375, -19.38330078125, -18.7822265625, -18.18115234375, -17.580078125, -16.97900390625, -16.3779296875, -15.77685546875, -15.17578125, -14.57470703125, -13.9736328125, -13.37255859375, -12.771484375, -12.17041015625, -11.5693359375, -10.96826171875, -10.3671875, -9.76611328125, -9.1650390625, -8.56396484375, -7.962890625, -7.36181640625, -6.7607421875, -6.15966796875, -5.55859375, -4.95751953125, -4.3564453125, -3.75537109375, -3.154296875, -2.55322265625, -1.9521484375, -1.35107421875, -0.75, -0.14892578125, 0.4521484375, 1.05322265625, 1.654296875, 2.25537109375, 2.8564453125, 3.45751953125, 4.05859375, 4.65966796875, 5.2607421875, 5.86181640625, 6.462890625, 7.06396484375, 7.6650390625, 8.26611328125, 8.8671875, 9.46826171875, 10.0693359375, 10.67041015625, 11.271484375, 11.87255859375, 12.4736328125, 13.07470703125, 13.67578125, 14.27685546875, 14.8779296875, 15.47900390625, 16.080078125, 16.68115234375, 17.2822265625, 17.88330078125, 18.484375]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 5.0, 6.0, 4.0, 7.0, 8.0, 22.0, 21.0, 38.0, 67.0, 119.0, 152.0, 250.0, 371.0, 533.0, 838.0, 1258.0, 1825.0, 2897.0, 4563.0, 7433.0, 12340.0, 21072.0, 35952.0, 64460.0, 118962.0, 226504.0, 439647.0, 803748.0, 1009987.0, 674667.0, 355172.0, 183734.0, 97283.0, 53682.0, 30527.0, 17777.0, 10702.0, 6321.0, 4009.0, 2494.0, 1613.0, 1050.0, 719.0, 470.0, 290.0, 223.0, 151.0, 99.0, 88.0, 38.0, 32.0, 22.0, 10.0, 11.0, 9.0, 7.0, 2.0, 6.0, 2.0, 2.0], "bins": [-31.09375, -30.13232421875, -29.1708984375, -28.20947265625, -27.248046875, -26.28662109375, -25.3251953125, -24.36376953125, -23.40234375, -22.44091796875, -21.4794921875, -20.51806640625, -19.556640625, -18.59521484375, -17.6337890625, -16.67236328125, -15.7109375, -14.74951171875, -13.7880859375, -12.82666015625, -11.865234375, -10.90380859375, -9.9423828125, -8.98095703125, -8.01953125, -7.05810546875, -6.0966796875, -5.13525390625, -4.173828125, -3.21240234375, -2.2509765625, -1.28955078125, -0.328125, 0.63330078125, 1.5947265625, 2.55615234375, 3.517578125, 4.47900390625, 5.4404296875, 6.40185546875, 7.36328125, 8.32470703125, 9.2861328125, 10.24755859375, 11.208984375, 12.17041015625, 13.1318359375, 14.09326171875, 15.0546875, 16.01611328125, 16.9775390625, 17.93896484375, 18.900390625, 19.86181640625, 20.8232421875, 21.78466796875, 22.74609375, 23.70751953125, 24.6689453125, 25.63037109375, 26.591796875, 27.55322265625, 28.5146484375, 29.47607421875, 30.4375]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 5.0, 3.0, 9.0, 7.0, 13.0, 14.0, 12.0, 21.0, 22.0, 39.0, 37.0, 53.0, 79.0, 89.0, 105.0, 166.0, 168.0, 175.0, 240.0, 302.0, 325.0, 349.0, 297.0, 268.0, 216.0, 201.0, 163.0, 166.0, 112.0, 104.0, 76.0, 54.0, 39.0, 32.0, 29.0, 16.0, 18.0, 9.0, 15.0, 4.0, 5.0, 6.0, 6.0, 0.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.5234375, -11.14599609375, -10.7685546875, -10.39111328125, -10.013671875, -9.63623046875, -9.2587890625, -8.88134765625, -8.50390625, -8.12646484375, -7.7490234375, -7.37158203125, -6.994140625, -6.61669921875, -6.2392578125, -5.86181640625, -5.484375, -5.10693359375, -4.7294921875, -4.35205078125, -3.974609375, -3.59716796875, -3.2197265625, -2.84228515625, -2.46484375, -2.08740234375, -1.7099609375, -1.33251953125, -0.955078125, -0.57763671875, -0.2001953125, 0.17724609375, 0.5546875, 0.93212890625, 1.3095703125, 1.68701171875, 2.064453125, 2.44189453125, 2.8193359375, 3.19677734375, 3.57421875, 3.95166015625, 4.3291015625, 4.70654296875, 5.083984375, 5.46142578125, 5.8388671875, 6.21630859375, 6.59375, 6.97119140625, 7.3486328125, 7.72607421875, 8.103515625, 8.48095703125, 8.8583984375, 9.23583984375, 9.61328125, 9.99072265625, 10.3681640625, 10.74560546875, 11.123046875, 11.50048828125, 11.8779296875, 12.25537109375, 12.6328125]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 3.0, 3.0, 3.0, 2.0, 11.0, 14.0, 9.0, 20.0, 18.0, 24.0, 28.0, 27.0, 39.0, 36.0, 56.0, 44.0, 53.0, 49.0, 56.0, 56.0, 55.0, 52.0, 50.0, 45.0, 45.0, 32.0, 28.0, 23.0, 20.0, 20.0, 12.0, 10.0, 5.0, 13.0, 4.0, 8.0, 8.0, 3.0, 4.0, 1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0], "bins": [-32.94244384765625, -32.026336669921875, -31.110227584838867, -30.19411849975586, -29.278011322021484, -28.361902236938477, -27.44579315185547, -26.529685974121094, -25.613576889038086, -24.697467803955078, -23.781360626220703, -22.865251541137695, -21.949142456054688, -21.033035278320312, -20.116926193237305, -19.200817108154297, -18.284709930419922, -17.368600845336914, -16.45249366760254, -15.536384582519531, -14.62027645111084, -13.704168319702148, -12.78805923461914, -11.87195110321045, -10.955842971801758, -10.039734840393066, -9.123626708984375, -8.207517623901367, -7.291409492492676, -6.375301361083984, -5.459192752838135, -4.543084144592285, -3.626974105834961, -2.7108657360076904, -1.79475736618042, -0.8786489963531494, 0.037459373474121094, 0.9535675048828125, 1.869676113128662, 2.7857847213745117, 3.701892852783203, 4.6180009841918945, 5.534109592437744, 6.450218200683594, 7.366326332092285, 8.282434463500977, 9.198543548583984, 10.114651679992676, 11.030759811401367, 11.946867942810059, 12.86297607421875, 13.779085159301758, 14.69519329071045, 15.61130142211914, 16.52741050720215, 17.443519592285156, 18.35962677001953, 19.27573585510254, 20.191843032836914, 21.107952117919922, 22.024059295654297, 22.940168380737305, 23.856277465820312, 24.772384643554688, 25.688493728637695]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 4.0, 3.0, 5.0, 6.0, 9.0, 8.0, 10.0, 7.0, 13.0, 9.0, 14.0, 17.0, 24.0, 18.0, 15.0, 19.0, 25.0, 28.0, 36.0, 36.0, 34.0, 37.0, 44.0, 38.0, 29.0, 34.0, 34.0, 43.0, 46.0, 42.0, 26.0, 33.0, 24.0, 25.0, 19.0, 25.0, 24.0, 17.0, 13.0, 19.0, 14.0, 15.0, 7.0, 9.0, 14.0, 7.0, 9.0, 5.0, 5.0, 3.0, 4.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0], "bins": [-24.238008499145508, -23.473983764648438, -22.7099609375, -21.94593620300293, -21.18191146850586, -20.41788673400879, -19.65386199951172, -18.88983917236328, -18.12581443786621, -17.36178970336914, -16.597766876220703, -15.833742141723633, -15.069717407226562, -14.305692672729492, -13.541668891906738, -12.777645111083984, -12.013620376586914, -11.249595642089844, -10.48557186126709, -9.721548080444336, -8.957523345947266, -8.193498611450195, -7.429474830627441, -6.665450572967529, -5.901426315307617, -5.137402057647705, -4.373377799987793, -3.609353542327881, -2.8453292846679688, -2.0813050270080566, -1.3172807693481445, -0.5532565116882324, 0.2107696533203125, 0.9747939109802246, 1.7388181686401367, 2.502842426300049, 3.266866683959961, 4.030890941619873, 4.794915199279785, 5.558939456939697, 6.322963714599609, 7.0869879722595215, 7.851012229919434, 8.615036010742188, 9.379060745239258, 10.143085479736328, 10.907109260559082, 11.671133041381836, 12.435157775878906, 13.199182510375977, 13.96320629119873, 14.727230072021484, 15.491254806518555, 16.255279541015625, 17.019302368164062, 17.783327102661133, 18.547351837158203, 19.311376571655273, 20.075401306152344, 20.83942413330078, 21.60344886779785, 22.367473602294922, 23.13149642944336, 23.89552116394043, 24.6595458984375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 8.0, 9.0, 8.0, 10.0, 26.0, 24.0, 45.0, 55.0, 78.0, 134.0, 202.0, 314.0, 426.0, 674.0, 1000.0, 1470.0, 2185.0, 3453.0, 5416.0, 8505.0, 14178.0, 23495.0, 40416.0, 71634.0, 127461.0, 200170.0, 210690.0, 141321.0, 80729.0, 45499.0, 26478.0, 15654.0, 9691.0, 5938.0, 3927.0, 2446.0, 1631.0, 1085.0, 690.0, 460.0, 303.0, 195.0, 122.0, 102.0, 66.0, 56.0, 32.0, 17.0, 12.0, 9.0, 7.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-34.0, -32.94091796875, -31.8818359375, -30.82275390625, -29.763671875, -28.70458984375, -27.6455078125, -26.58642578125, -25.52734375, -24.46826171875, -23.4091796875, -22.35009765625, -21.291015625, -20.23193359375, -19.1728515625, -18.11376953125, -17.0546875, -15.99560546875, -14.9365234375, -13.87744140625, -12.818359375, -11.75927734375, -10.7001953125, -9.64111328125, -8.58203125, -7.52294921875, -6.4638671875, -5.40478515625, -4.345703125, -3.28662109375, -2.2275390625, -1.16845703125, -0.109375, 0.94970703125, 2.0087890625, 3.06787109375, 4.126953125, 5.18603515625, 6.2451171875, 7.30419921875, 8.36328125, 9.42236328125, 10.4814453125, 11.54052734375, 12.599609375, 13.65869140625, 14.7177734375, 15.77685546875, 16.8359375, 17.89501953125, 18.9541015625, 20.01318359375, 21.072265625, 22.13134765625, 23.1904296875, 24.24951171875, 25.30859375, 26.36767578125, 27.4267578125, 28.48583984375, 29.544921875, 30.60400390625, 31.6630859375, 32.72216796875, 33.78125]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 1.0, 7.0, 4.0, 4.0, 4.0, 7.0, 6.0, 9.0, 13.0, 14.0, 8.0, 9.0, 17.0, 21.0, 26.0, 15.0, 26.0, 26.0, 24.0, 32.0, 32.0, 38.0, 48.0, 39.0, 34.0, 34.0, 24.0, 43.0, 60.0, 43.0, 38.0, 28.0, 26.0, 31.0, 24.0, 19.0, 24.0, 25.0, 13.0, 13.0, 11.0, 15.0, 9.0, 6.0, 11.0, 10.0, 11.0, 9.0, 4.0, 5.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-23.203125, -22.439208984375, -21.67529296875, -20.911376953125, -20.1474609375, -19.383544921875, -18.61962890625, -17.855712890625, -17.091796875, -16.327880859375, -15.56396484375, -14.800048828125, -14.0361328125, -13.272216796875, -12.50830078125, -11.744384765625, -10.98046875, -10.216552734375, -9.45263671875, -8.688720703125, -7.9248046875, -7.160888671875, -6.39697265625, -5.633056640625, -4.869140625, -4.105224609375, -3.34130859375, -2.577392578125, -1.8134765625, -1.049560546875, -0.28564453125, 0.478271484375, 1.2421875, 2.006103515625, 2.77001953125, 3.533935546875, 4.2978515625, 5.061767578125, 5.82568359375, 6.589599609375, 7.353515625, 8.117431640625, 8.88134765625, 9.645263671875, 10.4091796875, 11.173095703125, 11.93701171875, 12.700927734375, 13.46484375, 14.228759765625, 14.99267578125, 15.756591796875, 16.5205078125, 17.284423828125, 18.04833984375, 18.812255859375, 19.576171875, 20.340087890625, 21.10400390625, 21.867919921875, 22.6318359375, 23.395751953125, 24.15966796875, 24.923583984375, 25.6875]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 10.0, 11.0, 13.0, 18.0, 24.0, 27.0, 47.0, 67.0, 102.0, 136.0, 174.0, 240.0, 365.0, 553.0, 787.0, 1148.0, 1964.0, 2883.0, 4853.0, 8771.0, 16792.0, 36609.0, 93884.0, 271205.0, 364846.0, 141723.0, 51611.0, 22245.0, 11003.0, 6198.0, 3607.0, 2197.0, 1440.0, 957.0, 620.0, 432.0, 303.0, 190.0, 157.0, 110.0, 76.0, 42.0, 37.0, 30.0, 17.0, 21.0, 6.0, 5.0, 4.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0], "bins": [-58.28125, -56.525390625, -54.76953125, -53.013671875, -51.2578125, -49.501953125, -47.74609375, -45.990234375, -44.234375, -42.478515625, -40.72265625, -38.966796875, -37.2109375, -35.455078125, -33.69921875, -31.943359375, -30.1875, -28.431640625, -26.67578125, -24.919921875, -23.1640625, -21.408203125, -19.65234375, -17.896484375, -16.140625, -14.384765625, -12.62890625, -10.873046875, -9.1171875, -7.361328125, -5.60546875, -3.849609375, -2.09375, -0.337890625, 1.41796875, 3.173828125, 4.9296875, 6.685546875, 8.44140625, 10.197265625, 11.953125, 13.708984375, 15.46484375, 17.220703125, 18.9765625, 20.732421875, 22.48828125, 24.244140625, 26.0, 27.755859375, 29.51171875, 31.267578125, 33.0234375, 34.779296875, 36.53515625, 38.291015625, 40.046875, 41.802734375, 43.55859375, 45.314453125, 47.0703125, 48.826171875, 50.58203125, 52.337890625, 54.09375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 4.0, 3.0, 1.0, 6.0, 13.0, 14.0, 8.0, 15.0, 10.0, 18.0, 13.0, 13.0, 23.0, 20.0, 30.0, 35.0, 44.0, 25.0, 34.0, 41.0, 37.0, 43.0, 49.0, 38.0, 34.0, 41.0, 44.0, 34.0, 16.0, 39.0, 26.0, 33.0, 28.0, 25.0, 22.0, 21.0, 17.0, 17.0, 16.0, 10.0, 9.0, 7.0, 11.0, 3.0, 7.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-14.875, -14.3944091796875, -13.913818359375, -13.4332275390625, -12.95263671875, -12.4720458984375, -11.991455078125, -11.5108642578125, -11.0302734375, -10.5496826171875, -10.069091796875, -9.5885009765625, -9.10791015625, -8.6273193359375, -8.146728515625, -7.6661376953125, -7.185546875, -6.7049560546875, -6.224365234375, -5.7437744140625, -5.26318359375, -4.7825927734375, -4.302001953125, -3.8214111328125, -3.3408203125, -2.8602294921875, -2.379638671875, -1.8990478515625, -1.41845703125, -0.9378662109375, -0.457275390625, 0.0233154296875, 0.50390625, 0.9844970703125, 1.465087890625, 1.9456787109375, 2.42626953125, 2.9068603515625, 3.387451171875, 3.8680419921875, 4.3486328125, 4.8292236328125, 5.309814453125, 5.7904052734375, 6.27099609375, 6.7515869140625, 7.232177734375, 7.7127685546875, 8.193359375, 8.6739501953125, 9.154541015625, 9.6351318359375, 10.11572265625, 10.5963134765625, 11.076904296875, 11.5574951171875, 12.0380859375, 12.5186767578125, 12.999267578125, 13.4798583984375, 13.96044921875, 14.4410400390625, 14.921630859375, 15.4022216796875, 15.8828125]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 4.0, 7.0, 11.0, 21.0, 18.0, 29.0, 33.0, 55.0, 74.0, 89.0, 127.0, 169.0, 291.0, 399.0, 626.0, 894.0, 1480.0, 2274.0, 3906.0, 7191.0, 13999.0, 31392.0, 81848.0, 251586.0, 404664.0, 150164.0, 51526.0, 21201.0, 10288.0, 5509.0, 3170.0, 1925.0, 1153.0, 789.0, 484.0, 358.0, 237.0, 168.0, 118.0, 71.0, 63.0, 46.0, 25.0, 21.0, 15.0, 10.0, 7.0, 8.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0], "bins": [-23.28125, -22.536865234375, -21.79248046875, -21.048095703125, -20.3037109375, -19.559326171875, -18.81494140625, -18.070556640625, -17.326171875, -16.581787109375, -15.83740234375, -15.093017578125, -14.3486328125, -13.604248046875, -12.85986328125, -12.115478515625, -11.37109375, -10.626708984375, -9.88232421875, -9.137939453125, -8.3935546875, -7.649169921875, -6.90478515625, -6.160400390625, -5.416015625, -4.671630859375, -3.92724609375, -3.182861328125, -2.4384765625, -1.694091796875, -0.94970703125, -0.205322265625, 0.5390625, 1.283447265625, 2.02783203125, 2.772216796875, 3.5166015625, 4.260986328125, 5.00537109375, 5.749755859375, 6.494140625, 7.238525390625, 7.98291015625, 8.727294921875, 9.4716796875, 10.216064453125, 10.96044921875, 11.704833984375, 12.44921875, 13.193603515625, 13.93798828125, 14.682373046875, 15.4267578125, 16.171142578125, 16.91552734375, 17.659912109375, 18.404296875, 19.148681640625, 19.89306640625, 20.637451171875, 21.3818359375, 22.126220703125, 22.87060546875, 23.614990234375, 24.359375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 8.0, 3.0, 11.0, 23.0, 31.0, 55.0, 95.0, 114.0, 171.0, 160.0, 119.0, 65.0, 43.0, 34.0, 18.0, 15.0, 11.0, 11.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002227783203125, -0.002148240804672241, -0.0020686984062194824, -0.0019891560077667236, -0.0019096136093139648, -0.001830071210861206, -0.0017505288124084473, -0.0016709864139556885, -0.0015914440155029297, -0.001511901617050171, -0.0014323592185974121, -0.0013528168201446533, -0.0012732744216918945, -0.0011937320232391357, -0.001114189624786377, -0.0010346472263336182, -0.0009551048278808594, -0.0008755624294281006, -0.0007960200309753418, -0.000716477632522583, -0.0006369352340698242, -0.0005573928356170654, -0.00047785043716430664, -0.00039830803871154785, -0.00031876564025878906, -0.00023922324180603027, -0.00015968084335327148, -8.01384449005127e-05, -5.960464477539062e-07, 7.894635200500488e-05, 0.00015848875045776367, 0.00023803114891052246, 0.00031757354736328125, 0.00039711594581604004, 0.00047665834426879883, 0.0005562007427215576, 0.0006357431411743164, 0.0007152855396270752, 0.000794827938079834, 0.0008743703365325928, 0.0009539127349853516, 0.0010334551334381104, 0.0011129975318908691, 0.001192539930343628, 0.0012720823287963867, 0.0013516247272491455, 0.0014311671257019043, 0.001510709524154663, 0.0015902519226074219, 0.0016697943210601807, 0.0017493367195129395, 0.0018288791179656982, 0.001908421516418457, 0.001987963914871216, 0.0020675063133239746, 0.0021470487117767334, 0.002226591110229492, 0.002306133508682251, 0.0023856759071350098, 0.0024652183055877686, 0.0025447607040405273, 0.002624303102493286, 0.002703845500946045, 0.0027833878993988037, 0.0028629302978515625]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 4.0, 3.0, 3.0, 6.0, 8.0, 18.0, 16.0, 28.0, 33.0, 39.0, 77.0, 105.0, 135.0, 193.0, 253.0, 341.0, 513.0, 773.0, 1180.0, 1789.0, 2878.0, 4337.0, 7461.0, 12984.0, 23460.0, 45649.0, 93299.0, 190333.0, 273352.0, 192067.0, 94409.0, 45878.0, 23462.0, 13141.0, 7384.0, 4438.0, 2811.0, 1842.0, 1247.0, 766.0, 549.0, 404.0, 279.0, 167.0, 129.0, 95.0, 62.0, 58.0, 41.0, 24.0, 15.0, 6.0, 4.0, 4.0, 2.0, 2.0, 4.0, 4.0, 2.0, 1.0, 1.0], "bins": [-17.453125, -16.899169921875, -16.34521484375, -15.791259765625, -15.2373046875, -14.683349609375, -14.12939453125, -13.575439453125, -13.021484375, -12.467529296875, -11.91357421875, -11.359619140625, -10.8056640625, -10.251708984375, -9.69775390625, -9.143798828125, -8.58984375, -8.035888671875, -7.48193359375, -6.927978515625, -6.3740234375, -5.820068359375, -5.26611328125, -4.712158203125, -4.158203125, -3.604248046875, -3.05029296875, -2.496337890625, -1.9423828125, -1.388427734375, -0.83447265625, -0.280517578125, 0.2734375, 0.827392578125, 1.38134765625, 1.935302734375, 2.4892578125, 3.043212890625, 3.59716796875, 4.151123046875, 4.705078125, 5.259033203125, 5.81298828125, 6.366943359375, 6.9208984375, 7.474853515625, 8.02880859375, 8.582763671875, 9.13671875, 9.690673828125, 10.24462890625, 10.798583984375, 11.3525390625, 11.906494140625, 12.46044921875, 13.014404296875, 13.568359375, 14.122314453125, 14.67626953125, 15.230224609375, 15.7841796875, 16.338134765625, 16.89208984375, 17.446044921875, 18.0]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 5.0, 2.0, 1.0, 3.0, 10.0, 5.0, 13.0, 24.0, 14.0, 27.0, 42.0, 44.0, 46.0, 64.0, 86.0, 83.0, 84.0, 92.0, 81.0, 56.0, 56.0, 53.0, 25.0, 22.0, 16.0, 10.0, 11.0, 8.0, 5.0, 3.0, 6.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.33203125, -6.11590576171875, -5.8997802734375, -5.68365478515625, -5.467529296875, -5.25140380859375, -5.0352783203125, -4.81915283203125, -4.60302734375, -4.38690185546875, -4.1707763671875, -3.95465087890625, -3.738525390625, -3.52239990234375, -3.3062744140625, -3.09014892578125, -2.8740234375, -2.65789794921875, -2.4417724609375, -2.22564697265625, -2.009521484375, -1.79339599609375, -1.5772705078125, -1.36114501953125, -1.14501953125, -0.92889404296875, -0.7127685546875, -0.49664306640625, -0.280517578125, -0.06439208984375, 0.1517333984375, 0.36785888671875, 0.583984375, 0.80010986328125, 1.0162353515625, 1.23236083984375, 1.448486328125, 1.66461181640625, 1.8807373046875, 2.09686279296875, 2.31298828125, 2.52911376953125, 2.7452392578125, 2.96136474609375, 3.177490234375, 3.39361572265625, 3.6097412109375, 3.82586669921875, 4.0419921875, 4.25811767578125, 4.4742431640625, 4.69036865234375, 4.906494140625, 5.12261962890625, 5.3387451171875, 5.55487060546875, 5.77099609375, 5.98712158203125, 6.2032470703125, 6.41937255859375, 6.635498046875, 6.85162353515625, 7.0677490234375, 7.28387451171875, 7.5]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 1.0, 4.0, 3.0, 7.0, 7.0, 4.0, 7.0, 13.0, 20.0, 32.0, 23.0, 33.0, 26.0, 52.0, 65.0, 57.0, 61.0, 73.0, 73.0, 62.0, 58.0, 51.0, 54.0, 44.0, 39.0, 23.0, 27.0, 22.0, 14.0, 11.0, 11.0, 2.0, 2.0, 9.0, 9.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.64973831176758, -37.58329772949219, -36.51686096191406, -35.45042037963867, -34.38397979736328, -33.317543029785156, -32.251102447509766, -31.184663772583008, -30.11822509765625, -29.051786422729492, -27.985347747802734, -26.918907165527344, -25.852468490600586, -24.786029815673828, -23.719589233398438, -22.65315055847168, -21.586711883544922, -20.520273208618164, -19.453834533691406, -18.387393951416016, -17.320955276489258, -16.2545166015625, -15.188076972961426, -14.121637344360352, -13.055198669433594, -11.988759994506836, -10.922320365905762, -9.855880737304688, -8.78944206237793, -7.723002910614014, -6.656563758850098, -5.590124607086182, -4.523689270019531, -3.4572501182556152, -2.390810966491699, -1.3243718147277832, -0.2579326629638672, 0.8085064888000488, 1.8749456405639648, 2.941384792327881, 4.007823944091797, 5.074263095855713, 6.140702247619629, 7.207141399383545, 8.273580551147461, 9.340019226074219, 10.406458854675293, 11.472898483276367, 12.539337158203125, 13.605775833129883, 14.672215461730957, 15.738655090332031, 16.80509376525879, 17.871532440185547, 18.937973022460938, 20.004411697387695, 21.070850372314453, 22.13728904724121, 23.20372772216797, 24.27016830444336, 25.336606979370117, 26.403045654296875, 27.469486236572266, 28.535924911499023, 29.60236358642578]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 2.0, 7.0, 3.0, 4.0, 7.0, 11.0, 9.0, 7.0, 10.0, 8.0, 15.0, 13.0, 16.0, 13.0, 19.0, 19.0, 23.0, 20.0, 23.0, 27.0, 26.0, 42.0, 37.0, 33.0, 33.0, 29.0, 41.0, 31.0, 38.0, 37.0, 32.0, 40.0, 44.0, 26.0, 24.0, 22.0, 21.0, 19.0, 19.0, 19.0, 16.0, 16.0, 23.0, 5.0, 14.0, 12.0, 9.0, 10.0, 6.0, 6.0, 8.0, 4.0, 2.0, 5.0, 5.0, 0.0, 1.0, 2.0, 5.0, 1.0], "bins": [-21.573646545410156, -20.88542938232422, -20.19721221923828, -19.508995056152344, -18.820775985717773, -18.132558822631836, -17.4443416595459, -16.75612449645996, -16.06790542602539, -15.379688262939453, -14.6914701461792, -14.003252983093262, -13.315034866333008, -12.62681770324707, -11.938600540161133, -11.250383377075195, -10.562166213989258, -9.87394905090332, -9.185730934143066, -8.497513771057129, -7.809296131134033, -7.1210784912109375, -6.432861328125, -5.744643688201904, -5.056426048278809, -4.368208408355713, -3.6799910068511963, -2.9917736053466797, -2.303555965423584, -1.6153383255004883, -0.9271211624145508, -0.23890352249145508, 0.44931602478027344, 1.1375335454940796, 1.8257510662078857, 2.5139684677124023, 3.202186107635498, 3.8904037475585938, 4.578620910644531, 5.266838550567627, 5.955056190490723, 6.643273830413818, 7.331491470336914, 8.019708633422852, 8.707925796508789, 9.396143913269043, 10.08436107635498, 10.772579193115234, 11.460796356201172, 12.14901351928711, 12.837231636047363, 13.5254487991333, 14.213666915893555, 14.901884078979492, 15.59010124206543, 16.278318405151367, 16.966537475585938, 17.654754638671875, 18.342971801757812, 19.03118896484375, 19.71940803527832, 20.407625198364258, 21.095842361450195, 21.784059524536133, 22.47227668762207]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 5.0, 5.0, 2.0, 6.0, 18.0, 14.0, 20.0, 25.0, 43.0, 54.0, 80.0, 147.0, 209.0, 332.0, 560.0, 939.0, 1608.0, 2865.0, 4711.0, 8638.0, 15448.0, 29074.0, 55112.0, 102144.0, 172028.0, 221212.0, 185136.0, 114001.0, 61455.0, 32741.0, 17334.0, 9473.0, 5431.0, 3153.0, 1786.0, 1074.0, 625.0, 379.0, 220.0, 143.0, 114.0, 72.0, 36.0, 21.0, 16.0, 11.0, 12.0, 6.0, 6.0, 8.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-46.53125, -45.103515625, -43.67578125, -42.248046875, -40.8203125, -39.392578125, -37.96484375, -36.537109375, -35.109375, -33.681640625, -32.25390625, -30.826171875, -29.3984375, -27.970703125, -26.54296875, -25.115234375, -23.6875, -22.259765625, -20.83203125, -19.404296875, -17.9765625, -16.548828125, -15.12109375, -13.693359375, -12.265625, -10.837890625, -9.41015625, -7.982421875, -6.5546875, -5.126953125, -3.69921875, -2.271484375, -0.84375, 0.583984375, 2.01171875, 3.439453125, 4.8671875, 6.294921875, 7.72265625, 9.150390625, 10.578125, 12.005859375, 13.43359375, 14.861328125, 16.2890625, 17.716796875, 19.14453125, 20.572265625, 22.0, 23.427734375, 24.85546875, 26.283203125, 27.7109375, 29.138671875, 30.56640625, 31.994140625, 33.421875, 34.849609375, 36.27734375, 37.705078125, 39.1328125, 40.560546875, 41.98828125, 43.416015625, 44.84375]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 6.0, 6.0, 8.0, 7.0, 10.0, 6.0, 17.0, 12.0, 16.0, 8.0, 24.0, 18.0, 24.0, 30.0, 17.0, 41.0, 33.0, 33.0, 44.0, 36.0, 38.0, 29.0, 26.0, 45.0, 36.0, 46.0, 47.0, 29.0, 32.0, 32.0, 30.0, 21.0, 27.0, 22.0, 21.0, 20.0, 11.0, 19.0, 14.0, 9.0, 11.0, 13.0, 1.0, 8.0, 4.0, 6.0, 2.0, 4.0, 5.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.3125, -20.622802734375, -19.93310546875, -19.243408203125, -18.5537109375, -17.864013671875, -17.17431640625, -16.484619140625, -15.794921875, -15.105224609375, -14.41552734375, -13.725830078125, -13.0361328125, -12.346435546875, -11.65673828125, -10.967041015625, -10.27734375, -9.587646484375, -8.89794921875, -8.208251953125, -7.5185546875, -6.828857421875, -6.13916015625, -5.449462890625, -4.759765625, -4.070068359375, -3.38037109375, -2.690673828125, -2.0009765625, -1.311279296875, -0.62158203125, 0.068115234375, 0.7578125, 1.447509765625, 2.13720703125, 2.826904296875, 3.5166015625, 4.206298828125, 4.89599609375, 5.585693359375, 6.275390625, 6.965087890625, 7.65478515625, 8.344482421875, 9.0341796875, 9.723876953125, 10.41357421875, 11.103271484375, 11.79296875, 12.482666015625, 13.17236328125, 13.862060546875, 14.5517578125, 15.241455078125, 15.93115234375, 16.620849609375, 17.310546875, 18.000244140625, 18.68994140625, 19.379638671875, 20.0693359375, 20.759033203125, 21.44873046875, 22.138427734375, 22.828125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 8.0, 8.0, 10.0, 15.0, 22.0, 34.0, 52.0, 72.0, 117.0, 178.0, 245.0, 385.0, 580.0, 920.0, 1447.0, 2152.0, 3354.0, 5352.0, 8276.0, 13269.0, 20618.0, 32850.0, 51662.0, 79269.0, 114072.0, 146385.0, 155756.0, 133467.0, 97386.0, 65522.0, 42208.0, 26447.0, 17062.0, 10433.0, 6662.0, 4265.0, 2755.0, 1833.0, 1152.0, 775.0, 464.0, 332.0, 221.0, 156.0, 107.0, 69.0, 51.0, 27.0, 13.0, 17.0, 14.0, 7.0, 5.0, 4.0, 0.0, 1.0, 3.0], "bins": [-28.421875, -27.567626953125, -26.71337890625, -25.859130859375, -25.0048828125, -24.150634765625, -23.29638671875, -22.442138671875, -21.587890625, -20.733642578125, -19.87939453125, -19.025146484375, -18.1708984375, -17.316650390625, -16.46240234375, -15.608154296875, -14.75390625, -13.899658203125, -13.04541015625, -12.191162109375, -11.3369140625, -10.482666015625, -9.62841796875, -8.774169921875, -7.919921875, -7.065673828125, -6.21142578125, -5.357177734375, -4.5029296875, -3.648681640625, -2.79443359375, -1.940185546875, -1.0859375, -0.231689453125, 0.62255859375, 1.476806640625, 2.3310546875, 3.185302734375, 4.03955078125, 4.893798828125, 5.748046875, 6.602294921875, 7.45654296875, 8.310791015625, 9.1650390625, 10.019287109375, 10.87353515625, 11.727783203125, 12.58203125, 13.436279296875, 14.29052734375, 15.144775390625, 15.9990234375, 16.853271484375, 17.70751953125, 18.561767578125, 19.416015625, 20.270263671875, 21.12451171875, 21.978759765625, 22.8330078125, 23.687255859375, 24.54150390625, 25.395751953125, 26.25]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 10.0, 3.0, 7.0, 12.0, 13.0, 16.0, 21.0, 19.0, 18.0, 29.0, 25.0, 37.0, 28.0, 33.0, 41.0, 48.0, 39.0, 32.0, 46.0, 40.0, 53.0, 40.0, 48.0, 41.0, 42.0, 32.0, 34.0, 39.0, 25.0, 20.0, 18.0, 19.0, 14.0, 19.0, 11.0, 6.0, 9.0, 6.0, 6.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-15.1953125, -14.7066650390625, -14.218017578125, -13.7293701171875, -13.24072265625, -12.7520751953125, -12.263427734375, -11.7747802734375, -11.2861328125, -10.7974853515625, -10.308837890625, -9.8201904296875, -9.33154296875, -8.8428955078125, -8.354248046875, -7.8656005859375, -7.376953125, -6.8883056640625, -6.399658203125, -5.9110107421875, -5.42236328125, -4.9337158203125, -4.445068359375, -3.9564208984375, -3.4677734375, -2.9791259765625, -2.490478515625, -2.0018310546875, -1.51318359375, -1.0245361328125, -0.535888671875, -0.0472412109375, 0.44140625, 0.9300537109375, 1.418701171875, 1.9073486328125, 2.39599609375, 2.8846435546875, 3.373291015625, 3.8619384765625, 4.3505859375, 4.8392333984375, 5.327880859375, 5.8165283203125, 6.30517578125, 6.7938232421875, 7.282470703125, 7.7711181640625, 8.259765625, 8.7484130859375, 9.237060546875, 9.7257080078125, 10.21435546875, 10.7030029296875, 11.191650390625, 11.6802978515625, 12.1689453125, 12.6575927734375, 13.146240234375, 13.6348876953125, 14.12353515625, 14.6121826171875, 15.100830078125, 15.5894775390625, 16.078125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 4.0, 1.0, 4.0, 5.0, 9.0, 21.0, 28.0, 35.0, 59.0, 73.0, 97.0, 190.0, 232.0, 330.0, 534.0, 828.0, 1427.0, 2299.0, 4072.0, 7399.0, 15171.0, 33170.0, 81085.0, 199448.0, 328346.0, 215336.0, 87728.0, 35572.0, 16185.0, 8062.0, 4261.0, 2454.0, 1506.0, 907.0, 613.0, 339.0, 248.0, 151.0, 106.0, 68.0, 34.0, 44.0, 20.0, 11.0, 18.0, 16.0, 4.0, 5.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-26.921875, -25.978759765625, -25.03564453125, -24.092529296875, -23.1494140625, -22.206298828125, -21.26318359375, -20.320068359375, -19.376953125, -18.433837890625, -17.49072265625, -16.547607421875, -15.6044921875, -14.661376953125, -13.71826171875, -12.775146484375, -11.83203125, -10.888916015625, -9.94580078125, -9.002685546875, -8.0595703125, -7.116455078125, -6.17333984375, -5.230224609375, -4.287109375, -3.343994140625, -2.40087890625, -1.457763671875, -0.5146484375, 0.428466796875, 1.37158203125, 2.314697265625, 3.2578125, 4.200927734375, 5.14404296875, 6.087158203125, 7.0302734375, 7.973388671875, 8.91650390625, 9.859619140625, 10.802734375, 11.745849609375, 12.68896484375, 13.632080078125, 14.5751953125, 15.518310546875, 16.46142578125, 17.404541015625, 18.34765625, 19.290771484375, 20.23388671875, 21.177001953125, 22.1201171875, 23.063232421875, 24.00634765625, 24.949462890625, 25.892578125, 26.835693359375, 27.77880859375, 28.721923828125, 29.6650390625, 30.608154296875, 31.55126953125, 32.494384765625, 33.4375]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 3.0, 3.0, 9.0, 6.0, 13.0, 11.0, 15.0, 18.0, 22.0, 29.0, 38.0, 61.0, 43.0, 56.0, 62.0, 75.0, 81.0, 71.0, 72.0, 70.0, 46.0, 44.0, 29.0, 21.0, 23.0, 13.0, 18.0, 13.0, 10.0, 6.0, 6.0, 3.0, 7.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0018987655639648438, -0.0018338114023208618, -0.0017688572406768799, -0.001703903079032898, -0.001638948917388916, -0.001573994755744934, -0.0015090405941009521, -0.0014440864324569702, -0.0013791322708129883, -0.0013141781091690063, -0.0012492239475250244, -0.0011842697858810425, -0.0011193156242370605, -0.0010543614625930786, -0.0009894073009490967, -0.0009244531393051147, -0.0008594989776611328, -0.0007945448160171509, -0.0007295906543731689, -0.000664636492729187, -0.0005996823310852051, -0.0005347281694412231, -0.0004697740077972412, -0.0004048198461532593, -0.00033986568450927734, -0.0002749115228652954, -0.00020995736122131348, -0.00014500319957733154, -8.004903793334961e-05, -1.5094876289367676e-05, 4.985928535461426e-05, 0.00011481344699859619, 0.00017976760864257812, 0.00024472177028656006, 0.000309675931930542, 0.0003746300935745239, 0.00043958425521850586, 0.0005045384168624878, 0.0005694925785064697, 0.0006344467401504517, 0.0006994009017944336, 0.0007643550634384155, 0.0008293092250823975, 0.0008942633867263794, 0.0009592175483703613, 0.0010241717100143433, 0.0010891258716583252, 0.0011540800333023071, 0.001219034194946289, 0.001283988356590271, 0.001348942518234253, 0.0014138966798782349, 0.0014788508415222168, 0.0015438050031661987, 0.0016087591648101807, 0.0016737133264541626, 0.0017386674880981445, 0.0018036216497421265, 0.0018685758113861084, 0.0019335299730300903, 0.0019984841346740723, 0.002063438296318054, 0.002128392457962036, 0.002193346619606018, 0.00225830078125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 15.0, 10.0, 24.0, 30.0, 45.0, 65.0, 104.0, 144.0, 204.0, 288.0, 411.0, 655.0, 1031.0, 1535.0, 2497.0, 4234.0, 7410.0, 13860.0, 28001.0, 58628.0, 124370.0, 228737.0, 257271.0, 162911.0, 78495.0, 36481.0, 17881.0, 9517.0, 5127.0, 3026.0, 1922.0, 1218.0, 796.0, 525.0, 337.0, 239.0, 161.0, 111.0, 69.0, 55.0, 37.0, 34.0, 15.0, 15.0, 9.0, 3.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-24.59375, -23.852783203125, -23.11181640625, -22.370849609375, -21.6298828125, -20.888916015625, -20.14794921875, -19.406982421875, -18.666015625, -17.925048828125, -17.18408203125, -16.443115234375, -15.7021484375, -14.961181640625, -14.22021484375, -13.479248046875, -12.73828125, -11.997314453125, -11.25634765625, -10.515380859375, -9.7744140625, -9.033447265625, -8.29248046875, -7.551513671875, -6.810546875, -6.069580078125, -5.32861328125, -4.587646484375, -3.8466796875, -3.105712890625, -2.36474609375, -1.623779296875, -0.8828125, -0.141845703125, 0.59912109375, 1.340087890625, 2.0810546875, 2.822021484375, 3.56298828125, 4.303955078125, 5.044921875, 5.785888671875, 6.52685546875, 7.267822265625, 8.0087890625, 8.749755859375, 9.49072265625, 10.231689453125, 10.97265625, 11.713623046875, 12.45458984375, 13.195556640625, 13.9365234375, 14.677490234375, 15.41845703125, 16.159423828125, 16.900390625, 17.641357421875, 18.38232421875, 19.123291015625, 19.8642578125, 20.605224609375, 21.34619140625, 22.087158203125, 22.828125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 4.0, 0.0, 4.0, 7.0, 1.0, 4.0, 5.0, 16.0, 18.0, 18.0, 24.0, 38.0, 44.0, 51.0, 65.0, 67.0, 69.0, 72.0, 74.0, 68.0, 77.0, 59.0, 47.0, 52.0, 37.0, 19.0, 23.0, 9.0, 10.0, 4.0, 7.0, 2.0, 4.0, 5.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.84375, -7.599609375, -7.35546875, -7.111328125, -6.8671875, -6.623046875, -6.37890625, -6.134765625, -5.890625, -5.646484375, -5.40234375, -5.158203125, -4.9140625, -4.669921875, -4.42578125, -4.181640625, -3.9375, -3.693359375, -3.44921875, -3.205078125, -2.9609375, -2.716796875, -2.47265625, -2.228515625, -1.984375, -1.740234375, -1.49609375, -1.251953125, -1.0078125, -0.763671875, -0.51953125, -0.275390625, -0.03125, 0.212890625, 0.45703125, 0.701171875, 0.9453125, 1.189453125, 1.43359375, 1.677734375, 1.921875, 2.166015625, 2.41015625, 2.654296875, 2.8984375, 3.142578125, 3.38671875, 3.630859375, 3.875, 4.119140625, 4.36328125, 4.607421875, 4.8515625, 5.095703125, 5.33984375, 5.583984375, 5.828125, 6.072265625, 6.31640625, 6.560546875, 6.8046875, 7.048828125, 7.29296875, 7.537109375, 7.78125]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 2.0, 1.0, 4.0, 2.0, 11.0, 13.0, 6.0, 18.0, 11.0, 21.0, 21.0, 37.0, 42.0, 45.0, 54.0, 61.0, 37.0, 64.0, 69.0, 62.0, 62.0, 52.0, 55.0, 42.0, 37.0, 37.0, 36.0, 19.0, 20.0, 9.0, 9.0, 8.0, 11.0, 6.0, 5.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-30.54153060913086, -29.627031326293945, -28.71253204345703, -27.798032760620117, -26.883533477783203, -25.969036102294922, -25.054536819458008, -24.140037536621094, -23.22553825378418, -22.311038970947266, -21.39653968811035, -20.482040405273438, -19.567543029785156, -18.65304183959961, -17.738544464111328, -16.824045181274414, -15.9095458984375, -14.995046615600586, -14.080547332763672, -13.166049003601074, -12.25154972076416, -11.337050437927246, -10.422552108764648, -9.508052825927734, -8.59355354309082, -7.679054260253906, -6.76455545425415, -5.8500566482543945, -4.9355573654174805, -4.021058082580566, -3.1065592765808105, -2.1920604705810547, -1.2775592803955078, -0.36306023597717285, 0.5514388084411621, 1.465937852859497, 2.380436897277832, 3.294936180114746, 4.209434986114502, 5.123933792114258, 6.038433074951172, 6.952932357788086, 7.867431163787842, 8.781929969787598, 9.696429252624512, 10.610928535461426, 11.525426864624023, 12.439926147460938, 13.354425430297852, 14.268924713134766, 15.18342399597168, 16.097923278808594, 17.012420654296875, 17.926921844482422, 18.841419219970703, 19.755918502807617, 20.67041778564453, 21.584917068481445, 22.49941635131836, 23.413915634155273, 24.328414916992188, 25.24291229248047, 26.157411575317383, 27.071910858154297, 27.98641014099121]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 5.0, 4.0, 7.0, 7.0, 13.0, 15.0, 15.0, 16.0, 19.0, 16.0, 18.0, 20.0, 24.0, 35.0, 29.0, 22.0, 35.0, 37.0, 32.0, 30.0, 37.0, 41.0, 42.0, 42.0, 31.0, 38.0, 40.0, 43.0, 22.0, 32.0, 24.0, 28.0, 23.0, 27.0, 16.0, 12.0, 11.0, 15.0, 15.0, 11.0, 9.0, 8.0, 8.0, 4.0, 7.0, 4.0, 8.0, 2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-21.380128860473633, -20.699838638305664, -20.019548416137695, -19.339258193969727, -18.658967971801758, -17.97867774963379, -17.298389434814453, -16.618099212646484, -15.9378080368042, -15.25751781463623, -14.577227592468262, -13.89693832397461, -13.21664810180664, -12.536357879638672, -11.856067657470703, -11.175777435302734, -10.495487213134766, -9.815196990966797, -9.134906768798828, -8.45461654663086, -7.774326801300049, -7.09403657913208, -6.4137468338012695, -5.733456611633301, -5.053166389465332, -4.372876167297363, -3.6925861835479736, -3.012296199798584, -2.3320059776306152, -1.6517157554626465, -0.9714260101318359, -0.2911357879638672, 0.38915443420410156, 1.0694445371627808, 1.74973464012146, 2.4300246238708496, 3.1103148460388184, 3.790605068206787, 4.470894813537598, 5.151185035705566, 5.831475257873535, 6.511765480041504, 7.192055702209473, 7.872345447540283, 8.552635192871094, 9.232925415039062, 9.913215637207031, 10.593505859375, 11.273796081542969, 11.954086303710938, 12.634376525878906, 13.314666748046875, 13.994956970214844, 14.675247192382812, 15.355536460876465, 16.03582763671875, 16.71611785888672, 17.396408081054688, 18.076698303222656, 18.756988525390625, 19.437278747558594, 20.117568969726562, 20.79785919189453, 21.4781494140625, 22.158437728881836]}, "gradients/decoder.bert.encoder.layer.18.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 8.0, 13.0, 15.0, 27.0, 47.0, 81.0, 125.0, 180.0, 304.0, 497.0, 809.0, 1332.0, 2214.0, 3590.0, 6102.0, 10400.0, 18062.0, 33305.0, 62867.0, 127469.0, 296389.0, 747645.0, 1287171.0, 915094.0, 370714.0, 151622.0, 72225.0, 37897.0, 20423.0, 11429.0, 6597.0, 3805.0, 2256.0, 1368.0, 829.0, 515.0, 323.0, 185.0, 125.0, 88.0, 44.0, 37.0, 24.0, 8.0, 14.0, 4.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 3.0], "bins": [-30.375, -29.44384765625, -28.5126953125, -27.58154296875, -26.650390625, -25.71923828125, -24.7880859375, -23.85693359375, -22.92578125, -21.99462890625, -21.0634765625, -20.13232421875, -19.201171875, -18.27001953125, -17.3388671875, -16.40771484375, -15.4765625, -14.54541015625, -13.6142578125, -12.68310546875, -11.751953125, -10.82080078125, -9.8896484375, -8.95849609375, -8.02734375, -7.09619140625, -6.1650390625, -5.23388671875, -4.302734375, -3.37158203125, -2.4404296875, -1.50927734375, -0.578125, 0.35302734375, 1.2841796875, 2.21533203125, 3.146484375, 4.07763671875, 5.0087890625, 5.93994140625, 6.87109375, 7.80224609375, 8.7333984375, 9.66455078125, 10.595703125, 11.52685546875, 12.4580078125, 13.38916015625, 14.3203125, 15.25146484375, 16.1826171875, 17.11376953125, 18.044921875, 18.97607421875, 19.9072265625, 20.83837890625, 21.76953125, 22.70068359375, 23.6318359375, 24.56298828125, 25.494140625, 26.42529296875, 27.3564453125, 28.28759765625, 29.21875]}, "gradients/decoder.bert.encoder.layer.18.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 3.0, 5.0, 7.0, 12.0, 6.0, 11.0, 17.0, 4.0, 17.0, 18.0, 18.0, 23.0, 17.0, 26.0, 30.0, 31.0, 38.0, 29.0, 32.0, 35.0, 40.0, 38.0, 35.0, 34.0, 39.0, 37.0, 45.0, 41.0, 29.0, 30.0, 30.0, 17.0, 36.0, 23.0, 21.0, 22.0, 10.0, 12.0, 16.0, 11.0, 9.0, 6.0, 7.0, 6.0, 7.0, 10.0, 3.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-15.046875, -14.593505859375, -14.14013671875, -13.686767578125, -13.2333984375, -12.780029296875, -12.32666015625, -11.873291015625, -11.419921875, -10.966552734375, -10.51318359375, -10.059814453125, -9.6064453125, -9.153076171875, -8.69970703125, -8.246337890625, -7.79296875, -7.339599609375, -6.88623046875, -6.432861328125, -5.9794921875, -5.526123046875, -5.07275390625, -4.619384765625, -4.166015625, -3.712646484375, -3.25927734375, -2.805908203125, -2.3525390625, -1.899169921875, -1.44580078125, -0.992431640625, -0.5390625, -0.085693359375, 0.36767578125, 0.821044921875, 1.2744140625, 1.727783203125, 2.18115234375, 2.634521484375, 3.087890625, 3.541259765625, 3.99462890625, 4.447998046875, 4.9013671875, 5.354736328125, 5.80810546875, 6.261474609375, 6.71484375, 7.168212890625, 7.62158203125, 8.074951171875, 8.5283203125, 8.981689453125, 9.43505859375, 9.888427734375, 10.341796875, 10.795166015625, 11.24853515625, 11.701904296875, 12.1552734375, 12.608642578125, 13.06201171875, 13.515380859375, 13.96875]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 5.0, 14.0, 7.0, 29.0, 43.0, 59.0, 81.0, 141.0, 187.0, 326.0, 527.0, 826.0, 1407.0, 2393.0, 4096.0, 7037.0, 12258.0, 22276.0, 40195.0, 75436.0, 145883.0, 291993.0, 593150.0, 1029057.0, 941153.0, 505559.0, 249119.0, 125115.0, 65405.0, 34923.0, 19357.0, 10768.0, 6219.0, 3561.0, 2130.0, 1277.0, 824.0, 513.0, 325.0, 188.0, 136.0, 94.0, 68.0, 46.0, 28.0, 18.0, 9.0, 11.0, 5.0, 5.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.96875, -24.13330078125, -23.2978515625, -22.46240234375, -21.626953125, -20.79150390625, -19.9560546875, -19.12060546875, -18.28515625, -17.44970703125, -16.6142578125, -15.77880859375, -14.943359375, -14.10791015625, -13.2724609375, -12.43701171875, -11.6015625, -10.76611328125, -9.9306640625, -9.09521484375, -8.259765625, -7.42431640625, -6.5888671875, -5.75341796875, -4.91796875, -4.08251953125, -3.2470703125, -2.41162109375, -1.576171875, -0.74072265625, 0.0947265625, 0.93017578125, 1.765625, 2.60107421875, 3.4365234375, 4.27197265625, 5.107421875, 5.94287109375, 6.7783203125, 7.61376953125, 8.44921875, 9.28466796875, 10.1201171875, 10.95556640625, 11.791015625, 12.62646484375, 13.4619140625, 14.29736328125, 15.1328125, 15.96826171875, 16.8037109375, 17.63916015625, 18.474609375, 19.31005859375, 20.1455078125, 20.98095703125, 21.81640625, 22.65185546875, 23.4873046875, 24.32275390625, 25.158203125, 25.99365234375, 26.8291015625, 27.66455078125, 28.5]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 7.0, 2.0, 5.0, 4.0, 9.0, 9.0, 9.0, 18.0, 21.0, 27.0, 41.0, 41.0, 48.0, 58.0, 90.0, 94.0, 115.0, 122.0, 135.0, 182.0, 218.0, 276.0, 300.0, 283.0, 309.0, 288.0, 248.0, 209.0, 158.0, 152.0, 126.0, 109.0, 64.0, 71.0, 53.0, 30.0, 40.0, 26.0, 19.0, 24.0, 9.0, 11.0, 9.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0], "bins": [-9.8125, -9.528564453125, -9.24462890625, -8.960693359375, -8.6767578125, -8.392822265625, -8.10888671875, -7.824951171875, -7.541015625, -7.257080078125, -6.97314453125, -6.689208984375, -6.4052734375, -6.121337890625, -5.83740234375, -5.553466796875, -5.26953125, -4.985595703125, -4.70166015625, -4.417724609375, -4.1337890625, -3.849853515625, -3.56591796875, -3.281982421875, -2.998046875, -2.714111328125, -2.43017578125, -2.146240234375, -1.8623046875, -1.578369140625, -1.29443359375, -1.010498046875, -0.7265625, -0.442626953125, -0.15869140625, 0.125244140625, 0.4091796875, 0.693115234375, 0.97705078125, 1.260986328125, 1.544921875, 1.828857421875, 2.11279296875, 2.396728515625, 2.6806640625, 2.964599609375, 3.24853515625, 3.532470703125, 3.81640625, 4.100341796875, 4.38427734375, 4.668212890625, 4.9521484375, 5.236083984375, 5.52001953125, 5.803955078125, 6.087890625, 6.371826171875, 6.65576171875, 6.939697265625, 7.2236328125, 7.507568359375, 7.79150390625, 8.075439453125, 8.359375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 7.0, 3.0, 4.0, 3.0, 6.0, 16.0, 16.0, 14.0, 25.0, 33.0, 36.0, 48.0, 47.0, 69.0, 76.0, 71.0, 85.0, 70.0, 82.0, 54.0, 53.0, 40.0, 39.0, 27.0, 22.0, 18.0, 15.0, 9.0, 7.0, 4.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.57342529296875, -34.563270568847656, -33.5531120300293, -32.5429573059082, -31.53280258178711, -30.522645950317383, -29.512489318847656, -28.502334594726562, -27.492177963256836, -26.48202133178711, -25.471866607666016, -24.46170997619629, -23.451553344726562, -22.44139862060547, -21.431241989135742, -20.421085357666016, -19.410930633544922, -18.400774002075195, -17.3906192779541, -16.380462646484375, -15.370306968688965, -14.360151290893555, -13.349994659423828, -12.339838981628418, -11.329683303833008, -10.319527626037598, -9.309371948242188, -8.299215316772461, -7.289059638977051, -6.278903961181641, -5.268747806549072, -4.258591651916504, -3.248432159423828, -2.238276243209839, -1.2281203269958496, -0.21796441078186035, 0.7921915054321289, 1.802347183227539, 2.8125033378601074, 3.822659492492676, 4.832815170288086, 5.842970848083496, 6.8531270027160645, 7.863283157348633, 8.873438835144043, 9.883594512939453, 10.89375114440918, 11.90390682220459, 12.9140625, 13.92421817779541, 14.93437385559082, 15.944530487060547, 16.95468521118164, 17.964841842651367, 18.974998474121094, 19.985153198242188, 20.995309829711914, 22.00546646118164, 23.015621185302734, 24.02577781677246, 25.035934448242188, 26.04608917236328, 27.056245803833008, 28.066402435302734, 29.076557159423828]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 3.0, 2.0, 3.0, 2.0, 7.0, 8.0, 10.0, 12.0, 16.0, 8.0, 14.0, 19.0, 16.0, 29.0, 24.0, 21.0, 28.0, 38.0, 42.0, 32.0, 32.0, 51.0, 43.0, 40.0, 33.0, 35.0, 40.0, 39.0, 52.0, 36.0, 33.0, 19.0, 23.0, 24.0, 18.0, 19.0, 20.0, 18.0, 20.0, 18.0, 11.0, 14.0, 9.0, 4.0, 4.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-20.64584732055664, -20.00339698791504, -19.360946655273438, -18.71849822998047, -18.076047897338867, -17.433597564697266, -16.791149139404297, -16.148698806762695, -15.506248474121094, -14.863798141479492, -14.221348762512207, -13.578899383544922, -12.93644905090332, -12.293998718261719, -11.651549339294434, -11.009099960327148, -10.366649627685547, -9.724199295043945, -9.08174991607666, -8.439300537109375, -7.796850204467773, -7.15440034866333, -6.511950492858887, -5.869500637054443, -5.22705078125, -4.584600925445557, -3.9421510696411133, -3.29970121383667, -2.6572513580322266, -2.014801502227783, -1.3723516464233398, -0.7299017906188965, -0.08745193481445312, 0.5549979209899902, 1.1974477767944336, 1.839897632598877, 2.4823474884033203, 3.1247973442077637, 3.767247200012207, 4.40969705581665, 5.052146911621094, 5.694596767425537, 6.3370466232299805, 6.979496479034424, 7.621946334838867, 8.264396667480469, 8.906846046447754, 9.549295425415039, 10.19174575805664, 10.834196090698242, 11.476645469665527, 12.119094848632812, 12.761545181274414, 13.403995513916016, 14.0464448928833, 14.688894271850586, 15.331344604492188, 15.973794937133789, 16.61624526977539, 17.25869369506836, 17.90114402770996, 18.543594360351562, 19.18604278564453, 19.828493118286133, 20.470943450927734]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 6.0, 5.0, 13.0, 10.0, 21.0, 17.0, 42.0, 46.0, 83.0, 91.0, 188.0, 241.0, 349.0, 553.0, 775.0, 1239.0, 1865.0, 3104.0, 4937.0, 8022.0, 13539.0, 23809.0, 44951.0, 87947.0, 173445.0, 260211.0, 199595.0, 103846.0, 52240.0, 27816.0, 15416.0, 9000.0, 5564.0, 3292.0, 2139.0, 1379.0, 943.0, 586.0, 385.0, 278.0, 184.0, 112.0, 86.0, 46.0, 41.0, 30.0, 25.0, 20.0, 5.0, 7.0, 7.0, 5.0, 3.0, 1.0, 2.0, 0.0, 2.0], "bins": [-29.1875, -28.292724609375, -27.39794921875, -26.503173828125, -25.6083984375, -24.713623046875, -23.81884765625, -22.924072265625, -22.029296875, -21.134521484375, -20.23974609375, -19.344970703125, -18.4501953125, -17.555419921875, -16.66064453125, -15.765869140625, -14.87109375, -13.976318359375, -13.08154296875, -12.186767578125, -11.2919921875, -10.397216796875, -9.50244140625, -8.607666015625, -7.712890625, -6.818115234375, -5.92333984375, -5.028564453125, -4.1337890625, -3.239013671875, -2.34423828125, -1.449462890625, -0.5546875, 0.340087890625, 1.23486328125, 2.129638671875, 3.0244140625, 3.919189453125, 4.81396484375, 5.708740234375, 6.603515625, 7.498291015625, 8.39306640625, 9.287841796875, 10.1826171875, 11.077392578125, 11.97216796875, 12.866943359375, 13.76171875, 14.656494140625, 15.55126953125, 16.446044921875, 17.3408203125, 18.235595703125, 19.13037109375, 20.025146484375, 20.919921875, 21.814697265625, 22.70947265625, 23.604248046875, 24.4990234375, 25.393798828125, 26.28857421875, 27.183349609375, 28.078125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 5.0, 6.0, 3.0, 4.0, 8.0, 1.0, 8.0, 15.0, 16.0, 15.0, 29.0, 24.0, 27.0, 23.0, 36.0, 35.0, 39.0, 25.0, 42.0, 34.0, 58.0, 46.0, 34.0, 59.0, 39.0, 52.0, 49.0, 33.0, 27.0, 33.0, 26.0, 20.0, 28.0, 9.0, 17.0, 19.0, 17.0, 8.0, 12.0, 3.0, 6.0, 4.0, 2.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.375, -21.67138671875, -20.9677734375, -20.26416015625, -19.560546875, -18.85693359375, -18.1533203125, -17.44970703125, -16.74609375, -16.04248046875, -15.3388671875, -14.63525390625, -13.931640625, -13.22802734375, -12.5244140625, -11.82080078125, -11.1171875, -10.41357421875, -9.7099609375, -9.00634765625, -8.302734375, -7.59912109375, -6.8955078125, -6.19189453125, -5.48828125, -4.78466796875, -4.0810546875, -3.37744140625, -2.673828125, -1.97021484375, -1.2666015625, -0.56298828125, 0.140625, 0.84423828125, 1.5478515625, 2.25146484375, 2.955078125, 3.65869140625, 4.3623046875, 5.06591796875, 5.76953125, 6.47314453125, 7.1767578125, 7.88037109375, 8.583984375, 9.28759765625, 9.9912109375, 10.69482421875, 11.3984375, 12.10205078125, 12.8056640625, 13.50927734375, 14.212890625, 14.91650390625, 15.6201171875, 16.32373046875, 17.02734375, 17.73095703125, 18.4345703125, 19.13818359375, 19.841796875, 20.54541015625, 21.2490234375, 21.95263671875, 22.65625]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 2.0, 7.0, 4.0, 10.0, 18.0, 23.0, 17.0, 29.0, 28.0, 51.0, 75.0, 112.0, 151.0, 231.0, 305.0, 498.0, 720.0, 1099.0, 1665.0, 2764.0, 4615.0, 8312.0, 16142.0, 35204.0, 90886.0, 262570.0, 370165.0, 149504.0, 54028.0, 22750.0, 10966.0, 6015.0, 3427.0, 2110.0, 1363.0, 836.0, 565.0, 389.0, 276.0, 181.0, 137.0, 92.0, 58.0, 40.0, 35.0, 20.0, 21.0, 11.0, 13.0, 8.0, 10.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.625, -36.337890625, -35.05078125, -33.763671875, -32.4765625, -31.189453125, -29.90234375, -28.615234375, -27.328125, -26.041015625, -24.75390625, -23.466796875, -22.1796875, -20.892578125, -19.60546875, -18.318359375, -17.03125, -15.744140625, -14.45703125, -13.169921875, -11.8828125, -10.595703125, -9.30859375, -8.021484375, -6.734375, -5.447265625, -4.16015625, -2.873046875, -1.5859375, -0.298828125, 0.98828125, 2.275390625, 3.5625, 4.849609375, 6.13671875, 7.423828125, 8.7109375, 9.998046875, 11.28515625, 12.572265625, 13.859375, 15.146484375, 16.43359375, 17.720703125, 19.0078125, 20.294921875, 21.58203125, 22.869140625, 24.15625, 25.443359375, 26.73046875, 28.017578125, 29.3046875, 30.591796875, 31.87890625, 33.166015625, 34.453125, 35.740234375, 37.02734375, 38.314453125, 39.6015625, 40.888671875, 42.17578125, 43.462890625, 44.75]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 5.0, 3.0, 6.0, 7.0, 7.0, 6.0, 13.0, 4.0, 12.0, 14.0, 18.0, 21.0, 15.0, 26.0, 21.0, 22.0, 29.0, 21.0, 43.0, 32.0, 38.0, 26.0, 35.0, 30.0, 40.0, 28.0, 29.0, 25.0, 45.0, 23.0, 32.0, 23.0, 21.0, 26.0, 31.0, 27.0, 24.0, 32.0, 19.0, 17.0, 17.0, 18.0, 14.0, 15.0, 6.0, 5.0, 3.0, 5.0, 3.0, 4.0, 3.0, 8.0, 3.0, 2.0, 4.0, 1.0], "bins": [-10.921875, -10.59521484375, -10.2685546875, -9.94189453125, -9.615234375, -9.28857421875, -8.9619140625, -8.63525390625, -8.30859375, -7.98193359375, -7.6552734375, -7.32861328125, -7.001953125, -6.67529296875, -6.3486328125, -6.02197265625, -5.6953125, -5.36865234375, -5.0419921875, -4.71533203125, -4.388671875, -4.06201171875, -3.7353515625, -3.40869140625, -3.08203125, -2.75537109375, -2.4287109375, -2.10205078125, -1.775390625, -1.44873046875, -1.1220703125, -0.79541015625, -0.46875, -0.14208984375, 0.1845703125, 0.51123046875, 0.837890625, 1.16455078125, 1.4912109375, 1.81787109375, 2.14453125, 2.47119140625, 2.7978515625, 3.12451171875, 3.451171875, 3.77783203125, 4.1044921875, 4.43115234375, 4.7578125, 5.08447265625, 5.4111328125, 5.73779296875, 6.064453125, 6.39111328125, 6.7177734375, 7.04443359375, 7.37109375, 7.69775390625, 8.0244140625, 8.35107421875, 8.677734375, 9.00439453125, 9.3310546875, 9.65771484375, 9.984375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 5.0, 10.0, 11.0, 10.0, 20.0, 24.0, 31.0, 49.0, 75.0, 103.0, 166.0, 214.0, 327.0, 473.0, 747.0, 1063.0, 1727.0, 2801.0, 4450.0, 7558.0, 13695.0, 26917.0, 59508.0, 152028.0, 358886.0, 244497.0, 90704.0, 38305.0, 18526.0, 10080.0, 5664.0, 3469.0, 2175.0, 1419.0, 881.0, 584.0, 432.0, 265.0, 200.0, 142.0, 93.0, 65.0, 62.0, 31.0, 20.0, 12.0, 16.0, 11.0, 6.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-13.53125, -13.117919921875, -12.70458984375, -12.291259765625, -11.8779296875, -11.464599609375, -11.05126953125, -10.637939453125, -10.224609375, -9.811279296875, -9.39794921875, -8.984619140625, -8.5712890625, -8.157958984375, -7.74462890625, -7.331298828125, -6.91796875, -6.504638671875, -6.09130859375, -5.677978515625, -5.2646484375, -4.851318359375, -4.43798828125, -4.024658203125, -3.611328125, -3.197998046875, -2.78466796875, -2.371337890625, -1.9580078125, -1.544677734375, -1.13134765625, -0.718017578125, -0.3046875, 0.108642578125, 0.52197265625, 0.935302734375, 1.3486328125, 1.761962890625, 2.17529296875, 2.588623046875, 3.001953125, 3.415283203125, 3.82861328125, 4.241943359375, 4.6552734375, 5.068603515625, 5.48193359375, 5.895263671875, 6.30859375, 6.721923828125, 7.13525390625, 7.548583984375, 7.9619140625, 8.375244140625, 8.78857421875, 9.201904296875, 9.615234375, 10.028564453125, 10.44189453125, 10.855224609375, 11.2685546875, 11.681884765625, 12.09521484375, 12.508544921875, 12.921875]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 7.0, 4.0, 5.0, 11.0, 13.0, 13.0, 21.0, 36.0, 44.0, 72.0, 86.0, 117.0, 111.0, 106.0, 98.0, 54.0, 49.0, 37.0, 29.0, 15.0, 18.0, 11.0, 13.0, 8.0, 2.0, 6.0, 5.0, 5.0, 2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011739730834960938, -0.001140102744102478, -0.0011062324047088623, -0.0010723620653152466, -0.0010384917259216309, -0.0010046213865280151, -0.0009707510471343994, -0.0009368807077407837, -0.000903010368347168, -0.0008691400289535522, -0.0008352696895599365, -0.0008013993501663208, -0.0007675290107727051, -0.0007336586713790894, -0.0006997883319854736, -0.0006659179925918579, -0.0006320476531982422, -0.0005981773138046265, -0.0005643069744110107, -0.000530436635017395, -0.0004965662956237793, -0.0004626959562301636, -0.00042882561683654785, -0.00039495527744293213, -0.0003610849380493164, -0.0003272145986557007, -0.00029334425926208496, -0.00025947391986846924, -0.00022560358047485352, -0.0001917332410812378, -0.00015786290168762207, -0.00012399256229400635, -9.012222290039062e-05, -5.62518835067749e-05, -2.238154411315918e-05, 1.1488795280456543e-05, 4.5359134674072266e-05, 7.922947406768799e-05, 0.00011309981346130371, 0.00014697015285491943, 0.00018084049224853516, 0.00021471083164215088, 0.0002485811710357666, 0.0002824515104293823, 0.00031632184982299805, 0.00035019218921661377, 0.0003840625286102295, 0.0004179328680038452, 0.00045180320739746094, 0.00048567354679107666, 0.0005195438861846924, 0.0005534142255783081, 0.0005872845649719238, 0.0006211549043655396, 0.0006550252437591553, 0.000688895583152771, 0.0007227659225463867, 0.0007566362619400024, 0.0007905066013336182, 0.0008243769407272339, 0.0008582472801208496, 0.0008921176195144653, 0.0009259879589080811, 0.0009598582983016968, 0.0009937286376953125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 4.0, 11.0, 14.0, 16.0, 13.0, 23.0, 39.0, 51.0, 91.0, 124.0, 152.0, 259.0, 362.0, 501.0, 768.0, 1072.0, 1670.0, 2570.0, 4233.0, 7364.0, 13400.0, 25690.0, 54222.0, 119218.0, 234953.0, 272051.0, 160756.0, 73813.0, 34349.0, 17124.0, 9267.0, 5229.0, 3196.0, 1999.0, 1306.0, 827.0, 562.0, 378.0, 264.0, 198.0, 112.0, 91.0, 67.0, 50.0, 38.0, 24.0, 13.0, 10.0, 9.0, 1.0, 7.0, 4.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-12.1328125, -11.7559814453125, -11.379150390625, -11.0023193359375, -10.62548828125, -10.2486572265625, -9.871826171875, -9.4949951171875, -9.1181640625, -8.7413330078125, -8.364501953125, -7.9876708984375, -7.61083984375, -7.2340087890625, -6.857177734375, -6.4803466796875, -6.103515625, -5.7266845703125, -5.349853515625, -4.9730224609375, -4.59619140625, -4.2193603515625, -3.842529296875, -3.4656982421875, -3.0888671875, -2.7120361328125, -2.335205078125, -1.9583740234375, -1.58154296875, -1.2047119140625, -0.827880859375, -0.4510498046875, -0.07421875, 0.3026123046875, 0.679443359375, 1.0562744140625, 1.43310546875, 1.8099365234375, 2.186767578125, 2.5635986328125, 2.9404296875, 3.3172607421875, 3.694091796875, 4.0709228515625, 4.44775390625, 4.8245849609375, 5.201416015625, 5.5782470703125, 5.955078125, 6.3319091796875, 6.708740234375, 7.0855712890625, 7.46240234375, 7.8392333984375, 8.216064453125, 8.5928955078125, 8.9697265625, 9.3465576171875, 9.723388671875, 10.1002197265625, 10.47705078125, 10.8538818359375, 11.230712890625, 11.6075439453125, 11.984375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 11.0, 9.0, 10.0, 13.0, 15.0, 14.0, 22.0, 31.0, 34.0, 50.0, 53.0, 59.0, 52.0, 66.0, 59.0, 65.0, 65.0, 53.0, 58.0, 41.0, 46.0, 24.0, 30.0, 19.0, 18.0, 9.0, 11.0, 16.0, 11.0, 5.0, 3.0, 4.0, 3.0, 1.0, 3.0, 1.0, 4.0, 2.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8359375, -2.73370361328125, -2.6314697265625, -2.52923583984375, -2.427001953125, -2.32476806640625, -2.2225341796875, -2.12030029296875, -2.01806640625, -1.91583251953125, -1.8135986328125, -1.71136474609375, -1.609130859375, -1.50689697265625, -1.4046630859375, -1.30242919921875, -1.2001953125, -1.09796142578125, -0.9957275390625, -0.89349365234375, -0.791259765625, -0.68902587890625, -0.5867919921875, -0.48455810546875, -0.38232421875, -0.28009033203125, -0.1778564453125, -0.07562255859375, 0.026611328125, 0.12884521484375, 0.2310791015625, 0.33331298828125, 0.435546875, 0.53778076171875, 0.6400146484375, 0.74224853515625, 0.844482421875, 0.94671630859375, 1.0489501953125, 1.15118408203125, 1.25341796875, 1.35565185546875, 1.4578857421875, 1.56011962890625, 1.662353515625, 1.76458740234375, 1.8668212890625, 1.96905517578125, 2.0712890625, 2.17352294921875, 2.2757568359375, 2.37799072265625, 2.480224609375, 2.58245849609375, 2.6846923828125, 2.78692626953125, 2.88916015625, 2.99139404296875, 3.0936279296875, 3.19586181640625, 3.298095703125, 3.40032958984375, 3.5025634765625, 3.60479736328125, 3.70703125]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 5.0, 2.0, 3.0, 9.0, 9.0, 5.0, 14.0, 13.0, 31.0, 40.0, 49.0, 34.0, 61.0, 73.0, 93.0, 87.0, 80.0, 73.0, 70.0, 59.0, 50.0, 29.0, 33.0, 24.0, 21.0, 14.0, 9.0, 4.0, 4.0, 5.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.513336181640625, -39.43730163574219, -38.36126708984375, -37.28523635864258, -36.20920181274414, -35.1331672668457, -34.05713653564453, -32.981101989746094, -31.905067443847656, -30.82903289794922, -29.753000259399414, -28.67696762084961, -27.600933074951172, -26.524898529052734, -25.44886589050293, -24.372833251953125, -23.296798706054688, -22.22076416015625, -21.144731521606445, -20.06869888305664, -18.992664337158203, -17.916629791259766, -16.84059715270996, -15.76456356048584, -14.688529968261719, -13.612496376037598, -12.536462783813477, -11.460429191589355, -10.384395599365234, -9.308362007141113, -8.232328414916992, -7.156294822692871, -6.080257415771484, -5.004223823547363, -3.928190231323242, -2.852156639099121, -1.776123046875, -0.7000894546508789, 0.3759441375732422, 1.4519777297973633, 2.5280113220214844, 3.6040449142456055, 4.680078506469727, 5.756112098693848, 6.832145690917969, 7.90817928314209, 8.984212875366211, 10.060246467590332, 11.136280059814453, 12.212313652038574, 13.288347244262695, 14.364380836486816, 15.440414428710938, 16.516448974609375, 17.59248161315918, 18.668514251708984, 19.744548797607422, 20.82058334350586, 21.896615982055664, 22.97264862060547, 24.048683166503906, 25.124717712402344, 26.20075035095215, 27.276782989501953, 28.35281753540039]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 2.0, 3.0, 4.0, 1.0, 3.0, 2.0, 12.0, 8.0, 15.0, 10.0, 14.0, 8.0, 18.0, 18.0, 20.0, 29.0, 27.0, 32.0, 28.0, 33.0, 38.0, 31.0, 39.0, 54.0, 48.0, 33.0, 41.0, 31.0, 41.0, 49.0, 39.0, 35.0, 28.0, 21.0, 24.0, 19.0, 15.0, 25.0, 18.0, 16.0, 17.0, 11.0, 13.0, 6.0, 8.0, 5.0, 5.0, 4.0, 1.0, 3.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-20.40717124938965, -19.779266357421875, -19.15135955810547, -18.523454666137695, -17.895549774169922, -17.267642974853516, -16.639738082885742, -16.01183319091797, -15.383927345275879, -14.756021499633789, -14.128116607666016, -13.500210762023926, -12.872304916381836, -12.244400024414062, -11.616494178771973, -10.988588333129883, -10.36068344116211, -9.73277759552002, -9.104872703552246, -8.476966857910156, -7.849061489105225, -7.221156120300293, -6.593250274658203, -5.9653449058532715, -5.33743953704834, -4.709534168243408, -4.081628799438477, -3.4537229537963867, -2.825817584991455, -2.1979122161865234, -1.5700066089630127, -0.942101001739502, -0.3141975402832031, 0.31370794773101807, 0.9416134357452393, 1.5695189237594604, 2.1974244117736816, 2.8253297805786133, 3.453235387802124, 4.081140995025635, 4.709046363830566, 5.336951732635498, 5.96485710144043, 6.5927629470825195, 7.220668315887451, 7.848573684692383, 8.476479530334473, 9.104385375976562, 9.732290267944336, 10.360196113586426, 10.9881010055542, 11.616006851196289, 12.243911743164062, 12.871817588806152, 13.499723434448242, 14.127628326416016, 14.755534172058105, 15.383440017700195, 16.01134490966797, 16.639249801635742, 17.26715660095215, 17.895061492919922, 18.522966384887695, 19.1508731842041, 19.778778076171875]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 4.0, 4.0, 4.0, 16.0, 20.0, 32.0, 28.0, 46.0, 77.0, 113.0, 175.0, 243.0, 429.0, 647.0, 977.0, 1543.0, 2396.0, 3931.0, 6232.0, 10146.0, 16175.0, 27403.0, 45848.0, 76744.0, 123715.0, 172745.0, 182832.0, 142887.0, 92821.0, 55655.0, 32676.0, 19908.0, 12131.0, 7456.0, 4555.0, 2893.0, 1793.0, 1184.0, 725.0, 501.0, 318.0, 179.0, 105.0, 85.0, 61.0, 47.0, 24.0, 11.0, 13.0, 7.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.6875, -26.73876953125, -25.7900390625, -24.84130859375, -23.892578125, -22.94384765625, -21.9951171875, -21.04638671875, -20.09765625, -19.14892578125, -18.2001953125, -17.25146484375, -16.302734375, -15.35400390625, -14.4052734375, -13.45654296875, -12.5078125, -11.55908203125, -10.6103515625, -9.66162109375, -8.712890625, -7.76416015625, -6.8154296875, -5.86669921875, -4.91796875, -3.96923828125, -3.0205078125, -2.07177734375, -1.123046875, -0.17431640625, 0.7744140625, 1.72314453125, 2.671875, 3.62060546875, 4.5693359375, 5.51806640625, 6.466796875, 7.41552734375, 8.3642578125, 9.31298828125, 10.26171875, 11.21044921875, 12.1591796875, 13.10791015625, 14.056640625, 15.00537109375, 15.9541015625, 16.90283203125, 17.8515625, 18.80029296875, 19.7490234375, 20.69775390625, 21.646484375, 22.59521484375, 23.5439453125, 24.49267578125, 25.44140625, 26.39013671875, 27.3388671875, 28.28759765625, 29.236328125, 30.18505859375, 31.1337890625, 32.08251953125, 33.03125]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 5.0, 8.0, 11.0, 4.0, 9.0, 12.0, 11.0, 17.0, 19.0, 22.0, 23.0, 23.0, 31.0, 30.0, 42.0, 37.0, 38.0, 33.0, 39.0, 43.0, 43.0, 32.0, 43.0, 44.0, 49.0, 35.0, 31.0, 32.0, 22.0, 37.0, 18.0, 17.0, 23.0, 14.0, 12.0, 16.0, 16.0, 16.0, 11.0, 9.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-18.578125, -17.97802734375, -17.3779296875, -16.77783203125, -16.177734375, -15.57763671875, -14.9775390625, -14.37744140625, -13.77734375, -13.17724609375, -12.5771484375, -11.97705078125, -11.376953125, -10.77685546875, -10.1767578125, -9.57666015625, -8.9765625, -8.37646484375, -7.7763671875, -7.17626953125, -6.576171875, -5.97607421875, -5.3759765625, -4.77587890625, -4.17578125, -3.57568359375, -2.9755859375, -2.37548828125, -1.775390625, -1.17529296875, -0.5751953125, 0.02490234375, 0.625, 1.22509765625, 1.8251953125, 2.42529296875, 3.025390625, 3.62548828125, 4.2255859375, 4.82568359375, 5.42578125, 6.02587890625, 6.6259765625, 7.22607421875, 7.826171875, 8.42626953125, 9.0263671875, 9.62646484375, 10.2265625, 10.82666015625, 11.4267578125, 12.02685546875, 12.626953125, 13.22705078125, 13.8271484375, 14.42724609375, 15.02734375, 15.62744140625, 16.2275390625, 16.82763671875, 17.427734375, 18.02783203125, 18.6279296875, 19.22802734375, 19.828125]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 10.0, 13.0, 12.0, 20.0, 34.0, 66.0, 72.0, 118.0, 179.0, 231.0, 370.0, 583.0, 871.0, 1276.0, 1920.0, 3077.0, 4805.0, 7528.0, 11822.0, 19135.0, 31268.0, 49780.0, 77373.0, 115421.0, 151244.0, 162121.0, 137984.0, 98403.0, 63831.0, 40489.0, 25328.0, 15767.0, 9891.0, 6105.0, 3936.0, 2562.0, 1672.0, 1080.0, 669.0, 498.0, 321.0, 210.0, 153.0, 94.0, 82.0, 51.0, 22.0, 20.0, 12.0, 13.0, 9.0, 3.0, 7.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-22.953125, -22.219482421875, -21.48583984375, -20.752197265625, -20.0185546875, -19.284912109375, -18.55126953125, -17.817626953125, -17.083984375, -16.350341796875, -15.61669921875, -14.883056640625, -14.1494140625, -13.415771484375, -12.68212890625, -11.948486328125, -11.21484375, -10.481201171875, -9.74755859375, -9.013916015625, -8.2802734375, -7.546630859375, -6.81298828125, -6.079345703125, -5.345703125, -4.612060546875, -3.87841796875, -3.144775390625, -2.4111328125, -1.677490234375, -0.94384765625, -0.210205078125, 0.5234375, 1.257080078125, 1.99072265625, 2.724365234375, 3.4580078125, 4.191650390625, 4.92529296875, 5.658935546875, 6.392578125, 7.126220703125, 7.85986328125, 8.593505859375, 9.3271484375, 10.060791015625, 10.79443359375, 11.528076171875, 12.26171875, 12.995361328125, 13.72900390625, 14.462646484375, 15.1962890625, 15.929931640625, 16.66357421875, 17.397216796875, 18.130859375, 18.864501953125, 19.59814453125, 20.331787109375, 21.0654296875, 21.799072265625, 22.53271484375, 23.266357421875, 24.0]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 9.0, 11.0, 15.0, 10.0, 17.0, 19.0, 21.0, 19.0, 32.0, 31.0, 32.0, 38.0, 41.0, 43.0, 43.0, 50.0, 48.0, 48.0, 50.0, 48.0, 41.0, 41.0, 38.0, 39.0, 34.0, 37.0, 29.0, 11.0, 18.0, 16.0, 20.0, 13.0, 7.0, 5.0, 9.0, 7.0, 1.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6484375, -10.2254638671875, -9.802490234375, -9.3795166015625, -8.95654296875, -8.5335693359375, -8.110595703125, -7.6876220703125, -7.2646484375, -6.8416748046875, -6.418701171875, -5.9957275390625, -5.57275390625, -5.1497802734375, -4.726806640625, -4.3038330078125, -3.880859375, -3.4578857421875, -3.034912109375, -2.6119384765625, -2.18896484375, -1.7659912109375, -1.343017578125, -0.9200439453125, -0.4970703125, -0.0740966796875, 0.348876953125, 0.7718505859375, 1.19482421875, 1.6177978515625, 2.040771484375, 2.4637451171875, 2.88671875, 3.3096923828125, 3.732666015625, 4.1556396484375, 4.57861328125, 5.0015869140625, 5.424560546875, 5.8475341796875, 6.2705078125, 6.6934814453125, 7.116455078125, 7.5394287109375, 7.96240234375, 8.3853759765625, 8.808349609375, 9.2313232421875, 9.654296875, 10.0772705078125, 10.500244140625, 10.9232177734375, 11.34619140625, 11.7691650390625, 12.192138671875, 12.6151123046875, 13.0380859375, 13.4610595703125, 13.884033203125, 14.3070068359375, 14.72998046875, 15.1529541015625, 15.575927734375, 15.9989013671875, 16.421875]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 2.0, 7.0, 4.0, 5.0, 9.0, 20.0, 25.0, 35.0, 52.0, 69.0, 104.0, 147.0, 234.0, 352.0, 525.0, 812.0, 1383.0, 2230.0, 3573.0, 6153.0, 10407.0, 19143.0, 37192.0, 77164.0, 160943.0, 264611.0, 226710.0, 117714.0, 55671.0, 27557.0, 14873.0, 8194.0, 4789.0, 2904.0, 1729.0, 1145.0, 664.0, 456.0, 296.0, 203.0, 149.0, 106.0, 60.0, 51.0, 34.0, 13.0, 16.0, 13.0, 7.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-23.53125, -22.834716796875, -22.13818359375, -21.441650390625, -20.7451171875, -20.048583984375, -19.35205078125, -18.655517578125, -17.958984375, -17.262451171875, -16.56591796875, -15.869384765625, -15.1728515625, -14.476318359375, -13.77978515625, -13.083251953125, -12.38671875, -11.690185546875, -10.99365234375, -10.297119140625, -9.6005859375, -8.904052734375, -8.20751953125, -7.510986328125, -6.814453125, -6.117919921875, -5.42138671875, -4.724853515625, -4.0283203125, -3.331787109375, -2.63525390625, -1.938720703125, -1.2421875, -0.545654296875, 0.15087890625, 0.847412109375, 1.5439453125, 2.240478515625, 2.93701171875, 3.633544921875, 4.330078125, 5.026611328125, 5.72314453125, 6.419677734375, 7.1162109375, 7.812744140625, 8.50927734375, 9.205810546875, 9.90234375, 10.598876953125, 11.29541015625, 11.991943359375, 12.6884765625, 13.385009765625, 14.08154296875, 14.778076171875, 15.474609375, 16.171142578125, 16.86767578125, 17.564208984375, 18.2607421875, 18.957275390625, 19.65380859375, 20.350341796875, 21.046875]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 2.0, 10.0, 6.0, 5.0, 13.0, 12.0, 16.0, 16.0, 24.0, 42.0, 52.0, 60.0, 79.0, 85.0, 101.0, 93.0, 86.0, 65.0, 53.0, 52.0, 30.0, 29.0, 24.0, 15.0, 7.0, 5.0, 5.0, 5.0, 5.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00269317626953125, -0.0026217252016067505, -0.002550274133682251, -0.0024788230657577515, -0.002407371997833252, -0.0023359209299087524, -0.002264469861984253, -0.0021930187940597534, -0.002121567726135254, -0.0020501166582107544, -0.001978665590286255, -0.0019072145223617554, -0.0018357634544372559, -0.0017643123865127563, -0.0016928613185882568, -0.0016214102506637573, -0.0015499591827392578, -0.0014785081148147583, -0.0014070570468902588, -0.0013356059789657593, -0.0012641549110412598, -0.0011927038431167603, -0.0011212527751922607, -0.0010498017072677612, -0.0009783506393432617, -0.0009068995714187622, -0.0008354485034942627, -0.0007639974355697632, -0.0006925463676452637, -0.0006210952997207642, -0.0005496442317962646, -0.00047819316387176514, -0.0004067420959472656, -0.0003352910280227661, -0.0002638399600982666, -0.0001923888921737671, -0.00012093782424926758, -4.9486756324768066e-05, 2.1964311599731445e-05, 9.341537952423096e-05, 0.00016486644744873047, 0.00023631751537322998, 0.0003077685832977295, 0.000379219651222229, 0.0004506707191467285, 0.000522121787071228, 0.0005935728549957275, 0.000665023922920227, 0.0007364749908447266, 0.0008079260587692261, 0.0008793771266937256, 0.0009508281946182251, 0.0010222792625427246, 0.0010937303304672241, 0.0011651813983917236, 0.0012366324663162231, 0.0013080835342407227, 0.0013795346021652222, 0.0014509856700897217, 0.0015224367380142212, 0.0015938878059387207, 0.0016653388738632202, 0.0017367899417877197, 0.0018082410097122192, 0.0018796920776367188]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 4.0, 11.0, 11.0, 8.0, 16.0, 34.0, 47.0, 55.0, 93.0, 136.0, 191.0, 283.0, 439.0, 702.0, 1083.0, 1669.0, 2775.0, 4676.0, 7957.0, 13626.0, 25774.0, 50356.0, 101901.0, 192673.0, 257301.0, 185043.0, 96316.0, 48224.0, 24604.0, 13307.0, 7433.0, 4434.0, 2781.0, 1601.0, 1015.0, 673.0, 438.0, 267.0, 194.0, 137.0, 77.0, 63.0, 43.0, 22.0, 19.0, 17.0, 8.0, 7.0, 7.0, 3.0, 4.0, 3.0, 2.0, 2.0], "bins": [-21.96875, -21.331298828125, -20.69384765625, -20.056396484375, -19.4189453125, -18.781494140625, -18.14404296875, -17.506591796875, -16.869140625, -16.231689453125, -15.59423828125, -14.956787109375, -14.3193359375, -13.681884765625, -13.04443359375, -12.406982421875, -11.76953125, -11.132080078125, -10.49462890625, -9.857177734375, -9.2197265625, -8.582275390625, -7.94482421875, -7.307373046875, -6.669921875, -6.032470703125, -5.39501953125, -4.757568359375, -4.1201171875, -3.482666015625, -2.84521484375, -2.207763671875, -1.5703125, -0.932861328125, -0.29541015625, 0.342041015625, 0.9794921875, 1.616943359375, 2.25439453125, 2.891845703125, 3.529296875, 4.166748046875, 4.80419921875, 5.441650390625, 6.0791015625, 6.716552734375, 7.35400390625, 7.991455078125, 8.62890625, 9.266357421875, 9.90380859375, 10.541259765625, 11.1787109375, 11.816162109375, 12.45361328125, 13.091064453125, 13.728515625, 14.365966796875, 15.00341796875, 15.640869140625, 16.2783203125, 16.915771484375, 17.55322265625, 18.190673828125, 18.828125]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 0.0, 2.0, 2.0, 5.0, 3.0, 6.0, 5.0, 3.0, 7.0, 13.0, 6.0, 22.0, 13.0, 20.0, 29.0, 23.0, 30.0, 42.0, 53.0, 46.0, 52.0, 80.0, 67.0, 48.0, 67.0, 54.0, 50.0, 55.0, 43.0, 30.0, 27.0, 25.0, 21.0, 9.0, 9.0, 12.0, 9.0, 4.0, 5.0, 5.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.87109375, -6.66668701171875, -6.4622802734375, -6.25787353515625, -6.053466796875, -5.84906005859375, -5.6446533203125, -5.44024658203125, -5.23583984375, -5.03143310546875, -4.8270263671875, -4.62261962890625, -4.418212890625, -4.21380615234375, -4.0093994140625, -3.80499267578125, -3.6005859375, -3.39617919921875, -3.1917724609375, -2.98736572265625, -2.782958984375, -2.57855224609375, -2.3741455078125, -2.16973876953125, -1.96533203125, -1.76092529296875, -1.5565185546875, -1.35211181640625, -1.147705078125, -0.94329833984375, -0.7388916015625, -0.53448486328125, -0.330078125, -0.12567138671875, 0.0787353515625, 0.28314208984375, 0.487548828125, 0.69195556640625, 0.8963623046875, 1.10076904296875, 1.30517578125, 1.50958251953125, 1.7139892578125, 1.91839599609375, 2.122802734375, 2.32720947265625, 2.5316162109375, 2.73602294921875, 2.9404296875, 3.14483642578125, 3.3492431640625, 3.55364990234375, 3.758056640625, 3.96246337890625, 4.1668701171875, 4.37127685546875, 4.57568359375, 4.78009033203125, 4.9844970703125, 5.18890380859375, 5.393310546875, 5.59771728515625, 5.8021240234375, 6.00653076171875, 6.2109375]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 8.0, 2.0, 6.0, 9.0, 10.0, 13.0, 14.0, 18.0, 12.0, 22.0, 46.0, 45.0, 58.0, 63.0, 48.0, 61.0, 65.0, 71.0, 68.0, 69.0, 51.0, 38.0, 48.0, 35.0, 31.0, 20.0, 25.0, 18.0, 8.0, 10.0, 3.0, 0.0, 4.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-32.1630973815918, -31.305805206298828, -30.448514938354492, -29.591222763061523, -28.733930587768555, -27.87664031982422, -27.01934814453125, -26.16205596923828, -25.304763793945312, -24.447471618652344, -23.590181350708008, -22.73288917541504, -21.87559700012207, -21.018306732177734, -20.161014556884766, -19.303722381591797, -18.44643211364746, -17.589139938354492, -16.731849670410156, -15.874557495117188, -15.017265319824219, -14.159974098205566, -13.302682876586914, -12.445390701293945, -11.588099479675293, -10.73080825805664, -9.873516082763672, -9.01622486114502, -8.158933639526367, -7.301641464233398, -6.444350242614746, -5.5870585441589355, -4.729764938354492, -3.8724732398986816, -3.01518177986145, -2.1578903198242188, -1.3005986213684082, -0.44330692291259766, 0.4139842987060547, 1.2712759971618652, 2.128567695617676, 2.9858593940734863, 3.8431508541107178, 4.700442314147949, 5.55773401260376, 6.41502571105957, 7.272316932678223, 8.129608154296875, 8.986900329589844, 9.844191551208496, 10.701483726501465, 11.558774948120117, 12.416067123413086, 13.273358345031738, 14.13064956665039, 14.98794174194336, 15.845232963562012, 16.702524185180664, 17.559816360473633, 18.41710662841797, 19.274398803710938, 20.131690979003906, 20.988983154296875, 21.84627342224121, 22.70356559753418]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 2.0, 5.0, 5.0, 6.0, 7.0, 8.0, 18.0, 8.0, 18.0, 14.0, 17.0, 16.0, 25.0, 23.0, 37.0, 31.0, 44.0, 41.0, 41.0, 40.0, 33.0, 42.0, 36.0, 38.0, 32.0, 32.0, 35.0, 26.0, 29.0, 27.0, 24.0, 26.0, 24.0, 28.0, 23.0, 29.0, 15.0, 16.0, 12.0, 13.0, 9.0, 7.0, 8.0, 4.0, 5.0, 3.0, 5.0, 3.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 1.0], "bins": [-17.78821563720703, -17.234272003173828, -16.680328369140625, -16.126384735107422, -15.572442054748535, -15.018498420715332, -14.464555740356445, -13.910612106323242, -13.356668472290039, -12.802724838256836, -12.248781204223633, -11.694838523864746, -11.140894889831543, -10.58695125579834, -10.033008575439453, -9.47906494140625, -8.925121307373047, -8.371177673339844, -7.817234516143799, -7.263291358947754, -6.709347724914551, -6.155404090881348, -5.601460933685303, -5.047517776489258, -4.493574142456055, -3.9396307468414307, -3.3856873512268066, -2.8317439556121826, -2.2778005599975586, -1.7238571643829346, -1.1699137687683105, -0.6159703731536865, -0.0620269775390625, 0.4919164180755615, 1.0458598136901855, 1.5998032093048096, 2.1537466049194336, 2.7076900005340576, 3.2616333961486816, 3.8155767917633057, 4.36952018737793, 4.923463821411133, 5.477406978607178, 6.031350135803223, 6.585293769836426, 7.139237403869629, 7.693180561065674, 8.247123718261719, 8.801067352294922, 9.355010986328125, 9.908954620361328, 10.462897300720215, 11.016840934753418, 11.570784568786621, 12.124727249145508, 12.678670883178711, 13.232614517211914, 13.786558151245117, 14.34050178527832, 14.894444465637207, 15.44838809967041, 16.002330780029297, 16.5562744140625, 17.110218048095703, 17.664161682128906]}, "gradients/decoder.bert.encoder.layer.17.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 4.0, 6.0, 10.0, 20.0, 21.0, 35.0, 41.0, 82.0, 139.0, 164.0, 237.0, 354.0, 595.0, 874.0, 1330.0, 2048.0, 3266.0, 5453.0, 8833.0, 14703.0, 25698.0, 48105.0, 96546.0, 220211.0, 557134.0, 1167312.0, 1130109.0, 513901.0, 201722.0, 89836.0, 44741.0, 24489.0, 14045.0, 8367.0, 5032.0, 3131.0, 1989.0, 1262.0, 807.0, 571.0, 366.0, 215.0, 159.0, 104.0, 74.0, 43.0, 32.0, 22.0, 18.0, 13.0, 4.0, 7.0, 5.0, 2.0, 3.0, 1.0, 1.0], "bins": [-26.0625, -25.271728515625, -24.48095703125, -23.690185546875, -22.8994140625, -22.108642578125, -21.31787109375, -20.527099609375, -19.736328125, -18.945556640625, -18.15478515625, -17.364013671875, -16.5732421875, -15.782470703125, -14.99169921875, -14.200927734375, -13.41015625, -12.619384765625, -11.82861328125, -11.037841796875, -10.2470703125, -9.456298828125, -8.66552734375, -7.874755859375, -7.083984375, -6.293212890625, -5.50244140625, -4.711669921875, -3.9208984375, -3.130126953125, -2.33935546875, -1.548583984375, -0.7578125, 0.032958984375, 0.82373046875, 1.614501953125, 2.4052734375, 3.196044921875, 3.98681640625, 4.777587890625, 5.568359375, 6.359130859375, 7.14990234375, 7.940673828125, 8.7314453125, 9.522216796875, 10.31298828125, 11.103759765625, 11.89453125, 12.685302734375, 13.47607421875, 14.266845703125, 15.0576171875, 15.848388671875, 16.63916015625, 17.429931640625, 18.220703125, 19.011474609375, 19.80224609375, 20.593017578125, 21.3837890625, 22.174560546875, 22.96533203125, 23.756103515625, 24.546875]}, "gradients/decoder.bert.encoder.layer.17.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 3.0, 4.0, 6.0, 7.0, 9.0, 9.0, 13.0, 16.0, 13.0, 25.0, 20.0, 24.0, 33.0, 32.0, 41.0, 38.0, 40.0, 50.0, 41.0, 54.0, 50.0, 39.0, 36.0, 30.0, 33.0, 34.0, 35.0, 26.0, 31.0, 34.0, 34.0, 20.0, 22.0, 19.0, 15.0, 12.0, 12.0, 5.0, 6.0, 8.0, 5.0, 6.0, 1.0, 3.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.5234375, -13.101318359375, -12.67919921875, -12.257080078125, -11.8349609375, -11.412841796875, -10.99072265625, -10.568603515625, -10.146484375, -9.724365234375, -9.30224609375, -8.880126953125, -8.4580078125, -8.035888671875, -7.61376953125, -7.191650390625, -6.76953125, -6.347412109375, -5.92529296875, -5.503173828125, -5.0810546875, -4.658935546875, -4.23681640625, -3.814697265625, -3.392578125, -2.970458984375, -2.54833984375, -2.126220703125, -1.7041015625, -1.281982421875, -0.85986328125, -0.437744140625, -0.015625, 0.406494140625, 0.82861328125, 1.250732421875, 1.6728515625, 2.094970703125, 2.51708984375, 2.939208984375, 3.361328125, 3.783447265625, 4.20556640625, 4.627685546875, 5.0498046875, 5.471923828125, 5.89404296875, 6.316162109375, 6.73828125, 7.160400390625, 7.58251953125, 8.004638671875, 8.4267578125, 8.848876953125, 9.27099609375, 9.693115234375, 10.115234375, 10.537353515625, 10.95947265625, 11.381591796875, 11.8037109375, 12.225830078125, 12.64794921875, 13.070068359375, 13.4921875]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 0.0, 4.0, 8.0, 9.0, 12.0, 16.0, 29.0, 52.0, 66.0, 115.0, 224.0, 351.0, 606.0, 1023.0, 1796.0, 3257.0, 5905.0, 11205.0, 21617.0, 44142.0, 94207.0, 216346.0, 521327.0, 1134760.0, 1168347.0, 548569.0, 227556.0, 98537.0, 46148.0, 22769.0, 11556.0, 6092.0, 3263.0, 1819.0, 985.0, 615.0, 352.0, 205.0, 130.0, 105.0, 53.0, 30.0, 26.0, 21.0, 16.0, 10.0, 4.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.125, -23.232421875, -22.33984375, -21.447265625, -20.5546875, -19.662109375, -18.76953125, -17.876953125, -16.984375, -16.091796875, -15.19921875, -14.306640625, -13.4140625, -12.521484375, -11.62890625, -10.736328125, -9.84375, -8.951171875, -8.05859375, -7.166015625, -6.2734375, -5.380859375, -4.48828125, -3.595703125, -2.703125, -1.810546875, -0.91796875, -0.025390625, 0.8671875, 1.759765625, 2.65234375, 3.544921875, 4.4375, 5.330078125, 6.22265625, 7.115234375, 8.0078125, 8.900390625, 9.79296875, 10.685546875, 11.578125, 12.470703125, 13.36328125, 14.255859375, 15.1484375, 16.041015625, 16.93359375, 17.826171875, 18.71875, 19.611328125, 20.50390625, 21.396484375, 22.2890625, 23.181640625, 24.07421875, 24.966796875, 25.859375, 26.751953125, 27.64453125, 28.537109375, 29.4296875, 30.322265625, 31.21484375, 32.107421875, 33.0]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 5.0, 4.0, 12.0, 8.0, 9.0, 9.0, 16.0, 12.0, 22.0, 21.0, 30.0, 34.0, 52.0, 68.0, 70.0, 86.0, 117.0, 132.0, 173.0, 230.0, 288.0, 293.0, 329.0, 300.0, 268.0, 241.0, 255.0, 190.0, 160.0, 153.0, 109.0, 91.0, 70.0, 52.0, 37.0, 32.0, 23.0, 21.0, 18.0, 11.0, 10.0, 7.0, 6.0, 1.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.15625, -8.902587890625, -8.64892578125, -8.395263671875, -8.1416015625, -7.887939453125, -7.63427734375, -7.380615234375, -7.126953125, -6.873291015625, -6.61962890625, -6.365966796875, -6.1123046875, -5.858642578125, -5.60498046875, -5.351318359375, -5.09765625, -4.843994140625, -4.59033203125, -4.336669921875, -4.0830078125, -3.829345703125, -3.57568359375, -3.322021484375, -3.068359375, -2.814697265625, -2.56103515625, -2.307373046875, -2.0537109375, -1.800048828125, -1.54638671875, -1.292724609375, -1.0390625, -0.785400390625, -0.53173828125, -0.278076171875, -0.0244140625, 0.229248046875, 0.48291015625, 0.736572265625, 0.990234375, 1.243896484375, 1.49755859375, 1.751220703125, 2.0048828125, 2.258544921875, 2.51220703125, 2.765869140625, 3.01953125, 3.273193359375, 3.52685546875, 3.780517578125, 4.0341796875, 4.287841796875, 4.54150390625, 4.795166015625, 5.048828125, 5.302490234375, 5.55615234375, 5.809814453125, 6.0634765625, 6.317138671875, 6.57080078125, 6.824462890625, 7.078125]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 6.0, 2.0, 10.0, 6.0, 5.0, 14.0, 12.0, 18.0, 24.0, 26.0, 40.0, 41.0, 39.0, 59.0, 60.0, 87.0, 77.0, 60.0, 58.0, 72.0, 59.0, 54.0, 35.0, 36.0, 26.0, 16.0, 17.0, 12.0, 11.0, 6.0, 5.0, 4.0, 7.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-29.712608337402344, -28.87921142578125, -28.04581642150879, -27.212419509887695, -26.379024505615234, -25.54562759399414, -24.712230682373047, -23.878833770751953, -23.045438766479492, -22.2120418548584, -21.378646850585938, -20.545249938964844, -19.71185302734375, -18.87845802307129, -18.045061111450195, -17.211666107177734, -16.37826919555664, -15.544873237609863, -14.711477279663086, -13.878080368041992, -13.044684410095215, -12.211288452148438, -11.377891540527344, -10.544495582580566, -9.711099624633789, -8.877703666687012, -8.044307708740234, -7.210910797119141, -6.377514839172363, -5.544118881225586, -4.71072244644165, -3.877326011657715, -3.0439319610595703, -2.210535764694214, -1.3771395683288574, -0.543743371963501, 0.28965282440185547, 1.1230487823486328, 1.9564452171325684, 2.789841651916504, 3.6232376098632812, 4.456633567810059, 5.290030002593994, 6.12342643737793, 6.956822395324707, 7.790218353271484, 8.623615264892578, 9.457011222839355, 10.290407180786133, 11.12380313873291, 11.957199096679688, 12.790596008300781, 13.623991966247559, 14.457387924194336, 15.29078483581543, 16.12417984008789, 16.957576751708984, 17.790973663330078, 18.62436866760254, 19.457765579223633, 20.291160583496094, 21.124557495117188, 21.95795440673828, 22.791351318359375, 23.624746322631836]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 4.0, 5.0, 7.0, 7.0, 12.0, 10.0, 9.0, 21.0, 18.0, 24.0, 31.0, 28.0, 34.0, 34.0, 37.0, 33.0, 48.0, 35.0, 43.0, 34.0, 40.0, 39.0, 48.0, 37.0, 43.0, 38.0, 29.0, 36.0, 38.0, 20.0, 24.0, 22.0, 30.0, 8.0, 9.0, 9.0, 13.0, 9.0, 9.0, 6.0, 4.0, 4.0, 7.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0], "bins": [-20.108001708984375, -19.531063079833984, -18.954124450683594, -18.377185821533203, -17.800247192382812, -17.223308563232422, -16.64636993408203, -16.06943130493164, -15.49249267578125, -14.91555404663086, -14.338615417480469, -13.761676788330078, -13.184738159179688, -12.607799530029297, -12.030860900878906, -11.453922271728516, -10.876983642578125, -10.300045013427734, -9.723106384277344, -9.146167755126953, -8.569229125976562, -7.992290496826172, -7.415351867675781, -6.838413238525391, -6.261474609375, -5.684535980224609, -5.107597351074219, -4.530658721923828, -3.9537200927734375, -3.376781463623047, -2.7998428344726562, -2.2229042053222656, -1.6459636688232422, -1.0690250396728516, -0.49208641052246094, 0.08485221862792969, 0.6617908477783203, 1.238729476928711, 1.8156681060791016, 2.392606735229492, 2.969545364379883, 3.5464839935302734, 4.123422622680664, 4.700361251831055, 5.277299880981445, 5.854238510131836, 6.431177139282227, 7.008115768432617, 7.585054397583008, 8.161993026733398, 8.738931655883789, 9.31587028503418, 9.89280891418457, 10.469747543334961, 11.046686172485352, 11.623624801635742, 12.200563430786133, 12.777502059936523, 13.354440689086914, 13.931379318237305, 14.508317947387695, 15.085256576538086, 15.662195205688477, 16.239133834838867, 16.816072463989258]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 6.0, 11.0, 7.0, 19.0, 20.0, 24.0, 37.0, 43.0, 92.0, 107.0, 189.0, 240.0, 373.0, 525.0, 824.0, 1223.0, 1852.0, 2842.0, 4515.0, 7333.0, 11935.0, 19965.0, 33961.0, 58546.0, 100311.0, 159969.0, 203569.0, 171763.0, 110043.0, 64046.0, 36835.0, 21892.0, 13018.0, 8066.0, 5043.0, 3268.0, 2022.0, 1358.0, 877.0, 570.0, 402.0, 263.0, 178.0, 121.0, 85.0, 56.0, 43.0, 22.0, 24.0, 16.0, 6.0, 7.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-16.8125, -16.296630859375, -15.78076171875, -15.264892578125, -14.7490234375, -14.233154296875, -13.71728515625, -13.201416015625, -12.685546875, -12.169677734375, -11.65380859375, -11.137939453125, -10.6220703125, -10.106201171875, -9.59033203125, -9.074462890625, -8.55859375, -8.042724609375, -7.52685546875, -7.010986328125, -6.4951171875, -5.979248046875, -5.46337890625, -4.947509765625, -4.431640625, -3.915771484375, -3.39990234375, -2.884033203125, -2.3681640625, -1.852294921875, -1.33642578125, -0.820556640625, -0.3046875, 0.211181640625, 0.72705078125, 1.242919921875, 1.7587890625, 2.274658203125, 2.79052734375, 3.306396484375, 3.822265625, 4.338134765625, 4.85400390625, 5.369873046875, 5.8857421875, 6.401611328125, 6.91748046875, 7.433349609375, 7.94921875, 8.465087890625, 8.98095703125, 9.496826171875, 10.0126953125, 10.528564453125, 11.04443359375, 11.560302734375, 12.076171875, 12.592041015625, 13.10791015625, 13.623779296875, 14.1396484375, 14.655517578125, 15.17138671875, 15.687255859375, 16.203125]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 4.0, 5.0, 7.0, 8.0, 9.0, 15.0, 11.0, 17.0, 24.0, 25.0, 20.0, 25.0, 35.0, 24.0, 38.0, 31.0, 40.0, 45.0, 49.0, 37.0, 49.0, 45.0, 39.0, 40.0, 43.0, 26.0, 39.0, 36.0, 24.0, 30.0, 30.0, 20.0, 17.0, 21.0, 9.0, 8.0, 15.0, 4.0, 8.0, 7.0, 3.0, 5.0, 5.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0], "bins": [-19.171875, -18.59033203125, -18.0087890625, -17.42724609375, -16.845703125, -16.26416015625, -15.6826171875, -15.10107421875, -14.51953125, -13.93798828125, -13.3564453125, -12.77490234375, -12.193359375, -11.61181640625, -11.0302734375, -10.44873046875, -9.8671875, -9.28564453125, -8.7041015625, -8.12255859375, -7.541015625, -6.95947265625, -6.3779296875, -5.79638671875, -5.21484375, -4.63330078125, -4.0517578125, -3.47021484375, -2.888671875, -2.30712890625, -1.7255859375, -1.14404296875, -0.5625, 0.01904296875, 0.6005859375, 1.18212890625, 1.763671875, 2.34521484375, 2.9267578125, 3.50830078125, 4.08984375, 4.67138671875, 5.2529296875, 5.83447265625, 6.416015625, 6.99755859375, 7.5791015625, 8.16064453125, 8.7421875, 9.32373046875, 9.9052734375, 10.48681640625, 11.068359375, 11.64990234375, 12.2314453125, 12.81298828125, 13.39453125, 13.97607421875, 14.5576171875, 15.13916015625, 15.720703125, 16.30224609375, 16.8837890625, 17.46533203125, 18.046875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 5.0, 3.0, 1.0, 2.0, 9.0, 12.0, 7.0, 20.0, 21.0, 33.0, 47.0, 59.0, 107.0, 148.0, 217.0, 313.0, 488.0, 825.0, 1360.0, 2410.0, 4568.0, 9438.0, 22417.0, 63936.0, 219168.0, 442618.0, 186738.0, 55408.0, 19963.0, 8310.0, 4167.0, 2220.0, 1309.0, 768.0, 474.0, 301.0, 195.0, 150.0, 95.0, 78.0, 42.0, 34.0, 24.0, 17.0, 10.0, 6.0, 9.0, 3.0, 0.0, 3.0, 6.0, 2.0, 2.0, 2.0, 2.0, 1.0], "bins": [-39.65625, -38.47021484375, -37.2841796875, -36.09814453125, -34.912109375, -33.72607421875, -32.5400390625, -31.35400390625, -30.16796875, -28.98193359375, -27.7958984375, -26.60986328125, -25.423828125, -24.23779296875, -23.0517578125, -21.86572265625, -20.6796875, -19.49365234375, -18.3076171875, -17.12158203125, -15.935546875, -14.74951171875, -13.5634765625, -12.37744140625, -11.19140625, -10.00537109375, -8.8193359375, -7.63330078125, -6.447265625, -5.26123046875, -4.0751953125, -2.88916015625, -1.703125, -0.51708984375, 0.6689453125, 1.85498046875, 3.041015625, 4.22705078125, 5.4130859375, 6.59912109375, 7.78515625, 8.97119140625, 10.1572265625, 11.34326171875, 12.529296875, 13.71533203125, 14.9013671875, 16.08740234375, 17.2734375, 18.45947265625, 19.6455078125, 20.83154296875, 22.017578125, 23.20361328125, 24.3896484375, 25.57568359375, 26.76171875, 27.94775390625, 29.1337890625, 30.31982421875, 31.505859375, 32.69189453125, 33.8779296875, 35.06396484375, 36.25]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 5.0, 2.0, 5.0, 2.0, 1.0, 5.0, 6.0, 7.0, 5.0, 12.0, 11.0, 13.0, 11.0, 25.0, 18.0, 22.0, 31.0, 41.0, 37.0, 49.0, 22.0, 38.0, 40.0, 38.0, 47.0, 29.0, 32.0, 41.0, 41.0, 48.0, 29.0, 33.0, 38.0, 42.0, 23.0, 21.0, 26.0, 16.0, 11.0, 11.0, 18.0, 13.0, 7.0, 10.0, 6.0, 9.0, 5.0, 3.0, 3.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.6796875, -9.3565673828125, -9.033447265625, -8.7103271484375, -8.38720703125, -8.0640869140625, -7.740966796875, -7.4178466796875, -7.0947265625, -6.7716064453125, -6.448486328125, -6.1253662109375, -5.80224609375, -5.4791259765625, -5.156005859375, -4.8328857421875, -4.509765625, -4.1866455078125, -3.863525390625, -3.5404052734375, -3.21728515625, -2.8941650390625, -2.571044921875, -2.2479248046875, -1.9248046875, -1.6016845703125, -1.278564453125, -0.9554443359375, -0.63232421875, -0.3092041015625, 0.013916015625, 0.3370361328125, 0.66015625, 0.9832763671875, 1.306396484375, 1.6295166015625, 1.95263671875, 2.2757568359375, 2.598876953125, 2.9219970703125, 3.2451171875, 3.5682373046875, 3.891357421875, 4.2144775390625, 4.53759765625, 4.8607177734375, 5.183837890625, 5.5069580078125, 5.830078125, 6.1531982421875, 6.476318359375, 6.7994384765625, 7.12255859375, 7.4456787109375, 7.768798828125, 8.0919189453125, 8.4150390625, 8.7381591796875, 9.061279296875, 9.3843994140625, 9.70751953125, 10.0306396484375, 10.353759765625, 10.6768798828125, 11.0]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 5.0, 7.0, 6.0, 8.0, 13.0, 25.0, 19.0, 25.0, 32.0, 56.0, 102.0, 110.0, 173.0, 245.0, 413.0, 606.0, 881.0, 1402.0, 2286.0, 3919.0, 6778.0, 12521.0, 24454.0, 50371.0, 114225.0, 259136.0, 303518.0, 141652.0, 62036.0, 29047.0, 14668.0, 8052.0, 4460.0, 2674.0, 1664.0, 986.0, 646.0, 443.0, 242.0, 174.0, 141.0, 102.0, 66.0, 58.0, 41.0, 21.0, 21.0, 9.0, 8.0, 5.0, 6.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6796875, -8.3916015625, -8.103515625, -7.8154296875, -7.52734375, -7.2392578125, -6.951171875, -6.6630859375, -6.375, -6.0869140625, -5.798828125, -5.5107421875, -5.22265625, -4.9345703125, -4.646484375, -4.3583984375, -4.0703125, -3.7822265625, -3.494140625, -3.2060546875, -2.91796875, -2.6298828125, -2.341796875, -2.0537109375, -1.765625, -1.4775390625, -1.189453125, -0.9013671875, -0.61328125, -0.3251953125, -0.037109375, 0.2509765625, 0.5390625, 0.8271484375, 1.115234375, 1.4033203125, 1.69140625, 1.9794921875, 2.267578125, 2.5556640625, 2.84375, 3.1318359375, 3.419921875, 3.7080078125, 3.99609375, 4.2841796875, 4.572265625, 4.8603515625, 5.1484375, 5.4365234375, 5.724609375, 6.0126953125, 6.30078125, 6.5888671875, 6.876953125, 7.1650390625, 7.453125, 7.7412109375, 8.029296875, 8.3173828125, 8.60546875, 8.8935546875, 9.181640625, 9.4697265625, 9.7578125]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 2.0, 4.0, 0.0, 3.0, 10.0, 9.0, 18.0, 20.0, 24.0, 42.0, 79.0, 85.0, 151.0, 131.0, 106.0, 94.0, 69.0, 35.0, 30.0, 19.0, 15.0, 17.0, 12.0, 5.0, 5.0, 5.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006551742553710938, -0.0006259679794311523, -0.0005967617034912109, -0.0005675554275512695, -0.0005383491516113281, -0.0005091428756713867, -0.0004799365997314453, -0.0004507303237915039, -0.0004215240478515625, -0.0003923177719116211, -0.0003631114959716797, -0.0003339052200317383, -0.0003046989440917969, -0.00027549266815185547, -0.00024628639221191406, -0.00021708011627197266, -0.00018787384033203125, -0.00015866756439208984, -0.00012946128845214844, -0.00010025501251220703, -7.104873657226562e-05, -4.184246063232422e-05, -1.2636184692382812e-05, 1.6570091247558594e-05, 4.57763671875e-05, 7.49826431274414e-05, 0.00010418891906738281, 0.00013339519500732422, 0.00016260147094726562, 0.00019180774688720703, 0.00022101402282714844, 0.00025022029876708984, 0.00027942657470703125, 0.00030863285064697266, 0.00033783912658691406, 0.00036704540252685547, 0.0003962516784667969, 0.0004254579544067383, 0.0004546642303466797, 0.0004838705062866211, 0.0005130767822265625, 0.0005422830581665039, 0.0005714893341064453, 0.0006006956100463867, 0.0006299018859863281, 0.0006591081619262695, 0.0006883144378662109, 0.0007175207138061523, 0.0007467269897460938, 0.0007759332656860352, 0.0008051395416259766, 0.000834345817565918, 0.0008635520935058594, 0.0008927583694458008, 0.0009219646453857422, 0.0009511709213256836, 0.000980377197265625, 0.0010095834732055664, 0.0010387897491455078, 0.0010679960250854492, 0.0010972023010253906, 0.001126408576965332, 0.0011556148529052734, 0.0011848211288452148, 0.0012140274047851562]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 7.0, 4.0, 15.0, 19.0, 26.0, 34.0, 56.0, 78.0, 114.0, 162.0, 213.0, 361.0, 478.0, 823.0, 1137.0, 1852.0, 2746.0, 4379.0, 7063.0, 11846.0, 20061.0, 33961.0, 59112.0, 101993.0, 164642.0, 206599.0, 171051.0, 107260.0, 62331.0, 36050.0, 21049.0, 12593.0, 7561.0, 4554.0, 2903.0, 1830.0, 1156.0, 796.0, 534.0, 359.0, 235.0, 176.0, 101.0, 85.0, 47.0, 44.0, 26.0, 13.0, 11.0, 4.0, 6.0, 1.0, 6.0, 5.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.4296875, -6.22589111328125, -6.0220947265625, -5.81829833984375, -5.614501953125, -5.41070556640625, -5.2069091796875, -5.00311279296875, -4.79931640625, -4.59552001953125, -4.3917236328125, -4.18792724609375, -3.984130859375, -3.78033447265625, -3.5765380859375, -3.37274169921875, -3.1689453125, -2.96514892578125, -2.7613525390625, -2.55755615234375, -2.353759765625, -2.14996337890625, -1.9461669921875, -1.74237060546875, -1.53857421875, -1.33477783203125, -1.1309814453125, -0.92718505859375, -0.723388671875, -0.51959228515625, -0.3157958984375, -0.11199951171875, 0.091796875, 0.29559326171875, 0.4993896484375, 0.70318603515625, 0.906982421875, 1.11077880859375, 1.3145751953125, 1.51837158203125, 1.72216796875, 1.92596435546875, 2.1297607421875, 2.33355712890625, 2.537353515625, 2.74114990234375, 2.9449462890625, 3.14874267578125, 3.3525390625, 3.55633544921875, 3.7601318359375, 3.96392822265625, 4.167724609375, 4.37152099609375, 4.5753173828125, 4.77911376953125, 4.98291015625, 5.18670654296875, 5.3905029296875, 5.59429931640625, 5.798095703125, 6.00189208984375, 6.2056884765625, 6.40948486328125, 6.61328125]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 0.0, 3.0, 2.0, 5.0, 4.0, 9.0, 9.0, 7.0, 6.0, 10.0, 19.0, 12.0, 14.0, 24.0, 34.0, 31.0, 35.0, 55.0, 60.0, 67.0, 50.0, 58.0, 77.0, 57.0, 50.0, 49.0, 39.0, 48.0, 32.0, 22.0, 25.0, 19.0, 6.0, 18.0, 12.0, 6.0, 7.0, 7.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 6.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-2.443359375, -2.373291015625, -2.30322265625, -2.233154296875, -2.1630859375, -2.093017578125, -2.02294921875, -1.952880859375, -1.8828125, -1.812744140625, -1.74267578125, -1.672607421875, -1.6025390625, -1.532470703125, -1.46240234375, -1.392333984375, -1.322265625, -1.252197265625, -1.18212890625, -1.112060546875, -1.0419921875, -0.971923828125, -0.90185546875, -0.831787109375, -0.76171875, -0.691650390625, -0.62158203125, -0.551513671875, -0.4814453125, -0.411376953125, -0.34130859375, -0.271240234375, -0.201171875, -0.131103515625, -0.06103515625, 0.009033203125, 0.0791015625, 0.149169921875, 0.21923828125, 0.289306640625, 0.359375, 0.429443359375, 0.49951171875, 0.569580078125, 0.6396484375, 0.709716796875, 0.77978515625, 0.849853515625, 0.919921875, 0.989990234375, 1.06005859375, 1.130126953125, 1.2001953125, 1.270263671875, 1.34033203125, 1.410400390625, 1.48046875, 1.550537109375, 1.62060546875, 1.690673828125, 1.7607421875, 1.830810546875, 1.90087890625, 1.970947265625, 2.041015625]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 2.0, 2.0, 5.0, 2.0, 14.0, 9.0, 10.0, 17.0, 20.0, 24.0, 29.0, 34.0, 43.0, 37.0, 57.0, 78.0, 82.0, 77.0, 62.0, 68.0, 67.0, 58.0, 41.0, 33.0, 35.0, 20.0, 21.0, 14.0, 14.0, 6.0, 4.0, 8.0, 7.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-31.31219482421875, -30.474313735961914, -29.636432647705078, -28.798551559448242, -27.960670471191406, -27.122787475585938, -26.284908294677734, -25.447025299072266, -24.60914421081543, -23.771263122558594, -22.933382034301758, -22.095500946044922, -21.257619857788086, -20.41973876953125, -19.58185577392578, -18.743974685668945, -17.90609359741211, -17.068212509155273, -16.230331420898438, -15.392450332641602, -14.55456829071045, -13.716687202453613, -12.878806114196777, -12.040924072265625, -11.203044891357422, -10.365163803100586, -9.52728271484375, -8.689401626586914, -7.851519584655762, -7.013638496398926, -6.17575740814209, -5.337875843048096, -4.499994277954102, -3.6621129512786865, -2.8242316246032715, -1.9863505363464355, -1.1484692096710205, -0.31058788299560547, 0.5272932052612305, 1.3651747703552246, 2.2030558586120605, 3.0409371852874756, 3.8788185119628906, 4.716699600219727, 5.5545806884765625, 6.392462253570557, 7.230343341827393, 8.068224906921387, 8.906105995178223, 9.743987083435059, 10.581868171691895, 11.419750213623047, 12.257631301879883, 13.095512390136719, 13.933393478393555, 14.77127456665039, 15.609155654907227, 16.447036743164062, 17.2849178314209, 18.122798919677734, 18.96068000793457, 19.798561096191406, 20.636444091796875, 21.47432518005371, 22.312206268310547]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 6.0, 10.0, 10.0, 10.0, 6.0, 17.0, 21.0, 19.0, 19.0, 33.0, 35.0, 33.0, 29.0, 34.0, 43.0, 39.0, 38.0, 38.0, 32.0, 41.0, 45.0, 40.0, 38.0, 34.0, 41.0, 34.0, 31.0, 38.0, 24.0, 22.0, 26.0, 16.0, 16.0, 10.0, 10.0, 10.0, 12.0, 9.0, 8.0, 2.0, 5.0, 3.0, 7.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0], "bins": [-19.04004669189453, -18.49024772644043, -17.940448760986328, -17.390649795532227, -16.840850830078125, -16.291051864624023, -15.741252899169922, -15.19145393371582, -14.641654968261719, -14.091856002807617, -13.542057037353516, -12.992258071899414, -12.442459106445312, -11.892660140991211, -11.34286117553711, -10.793062210083008, -10.243263244628906, -9.693464279174805, -9.143665313720703, -8.593866348266602, -8.0440673828125, -7.494268417358398, -6.944469451904297, -6.394670486450195, -5.844871520996094, -5.295072555541992, -4.745273590087891, -4.195474624633789, -3.6456756591796875, -3.095876693725586, -2.5460777282714844, -1.9962787628173828, -1.4464797973632812, -0.8966808319091797, -0.3468818664550781, 0.20291709899902344, 0.752716064453125, 1.3025150299072266, 1.8523139953613281, 2.4021129608154297, 2.9519119262695312, 3.501710891723633, 4.051509857177734, 4.601308822631836, 5.1511077880859375, 5.700906753540039, 6.250705718994141, 6.800504684448242, 7.350303649902344, 7.900102615356445, 8.449901580810547, 8.999700546264648, 9.54949951171875, 10.099298477172852, 10.649097442626953, 11.198896408081055, 11.748695373535156, 12.298494338989258, 12.84829330444336, 13.398092269897461, 13.947891235351562, 14.497690200805664, 15.047489166259766, 15.597288131713867, 16.14708709716797]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 7.0, 3.0, 7.0, 19.0, 24.0, 24.0, 30.0, 50.0, 57.0, 114.0, 149.0, 216.0, 299.0, 407.0, 652.0, 978.0, 1435.0, 2196.0, 3322.0, 5129.0, 7661.0, 11773.0, 18715.0, 29101.0, 45634.0, 71640.0, 105930.0, 144135.0, 160938.0, 141295.0, 103211.0, 68965.0, 44404.0, 28644.0, 17820.0, 11575.0, 7467.0, 4962.0, 3189.0, 2072.0, 1387.0, 909.0, 610.0, 446.0, 313.0, 215.0, 144.0, 90.0, 63.0, 56.0, 27.0, 21.0, 12.0, 13.0, 1.0, 6.0, 3.0, 7.0, 0.0, 1.0], "bins": [-22.46875, -21.776611328125, -21.08447265625, -20.392333984375, -19.7001953125, -19.008056640625, -18.31591796875, -17.623779296875, -16.931640625, -16.239501953125, -15.54736328125, -14.855224609375, -14.1630859375, -13.470947265625, -12.77880859375, -12.086669921875, -11.39453125, -10.702392578125, -10.01025390625, -9.318115234375, -8.6259765625, -7.933837890625, -7.24169921875, -6.549560546875, -5.857421875, -5.165283203125, -4.47314453125, -3.781005859375, -3.0888671875, -2.396728515625, -1.70458984375, -1.012451171875, -0.3203125, 0.371826171875, 1.06396484375, 1.756103515625, 2.4482421875, 3.140380859375, 3.83251953125, 4.524658203125, 5.216796875, 5.908935546875, 6.60107421875, 7.293212890625, 7.9853515625, 8.677490234375, 9.36962890625, 10.061767578125, 10.75390625, 11.446044921875, 12.13818359375, 12.830322265625, 13.5224609375, 14.214599609375, 14.90673828125, 15.598876953125, 16.291015625, 16.983154296875, 17.67529296875, 18.367431640625, 19.0595703125, 19.751708984375, 20.44384765625, 21.135986328125, 21.828125]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 6.0, 8.0, 7.0, 12.0, 11.0, 10.0, 18.0, 22.0, 26.0, 33.0, 39.0, 32.0, 49.0, 43.0, 28.0, 52.0, 50.0, 38.0, 49.0, 43.0, 46.0, 40.0, 44.0, 41.0, 34.0, 42.0, 29.0, 19.0, 20.0, 20.0, 12.0, 14.0, 11.0, 11.0, 13.0, 5.0, 8.0, 5.0, 2.0, 3.0, 6.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.015625, -18.430419921875, -17.84521484375, -17.260009765625, -16.6748046875, -16.089599609375, -15.50439453125, -14.919189453125, -14.333984375, -13.748779296875, -13.16357421875, -12.578369140625, -11.9931640625, -11.407958984375, -10.82275390625, -10.237548828125, -9.65234375, -9.067138671875, -8.48193359375, -7.896728515625, -7.3115234375, -6.726318359375, -6.14111328125, -5.555908203125, -4.970703125, -4.385498046875, -3.80029296875, -3.215087890625, -2.6298828125, -2.044677734375, -1.45947265625, -0.874267578125, -0.2890625, 0.296142578125, 0.88134765625, 1.466552734375, 2.0517578125, 2.636962890625, 3.22216796875, 3.807373046875, 4.392578125, 4.977783203125, 5.56298828125, 6.148193359375, 6.7333984375, 7.318603515625, 7.90380859375, 8.489013671875, 9.07421875, 9.659423828125, 10.24462890625, 10.829833984375, 11.4150390625, 12.000244140625, 12.58544921875, 13.170654296875, 13.755859375, 14.341064453125, 14.92626953125, 15.511474609375, 16.0966796875, 16.681884765625, 17.26708984375, 17.852294921875, 18.4375]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 6.0, 5.0, 7.0, 16.0, 28.0, 37.0, 57.0, 87.0, 122.0, 182.0, 276.0, 403.0, 651.0, 1071.0, 1687.0, 2801.0, 4524.0, 7607.0, 13049.0, 22323.0, 37500.0, 63435.0, 102307.0, 150740.0, 181062.0, 162660.0, 115452.0, 72844.0, 43708.0, 25903.0, 15196.0, 9097.0, 5212.0, 3212.0, 1952.0, 1137.0, 777.0, 480.0, 305.0, 224.0, 130.0, 98.0, 65.0, 41.0, 25.0, 22.0, 12.0, 10.0, 5.0, 1.0, 5.0, 0.0, 5.0, 0.0, 0.0, 2.0, 1.0], "bins": [-20.71875, -20.06396484375, -19.4091796875, -18.75439453125, -18.099609375, -17.44482421875, -16.7900390625, -16.13525390625, -15.48046875, -14.82568359375, -14.1708984375, -13.51611328125, -12.861328125, -12.20654296875, -11.5517578125, -10.89697265625, -10.2421875, -9.58740234375, -8.9326171875, -8.27783203125, -7.623046875, -6.96826171875, -6.3134765625, -5.65869140625, -5.00390625, -4.34912109375, -3.6943359375, -3.03955078125, -2.384765625, -1.72998046875, -1.0751953125, -0.42041015625, 0.234375, 0.88916015625, 1.5439453125, 2.19873046875, 2.853515625, 3.50830078125, 4.1630859375, 4.81787109375, 5.47265625, 6.12744140625, 6.7822265625, 7.43701171875, 8.091796875, 8.74658203125, 9.4013671875, 10.05615234375, 10.7109375, 11.36572265625, 12.0205078125, 12.67529296875, 13.330078125, 13.98486328125, 14.6396484375, 15.29443359375, 15.94921875, 16.60400390625, 17.2587890625, 17.91357421875, 18.568359375, 19.22314453125, 19.8779296875, 20.53271484375, 21.1875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 2.0, 4.0, 4.0, 10.0, 12.0, 8.0, 5.0, 15.0, 11.0, 19.0, 28.0, 25.0, 30.0, 32.0, 28.0, 33.0, 42.0, 27.0, 48.0, 32.0, 44.0, 44.0, 44.0, 33.0, 43.0, 41.0, 38.0, 37.0, 42.0, 28.0, 28.0, 25.0, 13.0, 28.0, 12.0, 21.0, 12.0, 12.0, 11.0, 11.0, 8.0, 4.0, 2.0, 3.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.90625, -9.587890625, -9.26953125, -8.951171875, -8.6328125, -8.314453125, -7.99609375, -7.677734375, -7.359375, -7.041015625, -6.72265625, -6.404296875, -6.0859375, -5.767578125, -5.44921875, -5.130859375, -4.8125, -4.494140625, -4.17578125, -3.857421875, -3.5390625, -3.220703125, -2.90234375, -2.583984375, -2.265625, -1.947265625, -1.62890625, -1.310546875, -0.9921875, -0.673828125, -0.35546875, -0.037109375, 0.28125, 0.599609375, 0.91796875, 1.236328125, 1.5546875, 1.873046875, 2.19140625, 2.509765625, 2.828125, 3.146484375, 3.46484375, 3.783203125, 4.1015625, 4.419921875, 4.73828125, 5.056640625, 5.375, 5.693359375, 6.01171875, 6.330078125, 6.6484375, 6.966796875, 7.28515625, 7.603515625, 7.921875, 8.240234375, 8.55859375, 8.876953125, 9.1953125, 9.513671875, 9.83203125, 10.150390625, 10.46875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 9.0, 9.0, 11.0, 24.0, 41.0, 48.0, 82.0, 107.0, 165.0, 267.0, 408.0, 608.0, 1001.0, 1475.0, 2485.0, 3898.0, 6459.0, 10733.0, 18947.0, 33194.0, 59089.0, 102710.0, 161691.0, 202082.0, 172867.0, 114166.0, 66848.0, 37428.0, 20968.0, 11834.0, 7078.0, 4367.0, 2764.0, 1644.0, 1090.0, 664.0, 437.0, 283.0, 210.0, 123.0, 95.0, 46.0, 36.0, 29.0, 19.0, 9.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.7578125, -11.3857421875, -11.013671875, -10.6416015625, -10.26953125, -9.8974609375, -9.525390625, -9.1533203125, -8.78125, -8.4091796875, -8.037109375, -7.6650390625, -7.29296875, -6.9208984375, -6.548828125, -6.1767578125, -5.8046875, -5.4326171875, -5.060546875, -4.6884765625, -4.31640625, -3.9443359375, -3.572265625, -3.2001953125, -2.828125, -2.4560546875, -2.083984375, -1.7119140625, -1.33984375, -0.9677734375, -0.595703125, -0.2236328125, 0.1484375, 0.5205078125, 0.892578125, 1.2646484375, 1.63671875, 2.0087890625, 2.380859375, 2.7529296875, 3.125, 3.4970703125, 3.869140625, 4.2412109375, 4.61328125, 4.9853515625, 5.357421875, 5.7294921875, 6.1015625, 6.4736328125, 6.845703125, 7.2177734375, 7.58984375, 7.9619140625, 8.333984375, 8.7060546875, 9.078125, 9.4501953125, 9.822265625, 10.1943359375, 10.56640625, 10.9384765625, 11.310546875, 11.6826171875, 12.0546875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 8.0, 10.0, 16.0, 13.0, 26.0, 18.0, 39.0, 46.0, 52.0, 74.0, 80.0, 89.0, 93.0, 71.0, 83.0, 64.0, 57.0, 38.0, 32.0, 29.0, 25.0, 12.0, 6.0, 9.0, 3.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0019311904907226562, -0.0018766522407531738, -0.0018221139907836914, -0.001767575740814209, -0.0017130374908447266, -0.0016584992408752441, -0.0016039609909057617, -0.0015494227409362793, -0.0014948844909667969, -0.0014403462409973145, -0.001385807991027832, -0.0013312697410583496, -0.0012767314910888672, -0.0012221932411193848, -0.0011676549911499023, -0.00111311674118042, -0.0010585784912109375, -0.001004040241241455, -0.0009495019912719727, -0.0008949637413024902, -0.0008404254913330078, -0.0007858872413635254, -0.000731348991394043, -0.0006768107414245605, -0.0006222724914550781, -0.0005677342414855957, -0.0005131959915161133, -0.00045865774154663086, -0.00040411949157714844, -0.000349581241607666, -0.0002950429916381836, -0.00024050474166870117, -0.00018596649169921875, -0.00013142824172973633, -7.68899917602539e-05, -2.2351741790771484e-05, 3.218650817871094e-05, 8.672475814819336e-05, 0.00014126300811767578, 0.0001958012580871582, 0.0002503395080566406, 0.00030487775802612305, 0.00035941600799560547, 0.0004139542579650879, 0.0004684925079345703, 0.0005230307579040527, 0.0005775690078735352, 0.0006321072578430176, 0.0006866455078125, 0.0007411837577819824, 0.0007957220077514648, 0.0008502602577209473, 0.0009047985076904297, 0.0009593367576599121, 0.0010138750076293945, 0.001068413257598877, 0.0011229515075683594, 0.0011774897575378418, 0.0012320280075073242, 0.0012865662574768066, 0.001341104507446289, 0.0013956427574157715, 0.001450181007385254, 0.0015047192573547363, 0.0015592575073242188]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 10.0, 9.0, 9.0, 18.0, 27.0, 42.0, 65.0, 77.0, 137.0, 201.0, 295.0, 435.0, 645.0, 1036.0, 1506.0, 2400.0, 3754.0, 5830.0, 9492.0, 15142.0, 24695.0, 40865.0, 66320.0, 104411.0, 149860.0, 172866.0, 154493.0, 110623.0, 70318.0, 43157.0, 26446.0, 15993.0, 10050.0, 6215.0, 3997.0, 2434.0, 1615.0, 1009.0, 679.0, 447.0, 307.0, 214.0, 132.0, 86.0, 63.0, 39.0, 31.0, 26.0, 19.0, 8.0, 9.0, 5.0, 5.0, 0.0, 1.0, 0.0, 2.0], "bins": [-10.1953125, -9.8822021484375, -9.569091796875, -9.2559814453125, -8.94287109375, -8.6297607421875, -8.316650390625, -8.0035400390625, -7.6904296875, -7.3773193359375, -7.064208984375, -6.7510986328125, -6.43798828125, -6.1248779296875, -5.811767578125, -5.4986572265625, -5.185546875, -4.8724365234375, -4.559326171875, -4.2462158203125, -3.93310546875, -3.6199951171875, -3.306884765625, -2.9937744140625, -2.6806640625, -2.3675537109375, -2.054443359375, -1.7413330078125, -1.42822265625, -1.1151123046875, -0.802001953125, -0.4888916015625, -0.17578125, 0.1373291015625, 0.450439453125, 0.7635498046875, 1.07666015625, 1.3897705078125, 1.702880859375, 2.0159912109375, 2.3291015625, 2.6422119140625, 2.955322265625, 3.2684326171875, 3.58154296875, 3.8946533203125, 4.207763671875, 4.5208740234375, 4.833984375, 5.1470947265625, 5.460205078125, 5.7733154296875, 6.08642578125, 6.3995361328125, 6.712646484375, 7.0257568359375, 7.3388671875, 7.6519775390625, 7.965087890625, 8.2781982421875, 8.59130859375, 8.9044189453125, 9.217529296875, 9.5306396484375, 9.84375]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 9.0, 6.0, 5.0, 4.0, 3.0, 18.0, 19.0, 24.0, 20.0, 33.0, 34.0, 34.0, 70.0, 51.0, 76.0, 77.0, 66.0, 65.0, 67.0, 57.0, 55.0, 38.0, 43.0, 26.0, 23.0, 18.0, 12.0, 14.0, 12.0, 6.0, 8.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.9765625, -4.82794189453125, -4.6793212890625, -4.53070068359375, -4.382080078125, -4.23345947265625, -4.0848388671875, -3.93621826171875, -3.78759765625, -3.63897705078125, -3.4903564453125, -3.34173583984375, -3.193115234375, -3.04449462890625, -2.8958740234375, -2.74725341796875, -2.5986328125, -2.45001220703125, -2.3013916015625, -2.15277099609375, -2.004150390625, -1.85552978515625, -1.7069091796875, -1.55828857421875, -1.40966796875, -1.26104736328125, -1.1124267578125, -0.96380615234375, -0.815185546875, -0.66656494140625, -0.5179443359375, -0.36932373046875, -0.220703125, -0.07208251953125, 0.0765380859375, 0.22515869140625, 0.373779296875, 0.52239990234375, 0.6710205078125, 0.81964111328125, 0.96826171875, 1.11688232421875, 1.2655029296875, 1.41412353515625, 1.562744140625, 1.71136474609375, 1.8599853515625, 2.00860595703125, 2.1572265625, 2.30584716796875, 2.4544677734375, 2.60308837890625, 2.751708984375, 2.90032958984375, 3.0489501953125, 3.19757080078125, 3.34619140625, 3.49481201171875, 3.6434326171875, 3.79205322265625, 3.940673828125, 4.08929443359375, 4.2379150390625, 4.38653564453125, 4.53515625]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 4.0, 7.0, 7.0, 5.0, 9.0, 13.0, 13.0, 10.0, 27.0, 29.0, 34.0, 34.0, 38.0, 58.0, 53.0, 58.0, 61.0, 66.0, 63.0, 63.0, 53.0, 37.0, 46.0, 51.0, 30.0, 25.0, 18.0, 15.0, 11.0, 17.0, 14.0, 9.0, 7.0, 5.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.40544891357422, -21.735342025756836, -21.065237045288086, -20.395130157470703, -19.72502326965332, -19.054916381835938, -18.384811401367188, -17.714704513549805, -17.044597625732422, -16.37449073791504, -15.704384803771973, -15.034278869628906, -14.364171981811523, -13.694066047668457, -13.02396011352539, -12.353853225708008, -11.683747291564941, -11.013641357421875, -10.343534469604492, -9.673428535461426, -9.003321647644043, -8.333215713500977, -7.663109302520752, -6.993002891540527, -6.322896480560303, -5.652790069580078, -4.9826836585998535, -4.312577247619629, -3.6424710750579834, -2.972364664077759, -2.3022584915161133, -1.6321520805358887, -0.9620456695556641, -0.29193931818008423, 0.3781670331954956, 1.0482733249664307, 1.7183797359466553, 2.38848614692688, 3.0585923194885254, 3.72869873046875, 4.398805141448975, 5.068911552429199, 5.739017963409424, 6.409124374389648, 7.079230308532715, 7.749337196350098, 8.419443130493164, 9.089550018310547, 9.759655952453613, 10.42976188659668, 11.099868774414062, 11.769974708557129, 12.440081596374512, 13.110187530517578, 13.780294418334961, 14.450400352478027, 15.120506286621094, 15.79061222076416, 16.460718154907227, 17.13082504272461, 17.800931930541992, 18.471038818359375, 19.141143798828125, 19.811250686645508, 20.48135757446289]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 6.0, 7.0, 5.0, 8.0, 5.0, 14.0, 16.0, 16.0, 23.0, 35.0, 35.0, 38.0, 36.0, 41.0, 46.0, 37.0, 48.0, 45.0, 52.0, 52.0, 46.0, 39.0, 48.0, 49.0, 32.0, 33.0, 31.0, 28.0, 24.0, 20.0, 11.0, 20.0, 13.0, 8.0, 7.0, 9.0, 4.0, 7.0, 5.0, 1.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.724685668945312, -19.14139747619629, -18.558109283447266, -17.97481918334961, -17.391530990600586, -16.808242797851562, -16.22495460510254, -15.641666412353516, -15.058377265930176, -14.475089073181152, -13.891799926757812, -13.308511734008789, -12.725223541259766, -12.141934394836426, -11.558646202087402, -10.975357055664062, -10.392068862915039, -9.808780670166016, -9.225491523742676, -8.642203330993652, -8.058914184570312, -7.475625991821289, -6.892337799072266, -6.309049129486084, -5.725760459899902, -5.142471790313721, -4.559183120727539, -3.9758949279785156, -3.392606258392334, -2.8093175888061523, -2.22602915763855, -1.6427407264709473, -1.0594520568847656, -0.47616350650787354, 0.10712504386901855, 0.6904135942459106, 1.2737021446228027, 1.8569908142089844, 2.440279245376587, 3.0235676765441895, 3.606856346130371, 4.190145015716553, 4.773433685302734, 5.356721878051758, 5.9400105476379395, 6.523299217224121, 7.1065874099731445, 7.689876079559326, 8.273164749145508, 8.856452941894531, 9.439742088317871, 10.023030281066895, 10.606319427490234, 11.189607620239258, 11.772895812988281, 12.356184005737305, 12.939473152160645, 13.522761344909668, 14.106050491333008, 14.689338684082031, 15.272626876831055, 15.855916023254395, 16.439205169677734, 17.022493362426758, 17.60578155517578]}, "gradients/decoder.bert.encoder.layer.16.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 4.0, 7.0, 6.0, 6.0, 11.0, 18.0, 33.0, 40.0, 59.0, 94.0, 159.0, 243.0, 394.0, 588.0, 909.0, 1346.0, 2140.0, 3396.0, 5352.0, 8612.0, 14132.0, 23755.0, 42142.0, 78269.0, 158158.0, 347349.0, 743516.0, 1122446.0, 847643.0, 404780.0, 182341.0, 89386.0, 47133.0, 26602.0, 16160.0, 9643.0, 6051.0, 3905.0, 2535.0, 1701.0, 1073.0, 726.0, 469.0, 337.0, 211.0, 140.0, 95.0, 51.0, 49.0, 37.0, 15.0, 7.0, 6.0, 12.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-18.8125, -18.217041015625, -17.62158203125, -17.026123046875, -16.4306640625, -15.835205078125, -15.23974609375, -14.644287109375, -14.048828125, -13.453369140625, -12.85791015625, -12.262451171875, -11.6669921875, -11.071533203125, -10.47607421875, -9.880615234375, -9.28515625, -8.689697265625, -8.09423828125, -7.498779296875, -6.9033203125, -6.307861328125, -5.71240234375, -5.116943359375, -4.521484375, -3.926025390625, -3.33056640625, -2.735107421875, -2.1396484375, -1.544189453125, -0.94873046875, -0.353271484375, 0.2421875, 0.837646484375, 1.43310546875, 2.028564453125, 2.6240234375, 3.219482421875, 3.81494140625, 4.410400390625, 5.005859375, 5.601318359375, 6.19677734375, 6.792236328125, 7.3876953125, 7.983154296875, 8.57861328125, 9.174072265625, 9.76953125, 10.364990234375, 10.96044921875, 11.555908203125, 12.1513671875, 12.746826171875, 13.34228515625, 13.937744140625, 14.533203125, 15.128662109375, 15.72412109375, 16.319580078125, 16.9150390625, 17.510498046875, 18.10595703125, 18.701416015625, 19.296875]}, "gradients/decoder.bert.encoder.layer.16.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 3.0, 2.0, 9.0, 6.0, 10.0, 10.0, 15.0, 15.0, 14.0, 21.0, 24.0, 29.0, 24.0, 38.0, 57.0, 48.0, 36.0, 34.0, 52.0, 53.0, 44.0, 31.0, 44.0, 43.0, 48.0, 47.0, 36.0, 32.0, 36.0, 18.0, 27.0, 15.0, 13.0, 13.0, 16.0, 11.0, 5.0, 5.0, 6.0, 3.0, 6.0, 2.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.9765625, -12.5977783203125, -12.218994140625, -11.8402099609375, -11.46142578125, -11.0826416015625, -10.703857421875, -10.3250732421875, -9.9462890625, -9.5675048828125, -9.188720703125, -8.8099365234375, -8.43115234375, -8.0523681640625, -7.673583984375, -7.2947998046875, -6.916015625, -6.5372314453125, -6.158447265625, -5.7796630859375, -5.40087890625, -5.0220947265625, -4.643310546875, -4.2645263671875, -3.8857421875, -3.5069580078125, -3.128173828125, -2.7493896484375, -2.37060546875, -1.9918212890625, -1.613037109375, -1.2342529296875, -0.85546875, -0.4766845703125, -0.097900390625, 0.2808837890625, 0.65966796875, 1.0384521484375, 1.417236328125, 1.7960205078125, 2.1748046875, 2.5535888671875, 2.932373046875, 3.3111572265625, 3.68994140625, 4.0687255859375, 4.447509765625, 4.8262939453125, 5.205078125, 5.5838623046875, 5.962646484375, 6.3414306640625, 6.72021484375, 7.0989990234375, 7.477783203125, 7.8565673828125, 8.2353515625, 8.6141357421875, 8.992919921875, 9.3717041015625, 9.75048828125, 10.1292724609375, 10.508056640625, 10.8868408203125, 11.265625]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 7.0, 7.0, 9.0, 13.0, 26.0, 34.0, 56.0, 75.0, 112.0, 176.0, 234.0, 341.0, 646.0, 1087.0, 1762.0, 3138.0, 5444.0, 10057.0, 19801.0, 40228.0, 86528.0, 197452.0, 470914.0, 1030642.0, 1210334.0, 629962.0, 266463.0, 114236.0, 51497.0, 24489.0, 12694.0, 6688.0, 3691.0, 2197.0, 1211.0, 759.0, 465.0, 265.0, 180.0, 125.0, 85.0, 49.0, 33.0, 26.0, 21.0, 10.0, 7.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-25.21875, -24.480712890625, -23.74267578125, -23.004638671875, -22.2666015625, -21.528564453125, -20.79052734375, -20.052490234375, -19.314453125, -18.576416015625, -17.83837890625, -17.100341796875, -16.3623046875, -15.624267578125, -14.88623046875, -14.148193359375, -13.41015625, -12.672119140625, -11.93408203125, -11.196044921875, -10.4580078125, -9.719970703125, -8.98193359375, -8.243896484375, -7.505859375, -6.767822265625, -6.02978515625, -5.291748046875, -4.5537109375, -3.815673828125, -3.07763671875, -2.339599609375, -1.6015625, -0.863525390625, -0.12548828125, 0.612548828125, 1.3505859375, 2.088623046875, 2.82666015625, 3.564697265625, 4.302734375, 5.040771484375, 5.77880859375, 6.516845703125, 7.2548828125, 7.992919921875, 8.73095703125, 9.468994140625, 10.20703125, 10.945068359375, 11.68310546875, 12.421142578125, 13.1591796875, 13.897216796875, 14.63525390625, 15.373291015625, 16.111328125, 16.849365234375, 17.58740234375, 18.325439453125, 19.0634765625, 19.801513671875, 20.53955078125, 21.277587890625, 22.015625]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 4.0, 3.0, 0.0, 3.0, 7.0, 7.0, 5.0, 8.0, 16.0, 17.0, 24.0, 20.0, 32.0, 51.0, 63.0, 76.0, 113.0, 135.0, 189.0, 216.0, 252.0, 291.0, 316.0, 362.0, 352.0, 289.0, 265.0, 217.0, 176.0, 150.0, 99.0, 94.0, 72.0, 49.0, 35.0, 23.0, 24.0, 8.0, 8.0, 3.0, 1.0, 5.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-8.9296875, -8.69171142578125, -8.4537353515625, -8.21575927734375, -7.977783203125, -7.73980712890625, -7.5018310546875, -7.26385498046875, -7.02587890625, -6.78790283203125, -6.5499267578125, -6.31195068359375, -6.073974609375, -5.83599853515625, -5.5980224609375, -5.36004638671875, -5.1220703125, -4.88409423828125, -4.6461181640625, -4.40814208984375, -4.170166015625, -3.93218994140625, -3.6942138671875, -3.45623779296875, -3.21826171875, -2.98028564453125, -2.7423095703125, -2.50433349609375, -2.266357421875, -2.02838134765625, -1.7904052734375, -1.55242919921875, -1.314453125, -1.07647705078125, -0.8385009765625, -0.60052490234375, -0.362548828125, -0.12457275390625, 0.1134033203125, 0.35137939453125, 0.58935546875, 0.82733154296875, 1.0653076171875, 1.30328369140625, 1.541259765625, 1.77923583984375, 2.0172119140625, 2.25518798828125, 2.4931640625, 2.73114013671875, 2.9691162109375, 3.20709228515625, 3.445068359375, 3.68304443359375, 3.9210205078125, 4.15899658203125, 4.39697265625, 4.63494873046875, 4.8729248046875, 5.11090087890625, 5.348876953125, 5.58685302734375, 5.8248291015625, 6.06280517578125, 6.30078125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 6.0, 2.0, 5.0, 9.0, 3.0, 11.0, 3.0, 11.0, 12.0, 18.0, 17.0, 19.0, 36.0, 41.0, 54.0, 63.0, 66.0, 65.0, 69.0, 67.0, 68.0, 53.0, 59.0, 53.0, 43.0, 36.0, 32.0, 23.0, 18.0, 12.0, 9.0, 5.0, 8.0, 9.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-24.6554012298584, -23.96820831298828, -23.281017303466797, -22.593826293945312, -21.906633377075195, -21.219440460205078, -20.532249450683594, -19.84505844116211, -19.157865524291992, -18.470672607421875, -17.78348159790039, -17.096290588378906, -16.40909767150879, -15.721905708312988, -15.034713745117188, -14.347521781921387, -13.660329818725586, -12.973137855529785, -12.285945892333984, -11.598753929138184, -10.911561965942383, -10.224370002746582, -9.537178039550781, -8.84998607635498, -8.16279411315918, -7.475602149963379, -6.788410186767578, -6.101218223571777, -5.414026260375977, -4.726834297180176, -4.039642333984375, -3.352450370788574, -2.6652603149414062, -1.9780683517456055, -1.2908763885498047, -0.6036844253540039, 0.08350753784179688, 0.7706995010375977, 1.4578914642333984, 2.145083427429199, 2.832275390625, 3.519467353820801, 4.206659317016602, 4.893851280212402, 5.581043243408203, 6.268235206604004, 6.955427169799805, 7.6426191329956055, 8.329811096191406, 9.017003059387207, 9.704195022583008, 10.391386985778809, 11.07857894897461, 11.76577091217041, 12.452962875366211, 13.140154838562012, 13.827346801757812, 14.514538764953613, 15.201730728149414, 15.888922691345215, 16.576114654541016, 17.2633056640625, 17.950498580932617, 18.637691497802734, 19.32488250732422]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 2.0, 2.0, 4.0, 3.0, 3.0, 9.0, 8.0, 8.0, 14.0, 11.0, 21.0, 13.0, 30.0, 24.0, 30.0, 27.0, 33.0, 33.0, 35.0, 34.0, 37.0, 41.0, 22.0, 37.0, 39.0, 45.0, 42.0, 51.0, 31.0, 31.0, 38.0, 26.0, 36.0, 19.0, 15.0, 20.0, 18.0, 15.0, 17.0, 14.0, 8.0, 13.0, 7.0, 10.0, 4.0, 5.0, 5.0, 5.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-14.058521270751953, -13.622529983520508, -13.186539649963379, -12.750548362731934, -12.314558029174805, -11.87856674194336, -11.442575454711914, -11.006584167480469, -10.57059383392334, -10.134602546691895, -9.698612213134766, -9.26262092590332, -8.826629638671875, -8.390639305114746, -7.954648017883301, -7.518657207489014, -7.082666397094727, -6.6466755867004395, -6.210684776306152, -5.774693489074707, -5.33870267868042, -4.902711868286133, -4.4667205810546875, -4.0307297706604, -3.5947389602661133, -3.158748149871826, -2.72275710105896, -2.2867660522460938, -1.8507752418518066, -1.4147844314575195, -0.9787933826446533, -0.5428023338317871, -0.1068124771118164, 0.32917845249176025, 0.7651693820953369, 1.2011603116989136, 1.6371512413024902, 2.0731420516967773, 2.5091331005096436, 2.9451241493225098, 3.381114959716797, 3.817105770111084, 4.253096580505371, 4.689087867736816, 5.1250786781311035, 5.561069488525391, 5.997060775756836, 6.433051586151123, 6.86904239654541, 7.305033206939697, 7.741024017333984, 8.17701530456543, 8.613006591796875, 9.048996925354004, 9.48498821258545, 9.920978546142578, 10.356969833374023, 10.792961120605469, 11.228951454162598, 11.664942741394043, 12.100933074951172, 12.536924362182617, 12.972915649414062, 13.408906936645508, 13.844897270202637]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 10.0, 6.0, 16.0, 23.0, 35.0, 49.0, 81.0, 127.0, 204.0, 339.0, 587.0, 825.0, 1495.0, 2558.0, 4520.0, 7584.0, 14333.0, 26688.0, 52698.0, 104643.0, 190646.0, 247384.0, 185086.0, 100653.0, 50492.0, 25778.0, 13604.0, 7540.0, 4315.0, 2440.0, 1437.0, 915.0, 519.0, 355.0, 230.0, 113.0, 95.0, 47.0, 33.0, 23.0, 11.0, 11.0, 9.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-16.15625, -15.7132568359375, -15.270263671875, -14.8272705078125, -14.38427734375, -13.9412841796875, -13.498291015625, -13.0552978515625, -12.6123046875, -12.1693115234375, -11.726318359375, -11.2833251953125, -10.84033203125, -10.3973388671875, -9.954345703125, -9.5113525390625, -9.068359375, -8.6253662109375, -8.182373046875, -7.7393798828125, -7.29638671875, -6.8533935546875, -6.410400390625, -5.9674072265625, -5.5244140625, -5.0814208984375, -4.638427734375, -4.1954345703125, -3.75244140625, -3.3094482421875, -2.866455078125, -2.4234619140625, -1.98046875, -1.5374755859375, -1.094482421875, -0.6514892578125, -0.20849609375, 0.2344970703125, 0.677490234375, 1.1204833984375, 1.5634765625, 2.0064697265625, 2.449462890625, 2.8924560546875, 3.33544921875, 3.7784423828125, 4.221435546875, 4.6644287109375, 5.107421875, 5.5504150390625, 5.993408203125, 6.4364013671875, 6.87939453125, 7.3223876953125, 7.765380859375, 8.2083740234375, 8.6513671875, 9.0943603515625, 9.537353515625, 9.9803466796875, 10.42333984375, 10.8663330078125, 11.309326171875, 11.7523193359375, 12.1953125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 1.0, 2.0, 6.0, 5.0, 2.0, 7.0, 10.0, 13.0, 13.0, 17.0, 21.0, 19.0, 36.0, 27.0, 26.0, 34.0, 36.0, 37.0, 36.0, 33.0, 34.0, 46.0, 40.0, 35.0, 46.0, 51.0, 34.0, 36.0, 36.0, 32.0, 30.0, 36.0, 17.0, 19.0, 16.0, 11.0, 19.0, 14.0, 14.0, 12.0, 9.0, 9.0, 7.0, 3.0, 1.0, 1.0, 9.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-14.7578125, -14.2823486328125, -13.806884765625, -13.3314208984375, -12.85595703125, -12.3804931640625, -11.905029296875, -11.4295654296875, -10.9541015625, -10.4786376953125, -10.003173828125, -9.5277099609375, -9.05224609375, -8.5767822265625, -8.101318359375, -7.6258544921875, -7.150390625, -6.6749267578125, -6.199462890625, -5.7239990234375, -5.24853515625, -4.7730712890625, -4.297607421875, -3.8221435546875, -3.3466796875, -2.8712158203125, -2.395751953125, -1.9202880859375, -1.44482421875, -0.9693603515625, -0.493896484375, -0.0184326171875, 0.45703125, 0.9324951171875, 1.407958984375, 1.8834228515625, 2.35888671875, 2.8343505859375, 3.309814453125, 3.7852783203125, 4.2607421875, 4.7362060546875, 5.211669921875, 5.6871337890625, 6.16259765625, 6.6380615234375, 7.113525390625, 7.5889892578125, 8.064453125, 8.5399169921875, 9.015380859375, 9.4908447265625, 9.96630859375, 10.4417724609375, 10.917236328125, 11.3927001953125, 11.8681640625, 12.3436279296875, 12.819091796875, 13.2945556640625, 13.77001953125, 14.2454833984375, 14.720947265625, 15.1964111328125, 15.671875]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 7.0, 8.0, 15.0, 11.0, 15.0, 26.0, 27.0, 35.0, 38.0, 71.0, 99.0, 123.0, 210.0, 339.0, 541.0, 828.0, 1374.0, 2215.0, 3796.0, 6884.0, 14047.0, 30600.0, 73998.0, 186090.0, 344090.0, 222220.0, 89602.0, 36524.0, 16248.0, 7875.0, 4122.0, 2400.0, 1442.0, 910.0, 597.0, 351.0, 253.0, 150.0, 106.0, 71.0, 53.0, 38.0, 17.0, 30.0, 20.0, 12.0, 6.0, 11.0, 7.0, 7.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.1875, -18.580322265625, -17.97314453125, -17.365966796875, -16.7587890625, -16.151611328125, -15.54443359375, -14.937255859375, -14.330078125, -13.722900390625, -13.11572265625, -12.508544921875, -11.9013671875, -11.294189453125, -10.68701171875, -10.079833984375, -9.47265625, -8.865478515625, -8.25830078125, -7.651123046875, -7.0439453125, -6.436767578125, -5.82958984375, -5.222412109375, -4.615234375, -4.008056640625, -3.40087890625, -2.793701171875, -2.1865234375, -1.579345703125, -0.97216796875, -0.364990234375, 0.2421875, 0.849365234375, 1.45654296875, 2.063720703125, 2.6708984375, 3.278076171875, 3.88525390625, 4.492431640625, 5.099609375, 5.706787109375, 6.31396484375, 6.921142578125, 7.5283203125, 8.135498046875, 8.74267578125, 9.349853515625, 9.95703125, 10.564208984375, 11.17138671875, 11.778564453125, 12.3857421875, 12.992919921875, 13.60009765625, 14.207275390625, 14.814453125, 15.421630859375, 16.02880859375, 16.635986328125, 17.2431640625, 17.850341796875, 18.45751953125, 19.064697265625, 19.671875]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 6.0, 3.0, 8.0, 3.0, 7.0, 2.0, 8.0, 12.0, 12.0, 19.0, 20.0, 22.0, 24.0, 28.0, 35.0, 29.0, 28.0, 25.0, 28.0, 24.0, 46.0, 46.0, 56.0, 43.0, 38.0, 41.0, 42.0, 34.0, 40.0, 31.0, 28.0, 32.0, 20.0, 22.0, 19.0, 30.0, 15.0, 13.0, 15.0, 6.0, 8.0, 5.0, 7.0, 5.0, 6.0, 5.0, 5.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-8.296875, -8.03662109375, -7.7763671875, -7.51611328125, -7.255859375, -6.99560546875, -6.7353515625, -6.47509765625, -6.21484375, -5.95458984375, -5.6943359375, -5.43408203125, -5.173828125, -4.91357421875, -4.6533203125, -4.39306640625, -4.1328125, -3.87255859375, -3.6123046875, -3.35205078125, -3.091796875, -2.83154296875, -2.5712890625, -2.31103515625, -2.05078125, -1.79052734375, -1.5302734375, -1.27001953125, -1.009765625, -0.74951171875, -0.4892578125, -0.22900390625, 0.03125, 0.29150390625, 0.5517578125, 0.81201171875, 1.072265625, 1.33251953125, 1.5927734375, 1.85302734375, 2.11328125, 2.37353515625, 2.6337890625, 2.89404296875, 3.154296875, 3.41455078125, 3.6748046875, 3.93505859375, 4.1953125, 4.45556640625, 4.7158203125, 4.97607421875, 5.236328125, 5.49658203125, 5.7568359375, 6.01708984375, 6.27734375, 6.53759765625, 6.7978515625, 7.05810546875, 7.318359375, 7.57861328125, 7.8388671875, 8.09912109375, 8.359375]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 3.0, 9.0, 11.0, 11.0, 13.0, 22.0, 31.0, 33.0, 82.0, 111.0, 177.0, 256.0, 369.0, 608.0, 868.0, 1471.0, 2578.0, 4161.0, 7060.0, 12674.0, 23010.0, 43531.0, 86027.0, 171233.0, 273485.0, 202614.0, 103694.0, 52188.0, 27026.0, 14573.0, 8278.0, 4727.0, 2832.0, 1744.0, 1118.0, 676.0, 446.0, 273.0, 178.0, 119.0, 64.0, 65.0, 31.0, 30.0, 10.0, 16.0, 11.0, 3.0, 4.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.4375, -5.2708740234375, -5.104248046875, -4.9376220703125, -4.77099609375, -4.6043701171875, -4.437744140625, -4.2711181640625, -4.1044921875, -3.9378662109375, -3.771240234375, -3.6046142578125, -3.43798828125, -3.2713623046875, -3.104736328125, -2.9381103515625, -2.771484375, -2.6048583984375, -2.438232421875, -2.2716064453125, -2.10498046875, -1.9383544921875, -1.771728515625, -1.6051025390625, -1.4384765625, -1.2718505859375, -1.105224609375, -0.9385986328125, -0.77197265625, -0.6053466796875, -0.438720703125, -0.2720947265625, -0.10546875, 0.0611572265625, 0.227783203125, 0.3944091796875, 0.56103515625, 0.7276611328125, 0.894287109375, 1.0609130859375, 1.2275390625, 1.3941650390625, 1.560791015625, 1.7274169921875, 1.89404296875, 2.0606689453125, 2.227294921875, 2.3939208984375, 2.560546875, 2.7271728515625, 2.893798828125, 3.0604248046875, 3.22705078125, 3.3936767578125, 3.560302734375, 3.7269287109375, 3.8935546875, 4.0601806640625, 4.226806640625, 4.3934326171875, 4.56005859375, 4.7266845703125, 4.893310546875, 5.0599365234375, 5.2265625]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 5.0, 6.0, 12.0, 6.0, 13.0, 11.0, 10.0, 18.0, 26.0, 30.0, 26.0, 48.0, 46.0, 40.0, 46.0, 54.0, 71.0, 65.0, 57.0, 72.0, 48.0, 52.0, 36.0, 38.0, 30.0, 25.0, 21.0, 16.0, 14.0, 16.0, 7.0, 10.0, 4.0, 5.0, 2.0, 4.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00027680397033691406, -0.0002676956355571747, -0.0002585873007774353, -0.0002494789659976959, -0.00024037063121795654, -0.00023126229643821716, -0.00022215396165847778, -0.0002130456268787384, -0.00020393729209899902, -0.00019482895731925964, -0.00018572062253952026, -0.00017661228775978088, -0.0001675039529800415, -0.00015839561820030212, -0.00014928728342056274, -0.00014017894864082336, -0.00013107061386108398, -0.0001219622790813446, -0.00011285394430160522, -0.00010374560952186584, -9.463727474212646e-05, -8.552893996238708e-05, -7.64206051826477e-05, -6.731227040290833e-05, -5.8203935623168945e-05, -4.9095600843429565e-05, -3.9987266063690186e-05, -3.0878931283950806e-05, -2.1770596504211426e-05, -1.2662261724472046e-05, -3.553926944732666e-06, 5.554407835006714e-06, 1.4662742614746094e-05, 2.3771077394485474e-05, 3.2879412174224854e-05, 4.1987746953964233e-05, 5.109608173370361e-05, 6.020441651344299e-05, 6.931275129318237e-05, 7.842108607292175e-05, 8.752942085266113e-05, 9.663775563240051e-05, 0.00010574609041213989, 0.00011485442519187927, 0.00012396275997161865, 0.00013307109475135803, 0.0001421794295310974, 0.0001512877643108368, 0.00016039609909057617, 0.00016950443387031555, 0.00017861276865005493, 0.0001877211034297943, 0.0001968294382095337, 0.00020593777298927307, 0.00021504610776901245, 0.00022415444254875183, 0.0002332627773284912, 0.0002423711121082306, 0.00025147944688796997, 0.00026058778166770935, 0.00026969611644744873, 0.0002788044512271881, 0.0002879127860069275, 0.00029702112078666687, 0.00030612945556640625]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 6.0, 7.0, 1.0, 9.0, 24.0, 16.0, 44.0, 80.0, 126.0, 236.0, 412.0, 808.0, 1670.0, 3316.0, 7120.0, 15501.0, 34388.0, 78449.0, 167563.0, 273607.0, 237387.0, 125439.0, 55956.0, 24580.0, 11373.0, 5334.0, 2571.0, 1233.0, 575.0, 320.0, 165.0, 96.0, 46.0, 31.0, 19.0, 11.0, 13.0, 8.0, 2.0, 6.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.41015625, -6.20855712890625, -6.0069580078125, -5.80535888671875, -5.603759765625, -5.40216064453125, -5.2005615234375, -4.99896240234375, -4.79736328125, -4.59576416015625, -4.3941650390625, -4.19256591796875, -3.990966796875, -3.78936767578125, -3.5877685546875, -3.38616943359375, -3.1845703125, -2.98297119140625, -2.7813720703125, -2.57977294921875, -2.378173828125, -2.17657470703125, -1.9749755859375, -1.77337646484375, -1.57177734375, -1.37017822265625, -1.1685791015625, -0.96697998046875, -0.765380859375, -0.56378173828125, -0.3621826171875, -0.16058349609375, 0.041015625, 0.24261474609375, 0.4442138671875, 0.64581298828125, 0.847412109375, 1.04901123046875, 1.2506103515625, 1.45220947265625, 1.65380859375, 1.85540771484375, 2.0570068359375, 2.25860595703125, 2.460205078125, 2.66180419921875, 2.8634033203125, 3.06500244140625, 3.2666015625, 3.46820068359375, 3.6697998046875, 3.87139892578125, 4.072998046875, 4.27459716796875, 4.4761962890625, 4.67779541015625, 4.87939453125, 5.08099365234375, 5.2825927734375, 5.48419189453125, 5.685791015625, 5.88739013671875, 6.0889892578125, 6.29058837890625, 6.4921875]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 4.0, 14.0, 2.0, 17.0, 13.0, 18.0, 23.0, 28.0, 31.0, 48.0, 47.0, 68.0, 62.0, 87.0, 76.0, 76.0, 65.0, 64.0, 67.0, 37.0, 33.0, 36.0, 25.0, 18.0, 19.0, 12.0, 6.0, 4.0, 4.0, 1.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2099609375, -1.1562957763671875, -1.102630615234375, -1.0489654541015625, -0.99530029296875, -0.9416351318359375, -0.887969970703125, -0.8343048095703125, -0.7806396484375, -0.7269744873046875, -0.673309326171875, -0.6196441650390625, -0.56597900390625, -0.5123138427734375, -0.458648681640625, -0.4049835205078125, -0.351318359375, -0.2976531982421875, -0.243988037109375, -0.1903228759765625, -0.13665771484375, -0.0829925537109375, -0.029327392578125, 0.0243377685546875, 0.0780029296875, 0.1316680908203125, 0.185333251953125, 0.2389984130859375, 0.29266357421875, 0.3463287353515625, 0.399993896484375, 0.4536590576171875, 0.50732421875, 0.5609893798828125, 0.614654541015625, 0.6683197021484375, 0.72198486328125, 0.7756500244140625, 0.829315185546875, 0.8829803466796875, 0.9366455078125, 0.9903106689453125, 1.043975830078125, 1.0976409912109375, 1.15130615234375, 1.2049713134765625, 1.258636474609375, 1.3123016357421875, 1.365966796875, 1.4196319580078125, 1.473297119140625, 1.5269622802734375, 1.58062744140625, 1.6342926025390625, 1.687957763671875, 1.7416229248046875, 1.7952880859375, 1.8489532470703125, 1.902618408203125, 1.9562835693359375, 2.00994873046875, 2.0636138916015625, 2.117279052734375, 2.1709442138671875, 2.224609375]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 2.0, 3.0, 7.0, 9.0, 5.0, 9.0, 8.0, 24.0, 18.0, 26.0, 37.0, 40.0, 64.0, 52.0, 76.0, 60.0, 79.0, 69.0, 74.0, 59.0, 50.0, 42.0, 45.0, 36.0, 30.0, 15.0, 20.0, 13.0, 10.0, 2.0, 7.0, 4.0, 5.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-25.163774490356445, -24.45777702331543, -23.75177764892578, -23.045780181884766, -22.33978271484375, -21.633785247802734, -20.92778778076172, -20.22178840637207, -19.515790939331055, -18.80979347229004, -18.10379409790039, -17.397796630859375, -16.69179916381836, -15.985801696777344, -15.279803276062012, -14.57380485534668, -13.867807388305664, -13.161809921264648, -12.455811500549316, -11.749813079833984, -11.043815612792969, -10.337818145751953, -9.631819725036621, -8.925821304321289, -8.219823837280273, -7.5138258934021, -6.807827949523926, -6.101830005645752, -5.395832061767578, -4.689834117889404, -3.9838361740112305, -3.2778382301330566, -2.571840286254883, -1.865842342376709, -1.1598443984985352, -0.45384645462036133, 0.2521514892578125, 0.9581494331359863, 1.6641473770141602, 2.370145320892334, 3.076143264770508, 3.7821412086486816, 4.4881391525268555, 5.194137096405029, 5.900135040283203, 6.606132984161377, 7.312130928039551, 8.018129348754883, 8.724126815795898, 9.430124282836914, 10.136122703552246, 10.842121124267578, 11.548118591308594, 12.25411605834961, 12.960114479064941, 13.666112899780273, 14.372110366821289, 15.078107833862305, 15.784106254577637, 16.49010467529297, 17.196102142333984, 17.902099609375, 18.608097076416016, 19.314096450805664, 20.02009391784668]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 2.0, 2.0, 3.0, 5.0, 1.0, 8.0, 10.0, 5.0, 11.0, 13.0, 18.0, 18.0, 18.0, 23.0, 27.0, 39.0, 38.0, 23.0, 37.0, 43.0, 34.0, 29.0, 36.0, 23.0, 53.0, 29.0, 47.0, 50.0, 33.0, 31.0, 32.0, 36.0, 32.0, 28.0, 19.0, 15.0, 17.0, 13.0, 17.0, 16.0, 15.0, 5.0, 13.0, 8.0, 7.0, 4.0, 5.0, 2.0, 5.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-13.621931076049805, -13.190160751342773, -12.758390426635742, -12.326620101928711, -11.89484977722168, -11.463079452514648, -11.031309127807617, -10.599538803100586, -10.167768478393555, -9.735998153686523, -9.304227828979492, -8.872457504272461, -8.44068717956543, -8.008916854858398, -7.577147006988525, -7.145376682281494, -6.713606834411621, -6.28183650970459, -5.850066184997559, -5.418295860290527, -4.986525535583496, -4.554755210876465, -4.122985363006592, -3.6912150382995605, -3.2594447135925293, -2.827674388885498, -2.395904064178467, -1.9641339778900146, -1.5323636531829834, -1.1005933284759521, -0.6688232421875, -0.23705291748046875, 0.1947164535522461, 0.6264867186546326, 1.058256983757019, 1.4900271892547607, 1.921797513961792, 2.3535678386688232, 2.7853379249572754, 3.2171082496643066, 3.648878574371338, 4.080648899078369, 4.5124192237854, 4.944189071655273, 5.375959396362305, 5.807729721069336, 6.239500045776367, 6.671270370483398, 7.10304069519043, 7.534811019897461, 7.966581344604492, 8.398351669311523, 8.830121994018555, 9.261892318725586, 9.693662643432617, 10.125432968139648, 10.55720329284668, 10.988973617553711, 11.420743942260742, 11.852514266967773, 12.284284591674805, 12.716054916381836, 13.147825241088867, 13.579595565795898, 14.011364936828613]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 6.0, 8.0, 11.0, 15.0, 28.0, 38.0, 69.0, 102.0, 134.0, 249.0, 398.0, 612.0, 1052.0, 1662.0, 2864.0, 4796.0, 7838.0, 13628.0, 24020.0, 42188.0, 74492.0, 124950.0, 181463.0, 195827.0, 151193.0, 93339.0, 54378.0, 30750.0, 17430.0, 10080.0, 5987.0, 3579.0, 2042.0, 1277.0, 746.0, 461.0, 316.0, 190.0, 117.0, 84.0, 49.0, 37.0, 23.0, 16.0, 7.0, 6.0, 2.0, 6.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.625, -17.987548828125, -17.35009765625, -16.712646484375, -16.0751953125, -15.437744140625, -14.80029296875, -14.162841796875, -13.525390625, -12.887939453125, -12.25048828125, -11.613037109375, -10.9755859375, -10.338134765625, -9.70068359375, -9.063232421875, -8.42578125, -7.788330078125, -7.15087890625, -6.513427734375, -5.8759765625, -5.238525390625, -4.60107421875, -3.963623046875, -3.326171875, -2.688720703125, -2.05126953125, -1.413818359375, -0.7763671875, -0.138916015625, 0.49853515625, 1.135986328125, 1.7734375, 2.410888671875, 3.04833984375, 3.685791015625, 4.3232421875, 4.960693359375, 5.59814453125, 6.235595703125, 6.873046875, 7.510498046875, 8.14794921875, 8.785400390625, 9.4228515625, 10.060302734375, 10.69775390625, 11.335205078125, 11.97265625, 12.610107421875, 13.24755859375, 13.885009765625, 14.5224609375, 15.159912109375, 15.79736328125, 16.434814453125, 17.072265625, 17.709716796875, 18.34716796875, 18.984619140625, 19.6220703125, 20.259521484375, 20.89697265625, 21.534423828125, 22.171875]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 3.0, 6.0, 4.0, 6.0, 3.0, 12.0, 9.0, 9.0, 19.0, 20.0, 26.0, 16.0, 33.0, 34.0, 38.0, 36.0, 36.0, 37.0, 35.0, 37.0, 45.0, 39.0, 46.0, 58.0, 30.0, 40.0, 31.0, 36.0, 34.0, 22.0, 29.0, 28.0, 22.0, 17.0, 16.0, 16.0, 15.0, 16.0, 7.0, 9.0, 9.0, 2.0, 4.0, 6.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-14.5546875, -14.083984375, -13.61328125, -13.142578125, -12.671875, -12.201171875, -11.73046875, -11.259765625, -10.7890625, -10.318359375, -9.84765625, -9.376953125, -8.90625, -8.435546875, -7.96484375, -7.494140625, -7.0234375, -6.552734375, -6.08203125, -5.611328125, -5.140625, -4.669921875, -4.19921875, -3.728515625, -3.2578125, -2.787109375, -2.31640625, -1.845703125, -1.375, -0.904296875, -0.43359375, 0.037109375, 0.5078125, 0.978515625, 1.44921875, 1.919921875, 2.390625, 2.861328125, 3.33203125, 3.802734375, 4.2734375, 4.744140625, 5.21484375, 5.685546875, 6.15625, 6.626953125, 7.09765625, 7.568359375, 8.0390625, 8.509765625, 8.98046875, 9.451171875, 9.921875, 10.392578125, 10.86328125, 11.333984375, 11.8046875, 12.275390625, 12.74609375, 13.216796875, 13.6875, 14.158203125, 14.62890625, 15.099609375, 15.5703125]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 5.0, 6.0, 8.0, 14.0, 18.0, 28.0, 58.0, 63.0, 87.0, 156.0, 224.0, 287.0, 492.0, 725.0, 998.0, 1591.0, 2453.0, 3868.0, 5961.0, 9448.0, 15193.0, 24339.0, 38675.0, 60967.0, 91595.0, 126402.0, 150982.0, 149699.0, 122074.0, 86751.0, 56850.0, 36261.0, 23166.0, 14225.0, 8953.0, 5636.0, 3586.0, 2346.0, 1450.0, 941.0, 652.0, 426.0, 326.0, 197.0, 110.0, 84.0, 55.0, 33.0, 29.0, 24.0, 12.0, 11.0, 10.0, 6.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0], "bins": [-14.2265625, -13.7666015625, -13.306640625, -12.8466796875, -12.38671875, -11.9267578125, -11.466796875, -11.0068359375, -10.546875, -10.0869140625, -9.626953125, -9.1669921875, -8.70703125, -8.2470703125, -7.787109375, -7.3271484375, -6.8671875, -6.4072265625, -5.947265625, -5.4873046875, -5.02734375, -4.5673828125, -4.107421875, -3.6474609375, -3.1875, -2.7275390625, -2.267578125, -1.8076171875, -1.34765625, -0.8876953125, -0.427734375, 0.0322265625, 0.4921875, 0.9521484375, 1.412109375, 1.8720703125, 2.33203125, 2.7919921875, 3.251953125, 3.7119140625, 4.171875, 4.6318359375, 5.091796875, 5.5517578125, 6.01171875, 6.4716796875, 6.931640625, 7.3916015625, 7.8515625, 8.3115234375, 8.771484375, 9.2314453125, 9.69140625, 10.1513671875, 10.611328125, 11.0712890625, 11.53125, 11.9912109375, 12.451171875, 12.9111328125, 13.37109375, 13.8310546875, 14.291015625, 14.7509765625, 15.2109375]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 4.0, 8.0, 6.0, 3.0, 5.0, 5.0, 7.0, 11.0, 12.0, 15.0, 22.0, 19.0, 19.0, 23.0, 38.0, 29.0, 25.0, 25.0, 31.0, 39.0, 44.0, 39.0, 39.0, 42.0, 45.0, 39.0, 34.0, 39.0, 35.0, 36.0, 32.0, 23.0, 32.0, 19.0, 13.0, 30.0, 23.0, 13.0, 16.0, 11.0, 15.0, 8.0, 7.0, 7.0, 3.0, 4.0, 5.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-8.2578125, -7.9957275390625, -7.733642578125, -7.4715576171875, -7.20947265625, -6.9473876953125, -6.685302734375, -6.4232177734375, -6.1611328125, -5.8990478515625, -5.636962890625, -5.3748779296875, -5.11279296875, -4.8507080078125, -4.588623046875, -4.3265380859375, -4.064453125, -3.8023681640625, -3.540283203125, -3.2781982421875, -3.01611328125, -2.7540283203125, -2.491943359375, -2.2298583984375, -1.9677734375, -1.7056884765625, -1.443603515625, -1.1815185546875, -0.91943359375, -0.6573486328125, -0.395263671875, -0.1331787109375, 0.12890625, 0.3909912109375, 0.653076171875, 0.9151611328125, 1.17724609375, 1.4393310546875, 1.701416015625, 1.9635009765625, 2.2255859375, 2.4876708984375, 2.749755859375, 3.0118408203125, 3.27392578125, 3.5360107421875, 3.798095703125, 4.0601806640625, 4.322265625, 4.5843505859375, 4.846435546875, 5.1085205078125, 5.37060546875, 5.6326904296875, 5.894775390625, 6.1568603515625, 6.4189453125, 6.6810302734375, 6.943115234375, 7.2052001953125, 7.46728515625, 7.7293701171875, 7.991455078125, 8.2535400390625, 8.515625]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 5.0, 11.0, 14.0, 15.0, 15.0, 29.0, 46.0, 62.0, 83.0, 129.0, 166.0, 241.0, 343.0, 521.0, 802.0, 1304.0, 1992.0, 3377.0, 5511.0, 9448.0, 18005.0, 35975.0, 76022.0, 163394.0, 274350.0, 229353.0, 115912.0, 53044.0, 25814.0, 13461.0, 7388.0, 4330.0, 2559.0, 1626.0, 1073.0, 737.0, 455.0, 291.0, 192.0, 128.0, 108.0, 73.0, 49.0, 23.0, 28.0, 17.0, 8.0, 11.0, 6.0, 6.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0], "bins": [-14.8203125, -14.3680419921875, -13.915771484375, -13.4635009765625, -13.01123046875, -12.5589599609375, -12.106689453125, -11.6544189453125, -11.2021484375, -10.7498779296875, -10.297607421875, -9.8453369140625, -9.39306640625, -8.9407958984375, -8.488525390625, -8.0362548828125, -7.583984375, -7.1317138671875, -6.679443359375, -6.2271728515625, -5.77490234375, -5.3226318359375, -4.870361328125, -4.4180908203125, -3.9658203125, -3.5135498046875, -3.061279296875, -2.6090087890625, -2.15673828125, -1.7044677734375, -1.252197265625, -0.7999267578125, -0.34765625, 0.1046142578125, 0.556884765625, 1.0091552734375, 1.46142578125, 1.9136962890625, 2.365966796875, 2.8182373046875, 3.2705078125, 3.7227783203125, 4.175048828125, 4.6273193359375, 5.07958984375, 5.5318603515625, 5.984130859375, 6.4364013671875, 6.888671875, 7.3409423828125, 7.793212890625, 8.2454833984375, 8.69775390625, 9.1500244140625, 9.602294921875, 10.0545654296875, 10.5068359375, 10.9591064453125, 11.411376953125, 11.8636474609375, 12.31591796875, 12.7681884765625, 13.220458984375, 13.6727294921875, 14.125]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 6.0, 2.0, 5.0, 1.0, 1.0, 5.0, 5.0, 16.0, 8.0, 16.0, 13.0, 44.0, 40.0, 71.0, 71.0, 80.0, 86.0, 108.0, 93.0, 78.0, 59.0, 53.0, 27.0, 27.0, 33.0, 15.0, 10.0, 7.0, 11.0, 0.0, 5.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013074874877929688, -0.0012574195861816406, -0.0012073516845703125, -0.0011572837829589844, -0.0011072158813476562, -0.0010571479797363281, -0.001007080078125, -0.0009570121765136719, -0.0009069442749023438, -0.0008568763732910156, -0.0008068084716796875, -0.0007567405700683594, -0.0007066726684570312, -0.0006566047668457031, -0.000606536865234375, -0.0005564689636230469, -0.0005064010620117188, -0.0004563331604003906, -0.0004062652587890625, -0.0003561973571777344, -0.00030612945556640625, -0.0002560615539550781, -0.00020599365234375, -0.00015592575073242188, -0.00010585784912109375, -5.5789947509765625e-05, -5.7220458984375e-06, 4.4345855712890625e-05, 9.441375732421875e-05, 0.00014448165893554688, 0.000194549560546875, 0.0002446174621582031, 0.00029468536376953125, 0.0003447532653808594, 0.0003948211669921875, 0.0004448890686035156, 0.0004949569702148438, 0.0005450248718261719, 0.0005950927734375, 0.0006451606750488281, 0.0006952285766601562, 0.0007452964782714844, 0.0007953643798828125, 0.0008454322814941406, 0.0008955001831054688, 0.0009455680847167969, 0.000995635986328125, 0.0010457038879394531, 0.0010957717895507812, 0.0011458396911621094, 0.0011959075927734375, 0.0012459754943847656, 0.0012960433959960938, 0.0013461112976074219, 0.00139617919921875, 0.0014462471008300781, 0.0014963150024414062, 0.0015463829040527344, 0.0015964508056640625, 0.0016465187072753906, 0.0016965866088867188, 0.0017466545104980469, 0.001796722412109375, 0.0018467903137207031, 0.0018968582153320312]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 6.0, 5.0, 5.0, 7.0, 9.0, 21.0, 27.0, 17.0, 35.0, 46.0, 74.0, 82.0, 95.0, 144.0, 223.0, 290.0, 427.0, 580.0, 951.0, 1438.0, 2405.0, 4330.0, 8064.0, 16655.0, 37467.0, 94818.0, 240690.0, 336052.0, 178423.0, 68487.0, 28148.0, 12760.0, 6398.0, 3497.0, 2058.0, 1188.0, 807.0, 530.0, 334.0, 268.0, 199.0, 138.0, 99.0, 75.0, 55.0, 22.0, 30.0, 16.0, 22.0, 15.0, 11.0, 10.0, 7.0, 3.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-17.140625, -16.575439453125, -16.01025390625, -15.445068359375, -14.8798828125, -14.314697265625, -13.74951171875, -13.184326171875, -12.619140625, -12.053955078125, -11.48876953125, -10.923583984375, -10.3583984375, -9.793212890625, -9.22802734375, -8.662841796875, -8.09765625, -7.532470703125, -6.96728515625, -6.402099609375, -5.8369140625, -5.271728515625, -4.70654296875, -4.141357421875, -3.576171875, -3.010986328125, -2.44580078125, -1.880615234375, -1.3154296875, -0.750244140625, -0.18505859375, 0.380126953125, 0.9453125, 1.510498046875, 2.07568359375, 2.640869140625, 3.2060546875, 3.771240234375, 4.33642578125, 4.901611328125, 5.466796875, 6.031982421875, 6.59716796875, 7.162353515625, 7.7275390625, 8.292724609375, 8.85791015625, 9.423095703125, 9.98828125, 10.553466796875, 11.11865234375, 11.683837890625, 12.2490234375, 12.814208984375, 13.37939453125, 13.944580078125, 14.509765625, 15.074951171875, 15.64013671875, 16.205322265625, 16.7705078125, 17.335693359375, 17.90087890625, 18.466064453125, 19.03125]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 3.0, 6.0, 9.0, 5.0, 16.0, 20.0, 29.0, 26.0, 39.0, 22.0, 39.0, 59.0, 63.0, 73.0, 72.0, 93.0, 71.0, 69.0, 63.0, 54.0, 37.0, 33.0, 20.0, 16.0, 16.0, 11.0, 8.0, 9.0, 8.0, 5.0, 2.0, 4.0, 0.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.140625, -4.00274658203125, -3.8648681640625, -3.72698974609375, -3.589111328125, -3.45123291015625, -3.3133544921875, -3.17547607421875, -3.03759765625, -2.89971923828125, -2.7618408203125, -2.62396240234375, -2.486083984375, -2.34820556640625, -2.2103271484375, -2.07244873046875, -1.9345703125, -1.79669189453125, -1.6588134765625, -1.52093505859375, -1.383056640625, -1.24517822265625, -1.1072998046875, -0.96942138671875, -0.83154296875, -0.69366455078125, -0.5557861328125, -0.41790771484375, -0.280029296875, -0.14215087890625, -0.0042724609375, 0.13360595703125, 0.271484375, 0.40936279296875, 0.5472412109375, 0.68511962890625, 0.822998046875, 0.96087646484375, 1.0987548828125, 1.23663330078125, 1.37451171875, 1.51239013671875, 1.6502685546875, 1.78814697265625, 1.926025390625, 2.06390380859375, 2.2017822265625, 2.33966064453125, 2.4775390625, 2.61541748046875, 2.7532958984375, 2.89117431640625, 3.029052734375, 3.16693115234375, 3.3048095703125, 3.44268798828125, 3.58056640625, 3.71844482421875, 3.8563232421875, 3.99420166015625, 4.132080078125, 4.26995849609375, 4.4078369140625, 4.54571533203125, 4.68359375]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 9.0, 7.0, 12.0, 10.0, 20.0, 25.0, 32.0, 34.0, 41.0, 45.0, 46.0, 64.0, 73.0, 90.0, 60.0, 72.0, 58.0, 58.0, 61.0, 39.0, 33.0, 25.0, 21.0, 19.0, 9.0, 9.0, 5.0, 7.0, 4.0, 3.0, 2.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.214067459106445, -25.52163314819336, -24.82919692993164, -24.136760711669922, -23.444326400756836, -22.75189208984375, -22.05945587158203, -21.367019653320312, -20.674585342407227, -19.98215103149414, -19.289714813232422, -18.597278594970703, -17.904844284057617, -17.21240997314453, -16.519973754882812, -15.82753849029541, -15.135103225708008, -14.442667961120605, -13.750232696533203, -13.0577974319458, -12.365362167358398, -11.672926902770996, -10.980491638183594, -10.288056373596191, -9.595621109008789, -8.903185844421387, -8.210750579833984, -7.518315315246582, -6.82588005065918, -6.133444786071777, -5.441009521484375, -4.748574256896973, -4.05613899230957, -3.363703727722168, -2.6712684631347656, -1.9788331985473633, -1.286397933959961, -0.5939626693725586, 0.09847259521484375, 0.7909078598022461, 1.4833431243896484, 2.175778388977051, 2.868213653564453, 3.5606489181518555, 4.253084182739258, 4.94551944732666, 5.6379547119140625, 6.330389976501465, 7.022825241088867, 7.7152605056762695, 8.407695770263672, 9.100131034851074, 9.792566299438477, 10.485001564025879, 11.177436828613281, 11.869872093200684, 12.562307357788086, 13.254742622375488, 13.94717788696289, 14.639613151550293, 15.332048416137695, 16.02448272705078, 16.7169189453125, 17.40935516357422, 18.101789474487305]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 2.0, 5.0, 3.0, 6.0, 3.0, 7.0, 10.0, 7.0, 13.0, 9.0, 9.0, 17.0, 29.0, 16.0, 11.0, 27.0, 33.0, 27.0, 30.0, 30.0, 28.0, 35.0, 39.0, 38.0, 29.0, 37.0, 30.0, 38.0, 39.0, 38.0, 34.0, 36.0, 32.0, 24.0, 27.0, 28.0, 28.0, 14.0, 13.0, 17.0, 13.0, 7.0, 12.0, 10.0, 17.0, 12.0, 7.0, 9.0, 7.0, 3.0, 3.0, 1.0, 5.0, 3.0, 5.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-12.033554077148438, -11.64134407043457, -11.249134063720703, -10.856924057006836, -10.464715003967285, -10.072504997253418, -9.68029499053955, -9.288084983825684, -8.895875930786133, -8.503665924072266, -8.111455917358398, -7.7192463874816895, -7.3270368576049805, -6.934826850891113, -6.542616844177246, -6.150406837463379, -5.758196830749512, -5.3659868240356445, -4.9737772941589355, -4.581567287445068, -4.189357757568359, -3.797147750854492, -3.404937744140625, -3.012727975845337, -2.620518207550049, -2.2283084392547607, -1.836098551750183, -1.4438886642456055, -1.0516788959503174, -0.6594691276550293, -0.2672591209411621, 0.12495064735412598, 0.5171594619750977, 0.9093692898750305, 1.3015791177749634, 1.693789005279541, 2.085998773574829, 2.478208541870117, 2.8704185485839844, 3.2626283168792725, 3.6548380851745605, 4.047048091888428, 4.439257621765137, 4.831467628479004, 5.223677635192871, 5.61588716506958, 6.008097171783447, 6.400306701660156, 6.792516708374023, 7.184726715087891, 7.5769362449646, 7.969146251678467, 8.361355781555176, 8.753565788269043, 9.14577579498291, 9.537985801696777, 9.930194854736328, 10.322404861450195, 10.714614868164062, 11.10682487487793, 11.49903392791748, 11.891243934631348, 12.283453941345215, 12.675663948059082, 13.06787395477295]}, "gradients/decoder.bert.encoder.layer.15.output.dense.weight": {"_type": "histogram", "values": [3.0, 4.0, 1.0, 3.0, 3.0, 4.0, 3.0, 12.0, 11.0, 14.0, 22.0, 32.0, 49.0, 57.0, 83.0, 125.0, 151.0, 234.0, 329.0, 519.0, 772.0, 1212.0, 1940.0, 3078.0, 5179.0, 8514.0, 15172.0, 28021.0, 55532.0, 119509.0, 288329.0, 731860.0, 1286022.0, 953670.0, 389978.0, 153838.0, 69258.0, 34394.0, 18656.0, 10480.0, 6281.0, 3786.0, 2383.0, 1505.0, 1082.0, 665.0, 450.0, 315.0, 209.0, 153.0, 114.0, 80.0, 49.0, 38.0, 32.0, 26.0, 19.0, 14.0, 14.0, 5.0, 2.0, 3.0, 3.0, 3.0], "bins": [-20.84375, -20.20556640625, -19.5673828125, -18.92919921875, -18.291015625, -17.65283203125, -17.0146484375, -16.37646484375, -15.73828125, -15.10009765625, -14.4619140625, -13.82373046875, -13.185546875, -12.54736328125, -11.9091796875, -11.27099609375, -10.6328125, -9.99462890625, -9.3564453125, -8.71826171875, -8.080078125, -7.44189453125, -6.8037109375, -6.16552734375, -5.52734375, -4.88916015625, -4.2509765625, -3.61279296875, -2.974609375, -2.33642578125, -1.6982421875, -1.06005859375, -0.421875, 0.21630859375, 0.8544921875, 1.49267578125, 2.130859375, 2.76904296875, 3.4072265625, 4.04541015625, 4.68359375, 5.32177734375, 5.9599609375, 6.59814453125, 7.236328125, 7.87451171875, 8.5126953125, 9.15087890625, 9.7890625, 10.42724609375, 11.0654296875, 11.70361328125, 12.341796875, 12.97998046875, 13.6181640625, 14.25634765625, 14.89453125, 15.53271484375, 16.1708984375, 16.80908203125, 17.447265625, 18.08544921875, 18.7236328125, 19.36181640625, 20.0]}, "gradients/decoder.bert.encoder.layer.15.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 6.0, 4.0, 3.0, 4.0, 6.0, 5.0, 5.0, 12.0, 11.0, 14.0, 14.0, 21.0, 17.0, 23.0, 30.0, 34.0, 27.0, 27.0, 35.0, 39.0, 35.0, 27.0, 35.0, 35.0, 47.0, 31.0, 40.0, 38.0, 40.0, 26.0, 39.0, 39.0, 29.0, 29.0, 26.0, 15.0, 15.0, 17.0, 16.0, 12.0, 13.0, 10.0, 16.0, 11.0, 2.0, 6.0, 6.0, 4.0, 9.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.7734375, -8.4896240234375, -8.205810546875, -7.9219970703125, -7.63818359375, -7.3543701171875, -7.070556640625, -6.7867431640625, -6.5029296875, -6.2191162109375, -5.935302734375, -5.6514892578125, -5.36767578125, -5.0838623046875, -4.800048828125, -4.5162353515625, -4.232421875, -3.9486083984375, -3.664794921875, -3.3809814453125, -3.09716796875, -2.8133544921875, -2.529541015625, -2.2457275390625, -1.9619140625, -1.6781005859375, -1.394287109375, -1.1104736328125, -0.82666015625, -0.5428466796875, -0.259033203125, 0.0247802734375, 0.30859375, 0.5924072265625, 0.876220703125, 1.1600341796875, 1.44384765625, 1.7276611328125, 2.011474609375, 2.2952880859375, 2.5791015625, 2.8629150390625, 3.146728515625, 3.4305419921875, 3.71435546875, 3.9981689453125, 4.281982421875, 4.5657958984375, 4.849609375, 5.1334228515625, 5.417236328125, 5.7010498046875, 5.98486328125, 6.2686767578125, 6.552490234375, 6.8363037109375, 7.1201171875, 7.4039306640625, 7.687744140625, 7.9715576171875, 8.25537109375, 8.5391845703125, 8.822998046875, 9.1068115234375, 9.390625]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 1.0, 1.0, 12.0, 22.0, 27.0, 29.0, 49.0, 75.0, 85.0, 135.0, 204.0, 334.0, 489.0, 739.0, 1194.0, 1783.0, 3094.0, 5148.0, 9200.0, 16625.0, 31681.0, 63107.0, 135113.0, 303634.0, 692123.0, 1201549.0, 930093.0, 430343.0, 188741.0, 86506.0, 42134.0, 21741.0, 11851.0, 6508.0, 3752.0, 2309.0, 1383.0, 862.0, 545.0, 373.0, 248.0, 146.0, 106.0, 55.0, 52.0, 31.0, 25.0, 17.0, 7.0, 5.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.390625, -19.74755859375, -19.1044921875, -18.46142578125, -17.818359375, -17.17529296875, -16.5322265625, -15.88916015625, -15.24609375, -14.60302734375, -13.9599609375, -13.31689453125, -12.673828125, -12.03076171875, -11.3876953125, -10.74462890625, -10.1015625, -9.45849609375, -8.8154296875, -8.17236328125, -7.529296875, -6.88623046875, -6.2431640625, -5.60009765625, -4.95703125, -4.31396484375, -3.6708984375, -3.02783203125, -2.384765625, -1.74169921875, -1.0986328125, -0.45556640625, 0.1875, 0.83056640625, 1.4736328125, 2.11669921875, 2.759765625, 3.40283203125, 4.0458984375, 4.68896484375, 5.33203125, 5.97509765625, 6.6181640625, 7.26123046875, 7.904296875, 8.54736328125, 9.1904296875, 9.83349609375, 10.4765625, 11.11962890625, 11.7626953125, 12.40576171875, 13.048828125, 13.69189453125, 14.3349609375, 14.97802734375, 15.62109375, 16.26416015625, 16.9072265625, 17.55029296875, 18.193359375, 18.83642578125, 19.4794921875, 20.12255859375, 20.765625]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 5.0, 6.0, 3.0, 5.0, 5.0, 4.0, 10.0, 2.0, 10.0, 12.0, 20.0, 17.0, 20.0, 33.0, 54.0, 54.0, 72.0, 89.0, 128.0, 132.0, 173.0, 215.0, 270.0, 301.0, 337.0, 309.0, 316.0, 238.0, 222.0, 193.0, 194.0, 131.0, 106.0, 98.0, 79.0, 50.0, 38.0, 31.0, 22.0, 25.0, 16.0, 11.0, 10.0, 5.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.390625, -6.1982421875, -6.005859375, -5.8134765625, -5.62109375, -5.4287109375, -5.236328125, -5.0439453125, -4.8515625, -4.6591796875, -4.466796875, -4.2744140625, -4.08203125, -3.8896484375, -3.697265625, -3.5048828125, -3.3125, -3.1201171875, -2.927734375, -2.7353515625, -2.54296875, -2.3505859375, -2.158203125, -1.9658203125, -1.7734375, -1.5810546875, -1.388671875, -1.1962890625, -1.00390625, -0.8115234375, -0.619140625, -0.4267578125, -0.234375, -0.0419921875, 0.150390625, 0.3427734375, 0.53515625, 0.7275390625, 0.919921875, 1.1123046875, 1.3046875, 1.4970703125, 1.689453125, 1.8818359375, 2.07421875, 2.2666015625, 2.458984375, 2.6513671875, 2.84375, 3.0361328125, 3.228515625, 3.4208984375, 3.61328125, 3.8056640625, 3.998046875, 4.1904296875, 4.3828125, 4.5751953125, 4.767578125, 4.9599609375, 5.15234375, 5.3447265625, 5.537109375, 5.7294921875, 5.921875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 2.0, 4.0, 6.0, 5.0, 6.0, 13.0, 14.0, 8.0, 20.0, 26.0, 33.0, 36.0, 42.0, 51.0, 62.0, 79.0, 89.0, 78.0, 70.0, 73.0, 55.0, 43.0, 42.0, 35.0, 18.0, 15.0, 22.0, 18.0, 9.0, 14.0, 6.0, 3.0, 2.0, 6.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-27.06292724609375, -26.371339797973633, -25.679750442504883, -24.988162994384766, -24.29657554626465, -23.60498809814453, -22.91339874267578, -22.221811294555664, -21.530223846435547, -20.83863639831543, -20.14704704284668, -19.455459594726562, -18.763872146606445, -18.072284698486328, -17.380695343017578, -16.68910789489746, -15.997518539428711, -15.305930137634277, -14.61434268951416, -13.922754287719727, -13.23116683959961, -12.539578437805176, -11.847990036010742, -11.156402587890625, -10.464814186096191, -9.773225784301758, -9.08163833618164, -8.390049934387207, -7.698462009429932, -7.006874084472656, -6.315285682678223, -5.623697757720947, -4.932111740112305, -4.240523815155029, -3.548935651779175, -2.8573474884033203, -2.165759563446045, -1.4741716384887695, -0.7825832366943359, -0.09099531173706055, 0.6005926132202148, 1.2921806573867798, 1.9837687015533447, 2.675356864929199, 3.3669447898864746, 4.05853271484375, 4.750121116638184, 5.441709041595459, 6.133296966552734, 6.82488489151001, 7.516472816467285, 8.208061218261719, 8.899648666381836, 9.59123706817627, 10.282825469970703, 10.97441291809082, 11.666001319885254, 12.357589721679688, 13.049177169799805, 13.740765571594238, 14.432353973388672, 15.123941421508789, 15.815529823303223, 16.507118225097656, 17.198705673217773]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 4.0, 2.0, 2.0, 5.0, 6.0, 5.0, 16.0, 11.0, 17.0, 18.0, 17.0, 17.0, 19.0, 15.0, 30.0, 31.0, 36.0, 38.0, 32.0, 33.0, 48.0, 36.0, 43.0, 42.0, 47.0, 36.0, 43.0, 39.0, 31.0, 32.0, 39.0, 17.0, 22.0, 32.0, 22.0, 21.0, 21.0, 13.0, 7.0, 14.0, 12.0, 9.0, 6.0, 6.0, 7.0, 1.0, 1.0, 0.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-12.914490699768066, -12.507570266723633, -12.100648880004883, -11.69372844696045, -11.286808013916016, -10.879887580871582, -10.472967147827148, -10.066045761108398, -9.659125328063965, -9.252204895019531, -8.845283508300781, -8.438363075256348, -8.031442642211914, -7.6245222091674805, -7.217601299285889, -6.810680389404297, -6.403759956359863, -5.99683952331543, -5.589918613433838, -5.182997703552246, -4.7760772705078125, -4.369156837463379, -3.962235927581787, -3.5553152561187744, -3.1483945846557617, -2.741473913192749, -2.3345532417297363, -1.9276325702667236, -1.520711898803711, -1.1137912273406982, -0.7068705558776855, -0.29994988441467285, 0.10697174072265625, 0.513892412185669, 0.9208130836486816, 1.3277337551116943, 1.734654426574707, 2.1415750980377197, 2.5484957695007324, 2.955416440963745, 3.362337112426758, 3.7692577838897705, 4.176178455352783, 4.583099365234375, 4.990019798278809, 5.396940231323242, 5.803861141204834, 6.210782051086426, 6.617702484130859, 7.024622917175293, 7.431543827056885, 7.838464736938477, 8.24538516998291, 8.652305603027344, 9.059226989746094, 9.466147422790527, 9.873067855834961, 10.279988288879395, 10.686908721923828, 11.093830108642578, 11.500750541687012, 11.907670974731445, 12.314592361450195, 12.721512794494629, 13.128433227539062]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 6.0, 8.0, 4.0, 16.0, 20.0, 29.0, 41.0, 74.0, 117.0, 189.0, 279.0, 419.0, 658.0, 1146.0, 1761.0, 2840.0, 4968.0, 8361.0, 14657.0, 27010.0, 51107.0, 99314.0, 180780.0, 242880.0, 187837.0, 104539.0, 53690.0, 28316.0, 15758.0, 8735.0, 4976.0, 2994.0, 1848.0, 1168.0, 745.0, 457.0, 279.0, 178.0, 130.0, 85.0, 46.0, 33.0, 19.0, 15.0, 10.0, 7.0, 9.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.7734375, -11.400146484375, -11.02685546875, -10.653564453125, -10.2802734375, -9.906982421875, -9.53369140625, -9.160400390625, -8.787109375, -8.413818359375, -8.04052734375, -7.667236328125, -7.2939453125, -6.920654296875, -6.54736328125, -6.174072265625, -5.80078125, -5.427490234375, -5.05419921875, -4.680908203125, -4.3076171875, -3.934326171875, -3.56103515625, -3.187744140625, -2.814453125, -2.441162109375, -2.06787109375, -1.694580078125, -1.3212890625, -0.947998046875, -0.57470703125, -0.201416015625, 0.171875, 0.545166015625, 0.91845703125, 1.291748046875, 1.6650390625, 2.038330078125, 2.41162109375, 2.784912109375, 3.158203125, 3.531494140625, 3.90478515625, 4.278076171875, 4.6513671875, 5.024658203125, 5.39794921875, 5.771240234375, 6.14453125, 6.517822265625, 6.89111328125, 7.264404296875, 7.6376953125, 8.010986328125, 8.38427734375, 8.757568359375, 9.130859375, 9.504150390625, 9.87744140625, 10.250732421875, 10.6240234375, 10.997314453125, 11.37060546875, 11.743896484375, 12.1171875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 2.0, 6.0, 12.0, 8.0, 6.0, 13.0, 13.0, 14.0, 17.0, 27.0, 27.0, 23.0, 33.0, 23.0, 27.0, 38.0, 31.0, 42.0, 36.0, 44.0, 41.0, 41.0, 46.0, 48.0, 39.0, 35.0, 36.0, 30.0, 32.0, 24.0, 35.0, 21.0, 19.0, 14.0, 17.0, 12.0, 10.0, 6.0, 13.0, 10.0, 7.0, 3.0, 4.0, 3.0, 5.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 4.0], "bins": [-13.3671875, -12.9522705078125, -12.537353515625, -12.1224365234375, -11.70751953125, -11.2926025390625, -10.877685546875, -10.4627685546875, -10.0478515625, -9.6329345703125, -9.218017578125, -8.8031005859375, -8.38818359375, -7.9732666015625, -7.558349609375, -7.1434326171875, -6.728515625, -6.3135986328125, -5.898681640625, -5.4837646484375, -5.06884765625, -4.6539306640625, -4.239013671875, -3.8240966796875, -3.4091796875, -2.9942626953125, -2.579345703125, -2.1644287109375, -1.74951171875, -1.3345947265625, -0.919677734375, -0.5047607421875, -0.08984375, 0.3250732421875, 0.739990234375, 1.1549072265625, 1.56982421875, 1.9847412109375, 2.399658203125, 2.8145751953125, 3.2294921875, 3.6444091796875, 4.059326171875, 4.4742431640625, 4.88916015625, 5.3040771484375, 5.718994140625, 6.1339111328125, 6.548828125, 6.9637451171875, 7.378662109375, 7.7935791015625, 8.20849609375, 8.6234130859375, 9.038330078125, 9.4532470703125, 9.8681640625, 10.2830810546875, 10.697998046875, 11.1129150390625, 11.52783203125, 11.9427490234375, 12.357666015625, 12.7725830078125, 13.1875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 9.0, 3.0, 9.0, 11.0, 15.0, 33.0, 25.0, 42.0, 62.0, 68.0, 120.0, 172.0, 242.0, 414.0, 593.0, 949.0, 1614.0, 2685.0, 4832.0, 9167.0, 19461.0, 45274.0, 117015.0, 288423.0, 320044.0, 138169.0, 52995.0, 22313.0, 10560.0, 5404.0, 3086.0, 1763.0, 1031.0, 680.0, 400.0, 269.0, 168.0, 136.0, 88.0, 60.0, 48.0, 32.0, 23.0, 20.0, 7.0, 10.0, 5.0, 4.0, 8.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-19.015625, -18.457763671875, -17.89990234375, -17.342041015625, -16.7841796875, -16.226318359375, -15.66845703125, -15.110595703125, -14.552734375, -13.994873046875, -13.43701171875, -12.879150390625, -12.3212890625, -11.763427734375, -11.20556640625, -10.647705078125, -10.08984375, -9.531982421875, -8.97412109375, -8.416259765625, -7.8583984375, -7.300537109375, -6.74267578125, -6.184814453125, -5.626953125, -5.069091796875, -4.51123046875, -3.953369140625, -3.3955078125, -2.837646484375, -2.27978515625, -1.721923828125, -1.1640625, -0.606201171875, -0.04833984375, 0.509521484375, 1.0673828125, 1.625244140625, 2.18310546875, 2.740966796875, 3.298828125, 3.856689453125, 4.41455078125, 4.972412109375, 5.5302734375, 6.088134765625, 6.64599609375, 7.203857421875, 7.76171875, 8.319580078125, 8.87744140625, 9.435302734375, 9.9931640625, 10.551025390625, 11.10888671875, 11.666748046875, 12.224609375, 12.782470703125, 13.34033203125, 13.898193359375, 14.4560546875, 15.013916015625, 15.57177734375, 16.129638671875, 16.6875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 3.0, 3.0, 6.0, 7.0, 17.0, 15.0, 18.0, 12.0, 30.0, 22.0, 28.0, 31.0, 28.0, 31.0, 40.0, 39.0, 33.0, 31.0, 49.0, 33.0, 36.0, 52.0, 42.0, 38.0, 43.0, 41.0, 33.0, 34.0, 30.0, 34.0, 23.0, 20.0, 16.0, 13.0, 15.0, 12.0, 14.0, 8.0, 6.0, 2.0, 2.0, 7.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.375, -8.12347412109375, -7.8719482421875, -7.62042236328125, -7.368896484375, -7.11737060546875, -6.8658447265625, -6.61431884765625, -6.36279296875, -6.11126708984375, -5.8597412109375, -5.60821533203125, -5.356689453125, -5.10516357421875, -4.8536376953125, -4.60211181640625, -4.3505859375, -4.09906005859375, -3.8475341796875, -3.59600830078125, -3.344482421875, -3.09295654296875, -2.8414306640625, -2.58990478515625, -2.33837890625, -2.08685302734375, -1.8353271484375, -1.58380126953125, -1.332275390625, -1.08074951171875, -0.8292236328125, -0.57769775390625, -0.326171875, -0.07464599609375, 0.1768798828125, 0.42840576171875, 0.679931640625, 0.93145751953125, 1.1829833984375, 1.43450927734375, 1.68603515625, 1.93756103515625, 2.1890869140625, 2.44061279296875, 2.692138671875, 2.94366455078125, 3.1951904296875, 3.44671630859375, 3.6982421875, 3.94976806640625, 4.2012939453125, 4.45281982421875, 4.704345703125, 4.95587158203125, 5.2073974609375, 5.45892333984375, 5.71044921875, 5.96197509765625, 6.2135009765625, 6.46502685546875, 6.716552734375, 6.96807861328125, 7.2196044921875, 7.47113037109375, 7.72265625]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 14.0, 14.0, 15.0, 25.0, 35.0, 45.0, 75.0, 106.0, 171.0, 171.0, 281.0, 419.0, 646.0, 892.0, 1468.0, 2383.0, 3917.0, 6672.0, 12352.0, 24419.0, 52547.0, 121028.0, 269068.0, 294144.0, 137742.0, 59960.0, 27469.0, 13890.0, 7412.0, 4114.0, 2524.0, 1545.0, 1002.0, 609.0, 394.0, 304.0, 202.0, 143.0, 115.0, 70.0, 52.0, 27.0, 25.0, 17.0, 12.0, 7.0, 7.0, 3.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-5.64453125, -5.473876953125, -5.30322265625, -5.132568359375, -4.9619140625, -4.791259765625, -4.62060546875, -4.449951171875, -4.279296875, -4.108642578125, -3.93798828125, -3.767333984375, -3.5966796875, -3.426025390625, -3.25537109375, -3.084716796875, -2.9140625, -2.743408203125, -2.57275390625, -2.402099609375, -2.2314453125, -2.060791015625, -1.89013671875, -1.719482421875, -1.548828125, -1.378173828125, -1.20751953125, -1.036865234375, -0.8662109375, -0.695556640625, -0.52490234375, -0.354248046875, -0.18359375, -0.012939453125, 0.15771484375, 0.328369140625, 0.4990234375, 0.669677734375, 0.84033203125, 1.010986328125, 1.181640625, 1.352294921875, 1.52294921875, 1.693603515625, 1.8642578125, 2.034912109375, 2.20556640625, 2.376220703125, 2.546875, 2.717529296875, 2.88818359375, 3.058837890625, 3.2294921875, 3.400146484375, 3.57080078125, 3.741455078125, 3.912109375, 4.082763671875, 4.25341796875, 4.424072265625, 4.5947265625, 4.765380859375, 4.93603515625, 5.106689453125, 5.27734375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 8.0, 7.0, 14.0, 27.0, 21.0, 34.0, 43.0, 69.0, 82.0, 94.0, 108.0, 91.0, 89.0, 71.0, 75.0, 38.0, 34.0, 20.0, 23.0, 11.0, 12.0, 13.0, 2.0, 5.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003936290740966797, -0.0003808923065662384, -0.0003681555390357971, -0.00035541877150535583, -0.00034268200397491455, -0.00032994523644447327, -0.000317208468914032, -0.0003044717013835907, -0.0002917349338531494, -0.00027899816632270813, -0.00026626139879226685, -0.00025352463126182556, -0.00024078786373138428, -0.000228051096200943, -0.0002153143286705017, -0.00020257756114006042, -0.00018984079360961914, -0.00017710402607917786, -0.00016436725854873657, -0.0001516304910182953, -0.000138893723487854, -0.00012615695595741272, -0.00011342018842697144, -0.00010068342089653015, -8.794665336608887e-05, -7.520988583564758e-05, -6.24731183052063e-05, -4.9736350774765015e-05, -3.699958324432373e-05, -2.4262815713882446e-05, -1.1526048183441162e-05, 1.210719347000122e-06, 1.3947486877441406e-05, 2.668425440788269e-05, 3.9421021938323975e-05, 5.215778946876526e-05, 6.489455699920654e-05, 7.763132452964783e-05, 9.036809206008911e-05, 0.0001031048595905304, 0.00011584162712097168, 0.00012857839465141296, 0.00014131516218185425, 0.00015405192971229553, 0.00016678869724273682, 0.0001795254647731781, 0.00019226223230361938, 0.00020499899983406067, 0.00021773576736450195, 0.00023047253489494324, 0.00024320930242538452, 0.0002559460699558258, 0.0002686828374862671, 0.0002814196050167084, 0.00029415637254714966, 0.00030689314007759094, 0.0003196299076080322, 0.0003323666751384735, 0.0003451034426689148, 0.0003578402101993561, 0.00037057697772979736, 0.00038331374526023865, 0.00039605051279067993, 0.0004087872803211212, 0.0004215240478515625]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 4.0, 5.0, 5.0, 11.0, 14.0, 19.0, 31.0, 45.0, 72.0, 119.0, 171.0, 260.0, 485.0, 789.0, 1373.0, 2513.0, 4865.0, 9458.0, 19912.0, 44906.0, 105377.0, 223977.0, 295773.0, 186757.0, 82907.0, 35827.0, 15989.0, 7640.0, 4002.0, 2132.0, 1265.0, 716.0, 416.0, 258.0, 157.0, 91.0, 64.0, 51.0, 34.0, 30.0, 13.0, 13.0, 9.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.76171875, -5.5780029296875, -5.394287109375, -5.2105712890625, -5.02685546875, -4.8431396484375, -4.659423828125, -4.4757080078125, -4.2919921875, -4.1082763671875, -3.924560546875, -3.7408447265625, -3.55712890625, -3.3734130859375, -3.189697265625, -3.0059814453125, -2.822265625, -2.6385498046875, -2.454833984375, -2.2711181640625, -2.08740234375, -1.9036865234375, -1.719970703125, -1.5362548828125, -1.3525390625, -1.1688232421875, -0.985107421875, -0.8013916015625, -0.61767578125, -0.4339599609375, -0.250244140625, -0.0665283203125, 0.1171875, 0.3009033203125, 0.484619140625, 0.6683349609375, 0.85205078125, 1.0357666015625, 1.219482421875, 1.4031982421875, 1.5869140625, 1.7706298828125, 1.954345703125, 2.1380615234375, 2.32177734375, 2.5054931640625, 2.689208984375, 2.8729248046875, 3.056640625, 3.2403564453125, 3.424072265625, 3.6077880859375, 3.79150390625, 3.9752197265625, 4.158935546875, 4.3426513671875, 4.5263671875, 4.7100830078125, 4.893798828125, 5.0775146484375, 5.26123046875, 5.4449462890625, 5.628662109375, 5.8123779296875, 5.99609375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 2.0, 2.0, 4.0, 9.0, 7.0, 10.0, 6.0, 12.0, 8.0, 15.0, 20.0, 22.0, 22.0, 26.0, 38.0, 51.0, 51.0, 49.0, 33.0, 52.0, 63.0, 52.0, 44.0, 45.0, 50.0, 48.0, 39.0, 31.0, 38.0, 18.0, 32.0, 21.0, 18.0, 14.0, 14.0, 10.0, 11.0, 4.0, 8.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0849609375, -1.0475006103515625, -1.010040283203125, -0.9725799560546875, -0.93511962890625, -0.8976593017578125, -0.860198974609375, -0.8227386474609375, -0.7852783203125, -0.7478179931640625, -0.710357666015625, -0.6728973388671875, -0.63543701171875, -0.5979766845703125, -0.560516357421875, -0.5230560302734375, -0.485595703125, -0.4481353759765625, -0.410675048828125, -0.3732147216796875, -0.33575439453125, -0.2982940673828125, -0.260833740234375, -0.2233734130859375, -0.1859130859375, -0.1484527587890625, -0.110992431640625, -0.0735321044921875, -0.03607177734375, 0.0013885498046875, 0.038848876953125, 0.0763092041015625, 0.11376953125, 0.1512298583984375, 0.188690185546875, 0.2261505126953125, 0.26361083984375, 0.3010711669921875, 0.338531494140625, 0.3759918212890625, 0.4134521484375, 0.4509124755859375, 0.488372802734375, 0.5258331298828125, 0.56329345703125, 0.6007537841796875, 0.638214111328125, 0.6756744384765625, 0.713134765625, 0.7505950927734375, 0.788055419921875, 0.8255157470703125, 0.86297607421875, 0.9004364013671875, 0.937896728515625, 0.9753570556640625, 1.0128173828125, 1.0502777099609375, 1.087738037109375, 1.1251983642578125, 1.16265869140625, 1.2001190185546875, 1.237579345703125, 1.2750396728515625, 1.3125]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 4.0, 2.0, 7.0, 9.0, 12.0, 5.0, 20.0, 21.0, 25.0, 31.0, 35.0, 45.0, 51.0, 62.0, 81.0, 79.0, 90.0, 76.0, 67.0, 52.0, 47.0, 44.0, 21.0, 25.0, 18.0, 22.0, 11.0, 15.0, 9.0, 10.0, 1.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-26.460037231445312, -25.76615333557129, -25.072269439697266, -24.37838363647461, -23.684499740600586, -22.990615844726562, -22.296730041503906, -21.602846145629883, -20.90896224975586, -20.215078353881836, -19.521194458007812, -18.827308654785156, -18.133424758911133, -17.43954086303711, -16.745655059814453, -16.05177116394043, -15.357887268066406, -14.664003372192383, -13.970118522644043, -13.276233673095703, -12.58234977722168, -11.888465881347656, -11.194581031799316, -10.500696182250977, -9.806812286376953, -9.11292839050293, -8.41904354095459, -7.725159168243408, -7.031274795532227, -6.337390422821045, -5.643506050109863, -4.949621677398682, -4.2557373046875, -3.5618529319763184, -2.8679685592651367, -2.174084186553955, -1.4801998138427734, -0.7863154411315918, -0.09243106842041016, 0.6014533042907715, 1.2953376770019531, 1.9892220497131348, 2.6831064224243164, 3.376990795135498, 4.07087516784668, 4.764759540557861, 5.458643913269043, 6.152528285980225, 6.846412658691406, 7.540297031402588, 8.23418140411377, 8.92806625366211, 9.621950149536133, 10.315834045410156, 11.009718894958496, 11.703603744506836, 12.39748764038086, 13.091371536254883, 13.785256385803223, 14.479141235351562, 15.173025131225586, 15.86690902709961, 16.560794830322266, 17.25467872619629, 17.948562622070312]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 4.0, 2.0, 1.0, 4.0, 5.0, 6.0, 10.0, 16.0, 9.0, 20.0, 20.0, 11.0, 23.0, 16.0, 24.0, 29.0, 33.0, 38.0, 39.0, 29.0, 40.0, 41.0, 51.0, 40.0, 40.0, 43.0, 35.0, 32.0, 41.0, 39.0, 32.0, 27.0, 19.0, 21.0, 29.0, 26.0, 16.0, 17.0, 14.0, 13.0, 11.0, 12.0, 6.0, 3.0, 7.0, 5.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-12.408023834228516, -12.008654594421387, -11.609285354614258, -11.209916114807129, -10.810546875, -10.411177635192871, -10.011808395385742, -9.612439155578613, -9.213069915771484, -8.813700675964355, -8.414331436157227, -8.014962196350098, -7.615592956542969, -7.21622371673584, -6.816854476928711, -6.417485237121582, -6.018115997314453, -5.618746757507324, -5.219377517700195, -4.820008277893066, -4.4206390380859375, -4.021269798278809, -3.6219005584716797, -3.222531318664551, -2.823162078857422, -2.423792839050293, -2.024423599243164, -1.6250543594360352, -1.2256851196289062, -0.8263158798217773, -0.42694664001464844, -0.02757740020751953, 0.3717927932739258, 0.7711620330810547, 1.1705312728881836, 1.5699005126953125, 1.9692697525024414, 2.3686389923095703, 2.768008232116699, 3.167377471923828, 3.566746711730957, 3.966115951538086, 4.365485191345215, 4.764854431152344, 5.164223670959473, 5.563592910766602, 5.9629621505737305, 6.362331390380859, 6.761700630187988, 7.161069869995117, 7.560439109802246, 7.959808349609375, 8.359177589416504, 8.758546829223633, 9.157916069030762, 9.55728530883789, 9.95665454864502, 10.356023788452148, 10.755393028259277, 11.154762268066406, 11.554131507873535, 11.953500747680664, 12.352869987487793, 12.752239227294922, 13.15160846710205]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 10.0, 11.0, 18.0, 23.0, 41.0, 52.0, 67.0, 124.0, 190.0, 269.0, 455.0, 689.0, 1051.0, 1638.0, 2480.0, 3908.0, 6227.0, 9860.0, 15924.0, 25303.0, 40843.0, 64446.0, 98445.0, 137632.0, 162482.0, 151210.0, 115400.0, 77591.0, 49462.0, 30747.0, 18970.0, 12093.0, 7626.0, 4660.0, 3075.0, 1977.0, 1221.0, 784.0, 574.0, 353.0, 215.0, 140.0, 102.0, 51.0, 39.0, 33.0, 17.0, 9.0, 8.0, 7.0, 5.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.7578125, -14.2772216796875, -13.796630859375, -13.3160400390625, -12.83544921875, -12.3548583984375, -11.874267578125, -11.3936767578125, -10.9130859375, -10.4324951171875, -9.951904296875, -9.4713134765625, -8.99072265625, -8.5101318359375, -8.029541015625, -7.5489501953125, -7.068359375, -6.5877685546875, -6.107177734375, -5.6265869140625, -5.14599609375, -4.6654052734375, -4.184814453125, -3.7042236328125, -3.2236328125, -2.7430419921875, -2.262451171875, -1.7818603515625, -1.30126953125, -0.8206787109375, -0.340087890625, 0.1405029296875, 0.62109375, 1.1016845703125, 1.582275390625, 2.0628662109375, 2.54345703125, 3.0240478515625, 3.504638671875, 3.9852294921875, 4.4658203125, 4.9464111328125, 5.427001953125, 5.9075927734375, 6.38818359375, 6.8687744140625, 7.349365234375, 7.8299560546875, 8.310546875, 8.7911376953125, 9.271728515625, 9.7523193359375, 10.23291015625, 10.7135009765625, 11.194091796875, 11.6746826171875, 12.1552734375, 12.6358642578125, 13.116455078125, 13.5970458984375, 14.07763671875, 14.5582275390625, 15.038818359375, 15.5194091796875, 16.0]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 7.0, 6.0, 8.0, 16.0, 12.0, 9.0, 18.0, 19.0, 15.0, 25.0, 23.0, 27.0, 36.0, 36.0, 42.0, 33.0, 43.0, 38.0, 47.0, 50.0, 49.0, 37.0, 47.0, 49.0, 38.0, 32.0, 32.0, 24.0, 29.0, 22.0, 15.0, 23.0, 17.0, 20.0, 13.0, 8.0, 5.0, 6.0, 6.0, 4.0, 4.0, 0.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.796875, -12.3651123046875, -11.933349609375, -11.5015869140625, -11.06982421875, -10.6380615234375, -10.206298828125, -9.7745361328125, -9.3427734375, -8.9110107421875, -8.479248046875, -8.0474853515625, -7.61572265625, -7.1839599609375, -6.752197265625, -6.3204345703125, -5.888671875, -5.4569091796875, -5.025146484375, -4.5933837890625, -4.16162109375, -3.7298583984375, -3.298095703125, -2.8663330078125, -2.4345703125, -2.0028076171875, -1.571044921875, -1.1392822265625, -0.70751953125, -0.2757568359375, 0.156005859375, 0.5877685546875, 1.01953125, 1.4512939453125, 1.883056640625, 2.3148193359375, 2.74658203125, 3.1783447265625, 3.610107421875, 4.0418701171875, 4.4736328125, 4.9053955078125, 5.337158203125, 5.7689208984375, 6.20068359375, 6.6324462890625, 7.064208984375, 7.4959716796875, 7.927734375, 8.3594970703125, 8.791259765625, 9.2230224609375, 9.65478515625, 10.0865478515625, 10.518310546875, 10.9500732421875, 11.3818359375, 11.8135986328125, 12.245361328125, 12.6771240234375, 13.10888671875, 13.5406494140625, 13.972412109375, 14.4041748046875, 14.8359375]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 3.0, 4.0, 6.0, 8.0, 10.0, 30.0, 20.0, 35.0, 70.0, 117.0, 173.0, 237.0, 419.0, 674.0, 1095.0, 1861.0, 2930.0, 4911.0, 8127.0, 14233.0, 23805.0, 40531.0, 67755.0, 106475.0, 151632.0, 175907.0, 156613.0, 112700.0, 71548.0, 43756.0, 25606.0, 14986.0, 8875.0, 5266.0, 3215.0, 1925.0, 1112.0, 694.0, 430.0, 265.0, 177.0, 127.0, 64.0, 48.0, 25.0, 22.0, 13.0, 13.0, 8.0, 1.0, 2.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.8046875, -13.3214111328125, -12.838134765625, -12.3548583984375, -11.87158203125, -11.3883056640625, -10.905029296875, -10.4217529296875, -9.9384765625, -9.4552001953125, -8.971923828125, -8.4886474609375, -8.00537109375, -7.5220947265625, -7.038818359375, -6.5555419921875, -6.072265625, -5.5889892578125, -5.105712890625, -4.6224365234375, -4.13916015625, -3.6558837890625, -3.172607421875, -2.6893310546875, -2.2060546875, -1.7227783203125, -1.239501953125, -0.7562255859375, -0.27294921875, 0.2103271484375, 0.693603515625, 1.1768798828125, 1.66015625, 2.1434326171875, 2.626708984375, 3.1099853515625, 3.59326171875, 4.0765380859375, 4.559814453125, 5.0430908203125, 5.5263671875, 6.0096435546875, 6.492919921875, 6.9761962890625, 7.45947265625, 7.9427490234375, 8.426025390625, 8.9093017578125, 9.392578125, 9.8758544921875, 10.359130859375, 10.8424072265625, 11.32568359375, 11.8089599609375, 12.292236328125, 12.7755126953125, 13.2587890625, 13.7420654296875, 14.225341796875, 14.7086181640625, 15.19189453125, 15.6751708984375, 16.158447265625, 16.6417236328125, 17.125]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 6.0, 10.0, 5.0, 6.0, 4.0, 9.0, 7.0, 15.0, 11.0, 17.0, 23.0, 13.0, 23.0, 26.0, 19.0, 38.0, 42.0, 37.0, 30.0, 42.0, 38.0, 52.0, 58.0, 47.0, 29.0, 41.0, 42.0, 31.0, 36.0, 35.0, 31.0, 31.0, 23.0, 14.0, 13.0, 13.0, 20.0, 13.0, 14.0, 9.0, 14.0, 4.0, 8.0, 3.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.4609375, -8.19677734375, -7.9326171875, -7.66845703125, -7.404296875, -7.14013671875, -6.8759765625, -6.61181640625, -6.34765625, -6.08349609375, -5.8193359375, -5.55517578125, -5.291015625, -5.02685546875, -4.7626953125, -4.49853515625, -4.234375, -3.97021484375, -3.7060546875, -3.44189453125, -3.177734375, -2.91357421875, -2.6494140625, -2.38525390625, -2.12109375, -1.85693359375, -1.5927734375, -1.32861328125, -1.064453125, -0.80029296875, -0.5361328125, -0.27197265625, -0.0078125, 0.25634765625, 0.5205078125, 0.78466796875, 1.048828125, 1.31298828125, 1.5771484375, 1.84130859375, 2.10546875, 2.36962890625, 2.6337890625, 2.89794921875, 3.162109375, 3.42626953125, 3.6904296875, 3.95458984375, 4.21875, 4.48291015625, 4.7470703125, 5.01123046875, 5.275390625, 5.53955078125, 5.8037109375, 6.06787109375, 6.33203125, 6.59619140625, 6.8603515625, 7.12451171875, 7.388671875, 7.65283203125, 7.9169921875, 8.18115234375, 8.4453125]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 7.0, 5.0, 10.0, 6.0, 16.0, 23.0, 33.0, 43.0, 57.0, 76.0, 160.0, 200.0, 294.0, 521.0, 725.0, 1205.0, 1775.0, 2723.0, 4381.0, 7053.0, 11272.0, 18948.0, 31850.0, 53823.0, 91066.0, 143956.0, 189116.0, 177215.0, 123474.0, 75784.0, 44759.0, 26392.0, 15725.0, 9532.0, 5851.0, 3655.0, 2405.0, 1468.0, 1010.0, 655.0, 411.0, 280.0, 187.0, 129.0, 87.0, 66.0, 37.0, 32.0, 23.0, 11.0, 14.0, 6.0, 4.0, 3.0, 4.0, 2.0, 2.0], "bins": [-9.140625, -8.870361328125, -8.60009765625, -8.329833984375, -8.0595703125, -7.789306640625, -7.51904296875, -7.248779296875, -6.978515625, -6.708251953125, -6.43798828125, -6.167724609375, -5.8974609375, -5.627197265625, -5.35693359375, -5.086669921875, -4.81640625, -4.546142578125, -4.27587890625, -4.005615234375, -3.7353515625, -3.465087890625, -3.19482421875, -2.924560546875, -2.654296875, -2.384033203125, -2.11376953125, -1.843505859375, -1.5732421875, -1.302978515625, -1.03271484375, -0.762451171875, -0.4921875, -0.221923828125, 0.04833984375, 0.318603515625, 0.5888671875, 0.859130859375, 1.12939453125, 1.399658203125, 1.669921875, 1.940185546875, 2.21044921875, 2.480712890625, 2.7509765625, 3.021240234375, 3.29150390625, 3.561767578125, 3.83203125, 4.102294921875, 4.37255859375, 4.642822265625, 4.9130859375, 5.183349609375, 5.45361328125, 5.723876953125, 5.994140625, 6.264404296875, 6.53466796875, 6.804931640625, 7.0751953125, 7.345458984375, 7.61572265625, 7.885986328125, 8.15625]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 8.0, 4.0, 7.0, 15.0, 18.0, 18.0, 16.0, 28.0, 33.0, 43.0, 56.0, 76.0, 78.0, 88.0, 85.0, 84.0, 72.0, 60.0, 51.0, 51.0, 27.0, 23.0, 23.0, 12.0, 10.0, 4.0, 2.0, 4.0, 2.0, 7.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010280609130859375, -0.000990539789199829, -0.0009530186653137207, -0.0009154975414276123, -0.0008779764175415039, -0.0008404552936553955, -0.0008029341697692871, -0.0007654130458831787, -0.0007278919219970703, -0.0006903707981109619, -0.0006528496742248535, -0.0006153285503387451, -0.0005778074264526367, -0.0005402863025665283, -0.0005027651786804199, -0.0004652440547943115, -0.0004277229309082031, -0.0003902018070220947, -0.00035268068313598633, -0.00031515955924987793, -0.00027763843536376953, -0.00024011731147766113, -0.00020259618759155273, -0.00016507506370544434, -0.00012755393981933594, -9.003281593322754e-05, -5.251169204711914e-05, -1.4990568161010742e-05, 2.2530555725097656e-05, 6.0051679611206055e-05, 9.757280349731445e-05, 0.00013509392738342285, 0.00017261505126953125, 0.00021013617515563965, 0.00024765729904174805, 0.00028517842292785645, 0.00032269954681396484, 0.00036022067070007324, 0.00039774179458618164, 0.00043526291847229004, 0.00047278404235839844, 0.0005103051662445068, 0.0005478262901306152, 0.0005853474140167236, 0.000622868537902832, 0.0006603896617889404, 0.0006979107856750488, 0.0007354319095611572, 0.0007729530334472656, 0.000810474157333374, 0.0008479952812194824, 0.0008855164051055908, 0.0009230375289916992, 0.0009605586528778076, 0.000998079776763916, 0.0010356009006500244, 0.0010731220245361328, 0.0011106431484222412, 0.0011481642723083496, 0.001185685396194458, 0.0012232065200805664, 0.0012607276439666748, 0.0012982487678527832, 0.0013357698917388916, 0.001373291015625]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 8.0, 8.0, 15.0, 21.0, 32.0, 39.0, 74.0, 89.0, 135.0, 221.0, 336.0, 437.0, 807.0, 1118.0, 1807.0, 2908.0, 4482.0, 7443.0, 12463.0, 21323.0, 36632.0, 62582.0, 104572.0, 158518.0, 190212.0, 165288.0, 112148.0, 67472.0, 39713.0, 22809.0, 13501.0, 8026.0, 4842.0, 2995.0, 1927.0, 1268.0, 736.0, 485.0, 362.0, 236.0, 160.0, 97.0, 78.0, 37.0, 34.0, 19.0, 19.0, 11.0, 4.0, 9.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.3671875, -9.07958984375, -8.7919921875, -8.50439453125, -8.216796875, -7.92919921875, -7.6416015625, -7.35400390625, -7.06640625, -6.77880859375, -6.4912109375, -6.20361328125, -5.916015625, -5.62841796875, -5.3408203125, -5.05322265625, -4.765625, -4.47802734375, -4.1904296875, -3.90283203125, -3.615234375, -3.32763671875, -3.0400390625, -2.75244140625, -2.46484375, -2.17724609375, -1.8896484375, -1.60205078125, -1.314453125, -1.02685546875, -0.7392578125, -0.45166015625, -0.1640625, 0.12353515625, 0.4111328125, 0.69873046875, 0.986328125, 1.27392578125, 1.5615234375, 1.84912109375, 2.13671875, 2.42431640625, 2.7119140625, 2.99951171875, 3.287109375, 3.57470703125, 3.8623046875, 4.14990234375, 4.4375, 4.72509765625, 5.0126953125, 5.30029296875, 5.587890625, 5.87548828125, 6.1630859375, 6.45068359375, 6.73828125, 7.02587890625, 7.3134765625, 7.60107421875, 7.888671875, 8.17626953125, 8.4638671875, 8.75146484375, 9.0390625]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 6.0, 4.0, 4.0, 4.0, 12.0, 7.0, 9.0, 14.0, 15.0, 20.0, 36.0, 36.0, 27.0, 40.0, 39.0, 53.0, 45.0, 61.0, 63.0, 69.0, 54.0, 49.0, 68.0, 47.0, 51.0, 41.0, 25.0, 26.0, 15.0, 11.0, 18.0, 17.0, 8.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0], "bins": [-4.01953125, -3.89483642578125, -3.7701416015625, -3.64544677734375, -3.520751953125, -3.39605712890625, -3.2713623046875, -3.14666748046875, -3.02197265625, -2.89727783203125, -2.7725830078125, -2.64788818359375, -2.523193359375, -2.39849853515625, -2.2738037109375, -2.14910888671875, -2.0244140625, -1.89971923828125, -1.7750244140625, -1.65032958984375, -1.525634765625, -1.40093994140625, -1.2762451171875, -1.15155029296875, -1.02685546875, -0.90216064453125, -0.7774658203125, -0.65277099609375, -0.528076171875, -0.40338134765625, -0.2786865234375, -0.15399169921875, -0.029296875, 0.09539794921875, 0.2200927734375, 0.34478759765625, 0.469482421875, 0.59417724609375, 0.7188720703125, 0.84356689453125, 0.96826171875, 1.09295654296875, 1.2176513671875, 1.34234619140625, 1.467041015625, 1.59173583984375, 1.7164306640625, 1.84112548828125, 1.9658203125, 2.09051513671875, 2.2152099609375, 2.33990478515625, 2.464599609375, 2.58929443359375, 2.7139892578125, 2.83868408203125, 2.96337890625, 3.08807373046875, 3.2127685546875, 3.33746337890625, 3.462158203125, 3.58685302734375, 3.7115478515625, 3.83624267578125, 3.9609375]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 8.0, 4.0, 8.0, 11.0, 13.0, 12.0, 25.0, 23.0, 28.0, 28.0, 45.0, 60.0, 66.0, 65.0, 74.0, 76.0, 85.0, 59.0, 65.0, 39.0, 51.0, 32.0, 22.0, 17.0, 18.0, 15.0, 8.0, 14.0, 11.0, 8.0, 0.0, 5.0, 3.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.177438735961914, -22.52055549621582, -21.863672256469727, -21.206790924072266, -20.549907684326172, -19.893024444580078, -19.236141204833984, -18.57925796508789, -17.922374725341797, -17.265491485595703, -16.60860824584961, -15.951725959777832, -15.294842720031738, -14.637960433959961, -13.981077194213867, -13.324193954467773, -12.667311668395996, -12.010428428649902, -11.353546142578125, -10.696662902832031, -10.039779663085938, -9.382896423339844, -8.726014137268066, -8.069130897521973, -7.412248134613037, -6.755365371704102, -6.098482131958008, -5.441599369049072, -4.784716606140137, -4.127833366394043, -3.4709506034851074, -2.8140673637390137, -2.157184600830078, -1.5003015995025635, -0.8434187173843384, -0.18653583526611328, 0.47034716606140137, 1.127230167388916, 1.7841129302978516, 2.4409961700439453, 3.097878932952881, 3.7547619342803955, 4.41164493560791, 5.068527698516846, 5.725410461425781, 6.382293701171875, 7.0391764640808105, 7.696059703826904, 8.35294246673584, 9.009825706481934, 9.666707992553711, 10.323591232299805, 10.980474472045898, 11.637357711791992, 12.29423999786377, 12.951123237609863, 13.60800552368164, 14.264888763427734, 14.921771049499512, 15.578654289245605, 16.235536575317383, 16.892419815063477, 17.54930305480957, 18.206186294555664, 18.863069534301758]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 2.0, 5.0, 7.0, 14.0, 11.0, 11.0, 15.0, 14.0, 14.0, 11.0, 19.0, 23.0, 22.0, 43.0, 33.0, 41.0, 38.0, 38.0, 37.0, 41.0, 40.0, 42.0, 39.0, 35.0, 33.0, 38.0, 44.0, 29.0, 37.0, 39.0, 25.0, 18.0, 26.0, 19.0, 17.0, 11.0, 10.0, 12.0, 8.0, 12.0, 5.0, 4.0, 9.0, 6.0, 1.0, 4.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-11.626763343811035, -11.233745574951172, -10.840727806091309, -10.447710037231445, -10.054691314697266, -9.661673545837402, -9.268655776977539, -8.875638008117676, -8.482620239257812, -8.08960247039795, -7.696584701538086, -7.3035664558410645, -6.910548686981201, -6.517530918121338, -6.124512672424316, -5.731494903564453, -5.33847713470459, -4.945459365844727, -4.552441596984863, -4.159423351287842, -3.7664055824279785, -3.3733878135681152, -2.980369806289673, -2.5873517990112305, -2.194334030151367, -1.8013161420822144, -1.4082982540130615, -1.0152803659439087, -0.6222624778747559, -0.22924458980560303, 0.1637732982635498, 0.5567913055419922, 0.9498081207275391, 1.342826008796692, 1.7358438968658447, 2.128861904144287, 2.5218796730041504, 2.9148974418640137, 3.307915449142456, 3.7009334564208984, 4.093951225280762, 4.486968994140625, 4.879986763000488, 5.27300500869751, 5.666022777557373, 6.059040546417236, 6.452058792114258, 6.845076560974121, 7.238094329833984, 7.631112098693848, 8.024129867553711, 8.417147636413574, 8.810165405273438, 9.203184127807617, 9.59620189666748, 9.989219665527344, 10.382237434387207, 10.77525520324707, 11.168272972106934, 11.561290740966797, 11.954309463500977, 12.34732723236084, 12.740345001220703, 13.133362770080566, 13.52638053894043]}, "gradients/decoder.bert.encoder.layer.14.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 5.0, 10.0, 13.0, 15.0, 32.0, 38.0, 67.0, 78.0, 104.0, 159.0, 236.0, 344.0, 477.0, 718.0, 1095.0, 1613.0, 2428.0, 3619.0, 6020.0, 9777.0, 15722.0, 27352.0, 48729.0, 94502.0, 203960.0, 484002.0, 1011179.0, 1145831.0, 620035.0, 260060.0, 116265.0, 58559.0, 31850.0, 18314.0, 10887.0, 7082.0, 4294.0, 2892.0, 1833.0, 1235.0, 799.0, 594.0, 410.0, 299.0, 231.0, 139.0, 105.0, 75.0, 52.0, 36.0, 28.0, 27.0, 23.0, 11.0, 11.0, 9.0, 6.0, 6.0, 0.0, 4.0], "bins": [-16.296875, -15.773681640625, -15.25048828125, -14.727294921875, -14.2041015625, -13.680908203125, -13.15771484375, -12.634521484375, -12.111328125, -11.588134765625, -11.06494140625, -10.541748046875, -10.0185546875, -9.495361328125, -8.97216796875, -8.448974609375, -7.92578125, -7.402587890625, -6.87939453125, -6.356201171875, -5.8330078125, -5.309814453125, -4.78662109375, -4.263427734375, -3.740234375, -3.217041015625, -2.69384765625, -2.170654296875, -1.6474609375, -1.124267578125, -0.60107421875, -0.077880859375, 0.4453125, 0.968505859375, 1.49169921875, 2.014892578125, 2.5380859375, 3.061279296875, 3.58447265625, 4.107666015625, 4.630859375, 5.154052734375, 5.67724609375, 6.200439453125, 6.7236328125, 7.246826171875, 7.77001953125, 8.293212890625, 8.81640625, 9.339599609375, 9.86279296875, 10.385986328125, 10.9091796875, 11.432373046875, 11.95556640625, 12.478759765625, 13.001953125, 13.525146484375, 14.04833984375, 14.571533203125, 15.0947265625, 15.617919921875, 16.14111328125, 16.664306640625, 17.1875]}, "gradients/decoder.bert.encoder.layer.14.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 2.0, 4.0, 1.0, 11.0, 8.0, 11.0, 10.0, 19.0, 10.0, 15.0, 16.0, 20.0, 32.0, 30.0, 38.0, 45.0, 33.0, 45.0, 31.0, 46.0, 48.0, 40.0, 44.0, 36.0, 36.0, 38.0, 42.0, 35.0, 40.0, 29.0, 22.0, 23.0, 13.0, 27.0, 20.0, 14.0, 9.0, 12.0, 12.0, 8.0, 5.0, 8.0, 4.0, 2.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-8.265625, -7.9888916015625, -7.712158203125, -7.4354248046875, -7.15869140625, -6.8819580078125, -6.605224609375, -6.3284912109375, -6.0517578125, -5.7750244140625, -5.498291015625, -5.2215576171875, -4.94482421875, -4.6680908203125, -4.391357421875, -4.1146240234375, -3.837890625, -3.5611572265625, -3.284423828125, -3.0076904296875, -2.73095703125, -2.4542236328125, -2.177490234375, -1.9007568359375, -1.6240234375, -1.3472900390625, -1.070556640625, -0.7938232421875, -0.51708984375, -0.2403564453125, 0.036376953125, 0.3131103515625, 0.58984375, 0.8665771484375, 1.143310546875, 1.4200439453125, 1.69677734375, 1.9735107421875, 2.250244140625, 2.5269775390625, 2.8037109375, 3.0804443359375, 3.357177734375, 3.6339111328125, 3.91064453125, 4.1873779296875, 4.464111328125, 4.7408447265625, 5.017578125, 5.2943115234375, 5.571044921875, 5.8477783203125, 6.12451171875, 6.4012451171875, 6.677978515625, 6.9547119140625, 7.2314453125, 7.5081787109375, 7.784912109375, 8.0616455078125, 8.33837890625, 8.6151123046875, 8.891845703125, 9.1685791015625, 9.4453125]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 7.0, 6.0, 8.0, 12.0, 18.0, 36.0, 46.0, 66.0, 103.0, 168.0, 227.0, 384.0, 600.0, 980.0, 1558.0, 2540.0, 4250.0, 7326.0, 12946.0, 24027.0, 46681.0, 97005.0, 213969.0, 506140.0, 1087981.0, 1161542.0, 568179.0, 240219.0, 106023.0, 51121.0, 26216.0, 14023.0, 7990.0, 4672.0, 2757.0, 1730.0, 1052.0, 639.0, 376.0, 225.0, 141.0, 115.0, 64.0, 37.0, 25.0, 16.0, 14.0, 12.0, 8.0, 2.0, 7.0, 3.0, 1.0, 0.0, 1.0], "bins": [-20.734375, -20.125732421875, -19.51708984375, -18.908447265625, -18.2998046875, -17.691162109375, -17.08251953125, -16.473876953125, -15.865234375, -15.256591796875, -14.64794921875, -14.039306640625, -13.4306640625, -12.822021484375, -12.21337890625, -11.604736328125, -10.99609375, -10.387451171875, -9.77880859375, -9.170166015625, -8.5615234375, -7.952880859375, -7.34423828125, -6.735595703125, -6.126953125, -5.518310546875, -4.90966796875, -4.301025390625, -3.6923828125, -3.083740234375, -2.47509765625, -1.866455078125, -1.2578125, -0.649169921875, -0.04052734375, 0.568115234375, 1.1767578125, 1.785400390625, 2.39404296875, 3.002685546875, 3.611328125, 4.219970703125, 4.82861328125, 5.437255859375, 6.0458984375, 6.654541015625, 7.26318359375, 7.871826171875, 8.48046875, 9.089111328125, 9.69775390625, 10.306396484375, 10.9150390625, 11.523681640625, 12.13232421875, 12.740966796875, 13.349609375, 13.958251953125, 14.56689453125, 15.175537109375, 15.7841796875, 16.392822265625, 17.00146484375, 17.610107421875, 18.21875]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 5.0, 4.0, 8.0, 7.0, 13.0, 9.0, 23.0, 19.0, 29.0, 50.0, 57.0, 69.0, 112.0, 135.0, 168.0, 192.0, 265.0, 285.0, 391.0, 385.0, 375.0, 304.0, 256.0, 206.0, 168.0, 163.0, 97.0, 70.0, 54.0, 40.0, 17.0, 38.0, 16.0, 10.0, 16.0, 8.0, 2.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.57421875, -5.37139892578125, -5.1685791015625, -4.96575927734375, -4.762939453125, -4.56011962890625, -4.3572998046875, -4.15447998046875, -3.95166015625, -3.74884033203125, -3.5460205078125, -3.34320068359375, -3.140380859375, -2.93756103515625, -2.7347412109375, -2.53192138671875, -2.3291015625, -2.12628173828125, -1.9234619140625, -1.72064208984375, -1.517822265625, -1.31500244140625, -1.1121826171875, -0.90936279296875, -0.70654296875, -0.50372314453125, -0.3009033203125, -0.09808349609375, 0.104736328125, 0.30755615234375, 0.5103759765625, 0.71319580078125, 0.916015625, 1.11883544921875, 1.3216552734375, 1.52447509765625, 1.727294921875, 1.93011474609375, 2.1329345703125, 2.33575439453125, 2.53857421875, 2.74139404296875, 2.9442138671875, 3.14703369140625, 3.349853515625, 3.55267333984375, 3.7554931640625, 3.95831298828125, 4.1611328125, 4.36395263671875, 4.5667724609375, 4.76959228515625, 4.972412109375, 5.17523193359375, 5.3780517578125, 5.58087158203125, 5.78369140625, 5.98651123046875, 6.1893310546875, 6.39215087890625, 6.594970703125, 6.79779052734375, 7.0006103515625, 7.20343017578125, 7.40625]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 8.0, 7.0, 8.0, 11.0, 13.0, 22.0, 30.0, 23.0, 37.0, 40.0, 48.0, 73.0, 91.0, 89.0, 89.0, 89.0, 59.0, 61.0, 47.0, 42.0, 27.0, 15.0, 15.0, 14.0, 12.0, 9.0, 7.0, 7.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 0.0, 0.0, 0.0, 2.0], "bins": [-27.39463233947754, -26.70754051208496, -26.020448684692383, -25.333356857299805, -24.646265029907227, -23.95917320251465, -23.27208137512207, -22.584989547729492, -21.897897720336914, -21.210805892944336, -20.523714065551758, -19.83662223815918, -19.1495304107666, -18.462438583374023, -17.775346755981445, -17.088254928588867, -16.401165008544922, -15.714073181152344, -15.026981353759766, -14.339889526367188, -13.65279769897461, -12.965705871582031, -12.278614044189453, -11.591522216796875, -10.904430389404297, -10.217338562011719, -9.53024673461914, -8.843154907226562, -8.156063079833984, -7.468971252441406, -6.781879901885986, -6.094788074493408, -5.407695770263672, -4.720603942871094, -4.033512115478516, -3.3464205265045166, -2.6593286991119385, -1.9722368717193604, -1.2851452827453613, -0.5980534553527832, 0.08903837203979492, 0.7761301398277283, 1.4632219076156616, 2.15031361579895, 2.8374054431915283, 3.5244972705841064, 4.2115888595581055, 4.898680686950684, 5.585772514343262, 6.27286434173584, 6.959956169128418, 7.647047996520996, 8.334139823913574, 9.021231651306152, 9.708322525024414, 10.395414352416992, 11.08250617980957, 11.769598007202148, 12.456689834594727, 13.143781661987305, 13.830873489379883, 14.517965316772461, 15.205057144165039, 15.892148971557617, 16.579240798950195]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 4.0, 9.0, 8.0, 12.0, 14.0, 8.0, 13.0, 12.0, 18.0, 21.0, 24.0, 33.0, 52.0, 44.0, 36.0, 44.0, 34.0, 41.0, 68.0, 48.0, 51.0, 41.0, 54.0, 55.0, 33.0, 36.0, 39.0, 21.0, 14.0, 26.0, 23.0, 8.0, 17.0, 13.0, 9.0, 7.0, 4.0, 5.0, 3.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-15.019588470458984, -14.589088439941406, -14.158588409423828, -13.72808837890625, -13.297589302062988, -12.86708927154541, -12.436589241027832, -12.006089210510254, -11.575590133666992, -11.145090103149414, -10.714590072631836, -10.284090042114258, -9.853590965270996, -9.423090934753418, -8.99259090423584, -8.562090873718262, -8.131590843200684, -7.7010908126831055, -7.2705912590026855, -6.840091228485107, -6.4095916748046875, -5.979091644287109, -5.548591613769531, -5.118091583251953, -4.687592029571533, -4.257091999053955, -3.826592445373535, -3.396092414855957, -2.965592622756958, -2.535092830657959, -2.104592800140381, -1.6740930080413818, -1.2435941696166992, -0.8130943179130554, -0.3825944662094116, 0.04790544509887695, 0.478405237197876, 0.908905029296875, 1.3394050598144531, 1.7699048519134521, 2.200404644012451, 2.63090443611145, 3.061404228210449, 3.4919042587280273, 3.9224040508270264, 4.352903842926025, 4.7834038734436035, 5.213903427124023, 5.644403457641602, 6.07490348815918, 6.5054030418396, 6.935903072357178, 7.366402626037598, 7.796902656555176, 8.227402687072754, 8.657902717590332, 9.088401794433594, 9.518901824951172, 9.94940185546875, 10.379901885986328, 10.81040096282959, 11.240900993347168, 11.671401023864746, 12.101901054382324, 12.532401084899902]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 7.0, 9.0, 11.0, 18.0, 24.0, 33.0, 46.0, 91.0, 112.0, 184.0, 279.0, 520.0, 833.0, 1400.0, 2313.0, 3849.0, 6718.0, 11599.0, 20910.0, 38046.0, 69745.0, 125040.0, 199411.0, 218239.0, 153313.0, 87348.0, 47860.0, 26132.0, 14446.0, 8212.0, 4768.0, 2803.0, 1660.0, 959.0, 604.0, 392.0, 224.0, 158.0, 95.0, 57.0, 33.0, 22.0, 10.0, 13.0, 7.0, 6.0, 5.0, 2.0, 1.0, 0.0, 1.0], "bins": [-9.90625, -9.63250732421875, -9.3587646484375, -9.08502197265625, -8.811279296875, -8.53753662109375, -8.2637939453125, -7.99005126953125, -7.71630859375, -7.44256591796875, -7.1688232421875, -6.89508056640625, -6.621337890625, -6.34759521484375, -6.0738525390625, -5.80010986328125, -5.5263671875, -5.25262451171875, -4.9788818359375, -4.70513916015625, -4.431396484375, -4.15765380859375, -3.8839111328125, -3.61016845703125, -3.33642578125, -3.06268310546875, -2.7889404296875, -2.51519775390625, -2.241455078125, -1.96771240234375, -1.6939697265625, -1.42022705078125, -1.146484375, -0.87274169921875, -0.5989990234375, -0.32525634765625, -0.051513671875, 0.22222900390625, 0.4959716796875, 0.76971435546875, 1.04345703125, 1.31719970703125, 1.5909423828125, 1.86468505859375, 2.138427734375, 2.41217041015625, 2.6859130859375, 2.95965576171875, 3.2333984375, 3.50714111328125, 3.7808837890625, 4.05462646484375, 4.328369140625, 4.60211181640625, 4.8758544921875, 5.14959716796875, 5.42333984375, 5.69708251953125, 5.9708251953125, 6.24456787109375, 6.518310546875, 6.79205322265625, 7.0657958984375, 7.33953857421875, 7.61328125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 1.0, 5.0, 1.0, 9.0, 8.0, 13.0, 10.0, 12.0, 12.0, 17.0, 22.0, 17.0, 24.0, 27.0, 35.0, 40.0, 37.0, 36.0, 42.0, 46.0, 47.0, 43.0, 52.0, 57.0, 36.0, 44.0, 38.0, 37.0, 40.0, 35.0, 22.0, 25.0, 25.0, 18.0, 10.0, 17.0, 7.0, 11.0, 7.0, 5.0, 6.0, 4.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.9921875, -11.5582275390625, -11.124267578125, -10.6903076171875, -10.25634765625, -9.8223876953125, -9.388427734375, -8.9544677734375, -8.5205078125, -8.0865478515625, -7.652587890625, -7.2186279296875, -6.78466796875, -6.3507080078125, -5.916748046875, -5.4827880859375, -5.048828125, -4.6148681640625, -4.180908203125, -3.7469482421875, -3.31298828125, -2.8790283203125, -2.445068359375, -2.0111083984375, -1.5771484375, -1.1431884765625, -0.709228515625, -0.2752685546875, 0.15869140625, 0.5926513671875, 1.026611328125, 1.4605712890625, 1.89453125, 2.3284912109375, 2.762451171875, 3.1964111328125, 3.63037109375, 4.0643310546875, 4.498291015625, 4.9322509765625, 5.3662109375, 5.8001708984375, 6.234130859375, 6.6680908203125, 7.10205078125, 7.5360107421875, 7.969970703125, 8.4039306640625, 8.837890625, 9.2718505859375, 9.705810546875, 10.1397705078125, 10.57373046875, 11.0076904296875, 11.441650390625, 11.8756103515625, 12.3095703125, 12.7435302734375, 13.177490234375, 13.6114501953125, 14.04541015625, 14.4793701171875, 14.913330078125, 15.3472900390625, 15.78125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 8.0, 10.0, 17.0, 21.0, 25.0, 29.0, 62.0, 76.0, 106.0, 175.0, 211.0, 321.0, 482.0, 742.0, 1073.0, 1905.0, 3377.0, 5842.0, 10586.0, 21308.0, 45321.0, 103494.0, 225616.0, 303445.0, 175850.0, 76763.0, 34464.0, 16505.0, 8638.0, 4729.0, 2785.0, 1711.0, 998.0, 590.0, 388.0, 290.0, 185.0, 123.0, 82.0, 62.0, 40.0, 28.0, 25.0, 13.0, 9.0, 12.0, 3.0, 5.0, 6.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.53125, -12.1312255859375, -11.731201171875, -11.3311767578125, -10.93115234375, -10.5311279296875, -10.131103515625, -9.7310791015625, -9.3310546875, -8.9310302734375, -8.531005859375, -8.1309814453125, -7.73095703125, -7.3309326171875, -6.930908203125, -6.5308837890625, -6.130859375, -5.7308349609375, -5.330810546875, -4.9307861328125, -4.53076171875, -4.1307373046875, -3.730712890625, -3.3306884765625, -2.9306640625, -2.5306396484375, -2.130615234375, -1.7305908203125, -1.33056640625, -0.9305419921875, -0.530517578125, -0.1304931640625, 0.26953125, 0.6695556640625, 1.069580078125, 1.4696044921875, 1.86962890625, 2.2696533203125, 2.669677734375, 3.0697021484375, 3.4697265625, 3.8697509765625, 4.269775390625, 4.6697998046875, 5.06982421875, 5.4698486328125, 5.869873046875, 6.2698974609375, 6.669921875, 7.0699462890625, 7.469970703125, 7.8699951171875, 8.27001953125, 8.6700439453125, 9.070068359375, 9.4700927734375, 9.8701171875, 10.2701416015625, 10.670166015625, 11.0701904296875, 11.47021484375, 11.8702392578125, 12.270263671875, 12.6702880859375, 13.0703125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 7.0, 7.0, 7.0, 7.0, 8.0, 8.0, 16.0, 20.0, 21.0, 21.0, 23.0, 25.0, 28.0, 34.0, 24.0, 37.0, 46.0, 45.0, 39.0, 46.0, 45.0, 33.0, 41.0, 37.0, 32.0, 33.0, 38.0, 31.0, 29.0, 30.0, 38.0, 22.0, 23.0, 19.0, 12.0, 11.0, 8.0, 12.0, 7.0, 7.0, 3.0, 9.0, 8.0, 6.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.67578125, -6.45330810546875, -6.2308349609375, -6.00836181640625, -5.785888671875, -5.56341552734375, -5.3409423828125, -5.11846923828125, -4.89599609375, -4.67352294921875, -4.4510498046875, -4.22857666015625, -4.006103515625, -3.78363037109375, -3.5611572265625, -3.33868408203125, -3.1162109375, -2.89373779296875, -2.6712646484375, -2.44879150390625, -2.226318359375, -2.00384521484375, -1.7813720703125, -1.55889892578125, -1.33642578125, -1.11395263671875, -0.8914794921875, -0.66900634765625, -0.446533203125, -0.22406005859375, -0.0015869140625, 0.22088623046875, 0.443359375, 0.66583251953125, 0.8883056640625, 1.11077880859375, 1.333251953125, 1.55572509765625, 1.7781982421875, 2.00067138671875, 2.22314453125, 2.44561767578125, 2.6680908203125, 2.89056396484375, 3.113037109375, 3.33551025390625, 3.5579833984375, 3.78045654296875, 4.0029296875, 4.22540283203125, 4.4478759765625, 4.67034912109375, 4.892822265625, 5.11529541015625, 5.3377685546875, 5.56024169921875, 5.78271484375, 6.00518798828125, 6.2276611328125, 6.45013427734375, 6.672607421875, 6.89508056640625, 7.1175537109375, 7.34002685546875, 7.5625]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 7.0, 7.0, 9.0, 19.0, 15.0, 32.0, 45.0, 49.0, 75.0, 120.0, 170.0, 219.0, 373.0, 617.0, 1000.0, 1904.0, 3539.0, 8567.0, 22213.0, 69292.0, 246418.0, 448925.0, 166677.0, 48547.0, 16441.0, 6357.0, 2880.0, 1541.0, 893.0, 554.0, 321.0, 226.0, 153.0, 96.0, 66.0, 67.0, 24.0, 31.0, 16.0, 12.0, 9.0, 9.0, 5.0, 8.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0], "bins": [-6.3828125, -6.19140625, -6.0, -5.80859375, -5.6171875, -5.42578125, -5.234375, -5.04296875, -4.8515625, -4.66015625, -4.46875, -4.27734375, -4.0859375, -3.89453125, -3.703125, -3.51171875, -3.3203125, -3.12890625, -2.9375, -2.74609375, -2.5546875, -2.36328125, -2.171875, -1.98046875, -1.7890625, -1.59765625, -1.40625, -1.21484375, -1.0234375, -0.83203125, -0.640625, -0.44921875, -0.2578125, -0.06640625, 0.125, 0.31640625, 0.5078125, 0.69921875, 0.890625, 1.08203125, 1.2734375, 1.46484375, 1.65625, 1.84765625, 2.0390625, 2.23046875, 2.421875, 2.61328125, 2.8046875, 2.99609375, 3.1875, 3.37890625, 3.5703125, 3.76171875, 3.953125, 4.14453125, 4.3359375, 4.52734375, 4.71875, 4.91015625, 5.1015625, 5.29296875, 5.484375, 5.67578125, 5.8671875]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 4.0, 6.0, 4.0, 6.0, 13.0, 12.0, 16.0, 31.0, 45.0, 72.0, 102.0, 126.0, 107.0, 138.0, 85.0, 78.0, 45.0, 51.0, 24.0, 16.0, 12.0, 9.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004858970642089844, -0.0004732981324195862, -0.000460699200630188, -0.0004481002688407898, -0.0004355013370513916, -0.0004229024052619934, -0.0004103034734725952, -0.000397704541683197, -0.00038510560989379883, -0.00037250667810440063, -0.00035990774631500244, -0.00034730881452560425, -0.00033470988273620605, -0.00032211095094680786, -0.00030951201915740967, -0.0002969130873680115, -0.0002843141555786133, -0.0002717152237892151, -0.0002591162919998169, -0.0002465173602104187, -0.0002339184284210205, -0.00022131949663162231, -0.00020872056484222412, -0.00019612163305282593, -0.00018352270126342773, -0.00017092376947402954, -0.00015832483768463135, -0.00014572590589523315, -0.00013312697410583496, -0.00012052804231643677, -0.00010792911052703857, -9.533017873764038e-05, -8.273124694824219e-05, -7.0132315158844e-05, -5.75333833694458e-05, -4.493445158004761e-05, -3.2335519790649414e-05, -1.973658800125122e-05, -7.137656211853027e-06, 5.461275577545166e-06, 1.806020736694336e-05, 3.065913915634155e-05, 4.3258070945739746e-05, 5.585700273513794e-05, 6.845593452453613e-05, 8.105486631393433e-05, 9.365379810333252e-05, 0.00010625272989273071, 0.0001188516616821289, 0.0001314505934715271, 0.0001440495252609253, 0.00015664845705032349, 0.00016924738883972168, 0.00018184632062911987, 0.00019444525241851807, 0.00020704418420791626, 0.00021964311599731445, 0.00023224204778671265, 0.00024484097957611084, 0.00025743991136550903, 0.0002700388431549072, 0.0002826377749443054, 0.0002952367067337036, 0.0003078356385231018, 0.0003204345703125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 4.0, 3.0, 12.0, 13.0, 21.0, 24.0, 31.0, 42.0, 61.0, 95.0, 117.0, 203.0, 286.0, 461.0, 790.0, 1625.0, 3693.0, 9966.0, 32080.0, 116019.0, 353109.0, 359816.0, 119348.0, 32871.0, 10228.0, 3797.0, 1633.0, 853.0, 449.0, 310.0, 181.0, 114.0, 80.0, 59.0, 58.0, 32.0, 19.0, 20.0, 13.0, 8.0, 7.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.6953125, -6.49249267578125, -6.2896728515625, -6.08685302734375, -5.884033203125, -5.68121337890625, -5.4783935546875, -5.27557373046875, -5.07275390625, -4.86993408203125, -4.6671142578125, -4.46429443359375, -4.261474609375, -4.05865478515625, -3.8558349609375, -3.65301513671875, -3.4501953125, -3.24737548828125, -3.0445556640625, -2.84173583984375, -2.638916015625, -2.43609619140625, -2.2332763671875, -2.03045654296875, -1.82763671875, -1.62481689453125, -1.4219970703125, -1.21917724609375, -1.016357421875, -0.81353759765625, -0.6107177734375, -0.40789794921875, -0.205078125, -0.00225830078125, 0.2005615234375, 0.40338134765625, 0.606201171875, 0.80902099609375, 1.0118408203125, 1.21466064453125, 1.41748046875, 1.62030029296875, 1.8231201171875, 2.02593994140625, 2.228759765625, 2.43157958984375, 2.6343994140625, 2.83721923828125, 3.0400390625, 3.24285888671875, 3.4456787109375, 3.64849853515625, 3.851318359375, 4.05413818359375, 4.2569580078125, 4.45977783203125, 4.66259765625, 4.86541748046875, 5.0682373046875, 5.27105712890625, 5.473876953125, 5.67669677734375, 5.8795166015625, 6.08233642578125, 6.28515625]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 4.0, 7.0, 9.0, 20.0, 22.0, 43.0, 63.0, 115.0, 131.0, 135.0, 118.0, 114.0, 74.0, 44.0, 40.0, 28.0, 16.0, 3.0, 8.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.359375, -2.28955078125, -2.2197265625, -2.14990234375, -2.080078125, -2.01025390625, -1.9404296875, -1.87060546875, -1.80078125, -1.73095703125, -1.6611328125, -1.59130859375, -1.521484375, -1.45166015625, -1.3818359375, -1.31201171875, -1.2421875, -1.17236328125, -1.1025390625, -1.03271484375, -0.962890625, -0.89306640625, -0.8232421875, -0.75341796875, -0.68359375, -0.61376953125, -0.5439453125, -0.47412109375, -0.404296875, -0.33447265625, -0.2646484375, -0.19482421875, -0.125, -0.05517578125, 0.0146484375, 0.08447265625, 0.154296875, 0.22412109375, 0.2939453125, 0.36376953125, 0.43359375, 0.50341796875, 0.5732421875, 0.64306640625, 0.712890625, 0.78271484375, 0.8525390625, 0.92236328125, 0.9921875, 1.06201171875, 1.1318359375, 1.20166015625, 1.271484375, 1.34130859375, 1.4111328125, 1.48095703125, 1.55078125, 1.62060546875, 1.6904296875, 1.76025390625, 1.830078125, 1.89990234375, 1.9697265625, 2.03955078125, 2.109375]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 8.0, 8.0, 4.0, 14.0, 21.0, 23.0, 21.0, 35.0, 42.0, 52.0, 56.0, 76.0, 108.0, 93.0, 88.0, 73.0, 62.0, 57.0, 40.0, 29.0, 16.0, 17.0, 14.0, 7.0, 9.0, 11.0, 5.0, 3.0, 1.0, 0.0, 4.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-29.336435317993164, -28.623172760009766, -27.909908294677734, -27.196643829345703, -26.483381271362305, -25.770118713378906, -25.056854248046875, -24.343589782714844, -23.630327224731445, -22.917064666748047, -22.203800201416016, -21.490535736083984, -20.777273178100586, -20.064010620117188, -19.350746154785156, -18.637481689453125, -17.924219131469727, -17.210956573486328, -16.497692108154297, -15.784428596496582, -15.071165084838867, -14.357901573181152, -13.644638061523438, -12.931374549865723, -12.218111038208008, -11.504847526550293, -10.791584014892578, -10.078320503234863, -9.365056991577148, -8.651793479919434, -7.938529968261719, -7.225266456604004, -6.512004852294922, -5.798741340637207, -5.085477828979492, -4.372214317321777, -3.6589508056640625, -2.9456872940063477, -2.232423782348633, -1.519160270690918, -0.8058967590332031, -0.09263324737548828, 0.6206302642822266, 1.3338937759399414, 2.0471572875976562, 2.760420799255371, 3.473684310913086, 4.186947822570801, 4.900211334228516, 5.6134748458862305, 6.326738357543945, 7.04000186920166, 7.753265380859375, 8.46652889251709, 9.179792404174805, 9.89305591583252, 10.606319427490234, 11.31958293914795, 12.032846450805664, 12.746109962463379, 13.459373474121094, 14.172636985778809, 14.885900497436523, 15.599164009094238, 16.312427520751953]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 4.0, 7.0, 7.0, 13.0, 10.0, 13.0, 13.0, 13.0, 17.0, 23.0, 22.0, 32.0, 43.0, 47.0, 48.0, 34.0, 37.0, 42.0, 57.0, 58.0, 48.0, 53.0, 42.0, 57.0, 37.0, 34.0, 34.0, 23.0, 25.0, 20.0, 19.0, 14.0, 17.0, 12.0, 9.0, 7.0, 4.0, 3.0, 5.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-15.124489784240723, -14.69525146484375, -14.266013145446777, -13.836774826049805, -13.407536506652832, -12.97829818725586, -12.54905891418457, -12.119821548461914, -11.690582275390625, -11.261343955993652, -10.83210563659668, -10.402867317199707, -9.973628997802734, -9.544390678405762, -9.115152359008789, -8.6859130859375, -8.256675720214844, -7.827437400817871, -7.398199081420898, -6.968960762023926, -6.539722442626953, -6.1104841232299805, -5.68124532699585, -5.252007007598877, -4.822768688201904, -4.393530368804932, -3.964292049407959, -3.5350534915924072, -3.1058151721954346, -2.676576852798462, -2.24733829498291, -1.8180999755859375, -1.3888616561889648, -0.9596232771873474, -0.53038489818573, -0.10114645957946777, 0.3280918598175049, 0.7573301792144775, 1.1865687370300293, 1.615807056427002, 2.0450453758239746, 2.4742836952209473, 2.90352201461792, 3.3327605724334717, 3.7619988918304443, 4.191237449645996, 4.620475769042969, 5.049714088439941, 5.478952407836914, 5.908190727233887, 6.337429046630859, 6.766667366027832, 7.195905685424805, 7.625144004821777, 8.05438232421875, 8.483621597290039, 8.912858963012695, 9.342097282409668, 9.77133560180664, 10.200573921203613, 10.629812240600586, 11.059050559997559, 11.488288879394531, 11.91752815246582, 12.346766471862793]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 9.0, 17.0, 10.0, 36.0, 43.0, 85.0, 132.0, 298.0, 529.0, 1127.0, 2188.0, 4562.0, 10088.0, 22317.0, 52380.0, 120587.0, 236622.0, 281719.0, 174394.0, 79168.0, 34355.0, 14796.0, 6734.0, 3210.0, 1529.0, 750.0, 408.0, 211.0, 109.0, 71.0, 24.0, 18.0, 15.0, 9.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.578125, -23.8388671875, -23.099609375, -22.3603515625, -21.62109375, -20.8818359375, -20.142578125, -19.4033203125, -18.6640625, -17.9248046875, -17.185546875, -16.4462890625, -15.70703125, -14.9677734375, -14.228515625, -13.4892578125, -12.75, -12.0107421875, -11.271484375, -10.5322265625, -9.79296875, -9.0537109375, -8.314453125, -7.5751953125, -6.8359375, -6.0966796875, -5.357421875, -4.6181640625, -3.87890625, -3.1396484375, -2.400390625, -1.6611328125, -0.921875, -0.1826171875, 0.556640625, 1.2958984375, 2.03515625, 2.7744140625, 3.513671875, 4.2529296875, 4.9921875, 5.7314453125, 6.470703125, 7.2099609375, 7.94921875, 8.6884765625, 9.427734375, 10.1669921875, 10.90625, 11.6455078125, 12.384765625, 13.1240234375, 13.86328125, 14.6025390625, 15.341796875, 16.0810546875, 16.8203125, 17.5595703125, 18.298828125, 19.0380859375, 19.77734375, 20.5166015625, 21.255859375, 21.9951171875, 22.734375]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 6.0, 1.0, 7.0, 14.0, 6.0, 9.0, 9.0, 17.0, 12.0, 16.0, 24.0, 20.0, 36.0, 23.0, 31.0, 42.0, 43.0, 44.0, 43.0, 44.0, 58.0, 52.0, 57.0, 47.0, 43.0, 41.0, 32.0, 32.0, 34.0, 28.0, 24.0, 13.0, 14.0, 18.0, 13.0, 15.0, 10.0, 8.0, 5.0, 5.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0], "bins": [-15.34375, -14.915283203125, -14.48681640625, -14.058349609375, -13.6298828125, -13.201416015625, -12.77294921875, -12.344482421875, -11.916015625, -11.487548828125, -11.05908203125, -10.630615234375, -10.2021484375, -9.773681640625, -9.34521484375, -8.916748046875, -8.48828125, -8.059814453125, -7.63134765625, -7.202880859375, -6.7744140625, -6.345947265625, -5.91748046875, -5.489013671875, -5.060546875, -4.632080078125, -4.20361328125, -3.775146484375, -3.3466796875, -2.918212890625, -2.48974609375, -2.061279296875, -1.6328125, -1.204345703125, -0.77587890625, -0.347412109375, 0.0810546875, 0.509521484375, 0.93798828125, 1.366455078125, 1.794921875, 2.223388671875, 2.65185546875, 3.080322265625, 3.5087890625, 3.937255859375, 4.36572265625, 4.794189453125, 5.22265625, 5.651123046875, 6.07958984375, 6.508056640625, 6.9365234375, 7.364990234375, 7.79345703125, 8.221923828125, 8.650390625, 9.078857421875, 9.50732421875, 9.935791015625, 10.3642578125, 10.792724609375, 11.22119140625, 11.649658203125, 12.078125]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 4.0, 3.0, 1.0, 7.0, 6.0, 9.0, 12.0, 17.0, 21.0, 23.0, 42.0, 61.0, 81.0, 109.0, 145.0, 207.0, 315.0, 477.0, 724.0, 1215.0, 2211.0, 4094.0, 8173.0, 16676.0, 34862.0, 75483.0, 151671.0, 243722.0, 235411.0, 140494.0, 68874.0, 31701.0, 15161.0, 7440.0, 3787.0, 2020.0, 1182.0, 710.0, 414.0, 276.0, 207.0, 144.0, 99.0, 63.0, 61.0, 40.0, 40.0, 23.0, 13.0, 10.0, 12.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0], "bins": [-20.3125, -19.676513671875, -19.04052734375, -18.404541015625, -17.7685546875, -17.132568359375, -16.49658203125, -15.860595703125, -15.224609375, -14.588623046875, -13.95263671875, -13.316650390625, -12.6806640625, -12.044677734375, -11.40869140625, -10.772705078125, -10.13671875, -9.500732421875, -8.86474609375, -8.228759765625, -7.5927734375, -6.956787109375, -6.32080078125, -5.684814453125, -5.048828125, -4.412841796875, -3.77685546875, -3.140869140625, -2.5048828125, -1.868896484375, -1.23291015625, -0.596923828125, 0.0390625, 0.675048828125, 1.31103515625, 1.947021484375, 2.5830078125, 3.218994140625, 3.85498046875, 4.490966796875, 5.126953125, 5.762939453125, 6.39892578125, 7.034912109375, 7.6708984375, 8.306884765625, 8.94287109375, 9.578857421875, 10.21484375, 10.850830078125, 11.48681640625, 12.122802734375, 12.7587890625, 13.394775390625, 14.03076171875, 14.666748046875, 15.302734375, 15.938720703125, 16.57470703125, 17.210693359375, 17.8466796875, 18.482666015625, 19.11865234375, 19.754638671875, 20.390625]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 4.0, 9.0, 14.0, 11.0, 10.0, 16.0, 25.0, 20.0, 25.0, 33.0, 39.0, 26.0, 49.0, 56.0, 33.0, 41.0, 52.0, 47.0, 43.0, 45.0, 46.0, 37.0, 49.0, 29.0, 30.0, 43.0, 29.0, 26.0, 20.0, 20.0, 14.0, 11.0, 13.0, 11.0, 4.0, 3.0, 7.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-10.0703125, -9.806640625, -9.54296875, -9.279296875, -9.015625, -8.751953125, -8.48828125, -8.224609375, -7.9609375, -7.697265625, -7.43359375, -7.169921875, -6.90625, -6.642578125, -6.37890625, -6.115234375, -5.8515625, -5.587890625, -5.32421875, -5.060546875, -4.796875, -4.533203125, -4.26953125, -4.005859375, -3.7421875, -3.478515625, -3.21484375, -2.951171875, -2.6875, -2.423828125, -2.16015625, -1.896484375, -1.6328125, -1.369140625, -1.10546875, -0.841796875, -0.578125, -0.314453125, -0.05078125, 0.212890625, 0.4765625, 0.740234375, 1.00390625, 1.267578125, 1.53125, 1.794921875, 2.05859375, 2.322265625, 2.5859375, 2.849609375, 3.11328125, 3.376953125, 3.640625, 3.904296875, 4.16796875, 4.431640625, 4.6953125, 4.958984375, 5.22265625, 5.486328125, 5.75, 6.013671875, 6.27734375, 6.541015625, 6.8046875]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 3.0, 9.0, 6.0, 15.0, 29.0, 22.0, 31.0, 54.0, 78.0, 90.0, 110.0, 174.0, 231.0, 353.0, 501.0, 800.0, 1208.0, 1987.0, 3327.0, 5590.0, 10038.0, 18844.0, 35354.0, 68007.0, 129417.0, 210585.0, 228582.0, 154563.0, 83367.0, 43282.0, 22576.0, 12213.0, 6665.0, 3833.0, 2291.0, 1433.0, 908.0, 593.0, 400.0, 293.0, 197.0, 144.0, 109.0, 76.0, 50.0, 37.0, 29.0, 14.0, 13.0, 11.0, 5.0, 3.0, 6.0, 4.0, 2.0, 0.0, 0.0, 2.0], "bins": [-8.1640625, -7.91015625, -7.65625, -7.40234375, -7.1484375, -6.89453125, -6.640625, -6.38671875, -6.1328125, -5.87890625, -5.625, -5.37109375, -5.1171875, -4.86328125, -4.609375, -4.35546875, -4.1015625, -3.84765625, -3.59375, -3.33984375, -3.0859375, -2.83203125, -2.578125, -2.32421875, -2.0703125, -1.81640625, -1.5625, -1.30859375, -1.0546875, -0.80078125, -0.546875, -0.29296875, -0.0390625, 0.21484375, 0.46875, 0.72265625, 0.9765625, 1.23046875, 1.484375, 1.73828125, 1.9921875, 2.24609375, 2.5, 2.75390625, 3.0078125, 3.26171875, 3.515625, 3.76953125, 4.0234375, 4.27734375, 4.53125, 4.78515625, 5.0390625, 5.29296875, 5.546875, 5.80078125, 6.0546875, 6.30859375, 6.5625, 6.81640625, 7.0703125, 7.32421875, 7.578125, 7.83203125, 8.0859375]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 3.0, 7.0, 9.0, 8.0, 9.0, 16.0, 9.0, 34.0, 18.0, 37.0, 55.0, 64.0, 80.0, 81.0, 77.0, 87.0, 97.0, 78.0, 37.0, 51.0, 33.0, 24.0, 23.0, 11.0, 15.0, 10.0, 9.0, 6.0, 5.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.0011339187622070312, -0.001104898750782013, -0.0010758787393569946, -0.0010468587279319763, -0.001017838716506958, -0.0009888187050819397, -0.0009597986936569214, -0.0009307786822319031, -0.0009017586708068848, -0.0008727386593818665, -0.0008437186479568481, -0.0008146986365318298, -0.0007856786251068115, -0.0007566586136817932, -0.0007276386022567749, -0.0006986185908317566, -0.0006695985794067383, -0.00064057856798172, -0.0006115585565567017, -0.0005825385451316833, -0.000553518533706665, -0.0005244985222816467, -0.0004954785108566284, -0.0004664584994316101, -0.0004374384880065918, -0.0004084184765815735, -0.0003793984651565552, -0.00035037845373153687, -0.00032135844230651855, -0.00029233843088150024, -0.00026331841945648193, -0.00023429840803146362, -0.0002052783966064453, -0.000176258385181427, -0.0001472383737564087, -0.00011821836233139038, -8.919835090637207e-05, -6.017833948135376e-05, -3.115832805633545e-05, -2.1383166313171387e-06, 2.6881694793701172e-05, 5.590170621871948e-05, 8.492171764373779e-05, 0.0001139417290687561, 0.00014296174049377441, 0.00017198175191879272, 0.00020100176334381104, 0.00023002177476882935, 0.00025904178619384766, 0.00028806179761886597, 0.0003170818090438843, 0.0003461018204689026, 0.0003751218318939209, 0.0004041418433189392, 0.0004331618547439575, 0.00046218186616897583, 0.0004912018775939941, 0.0005202218890190125, 0.0005492419004440308, 0.0005782619118690491, 0.0006072819232940674, 0.0006363019347190857, 0.000665321946144104, 0.0006943419575691223, 0.0007233619689941406]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 7.0, 11.0, 11.0, 11.0, 26.0, 35.0, 56.0, 74.0, 70.0, 120.0, 179.0, 239.0, 416.0, 596.0, 976.0, 1618.0, 2659.0, 4889.0, 8986.0, 16789.0, 33133.0, 67011.0, 133677.0, 223501.0, 237980.0, 154044.0, 78817.0, 38863.0, 19540.0, 10485.0, 5602.0, 3124.0, 1866.0, 1071.0, 693.0, 410.0, 284.0, 179.0, 158.0, 96.0, 67.0, 48.0, 35.0, 30.0, 25.0, 12.0, 16.0, 10.0, 3.0, 7.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-8.390625, -8.1209716796875, -7.851318359375, -7.5816650390625, -7.31201171875, -7.0423583984375, -6.772705078125, -6.5030517578125, -6.2333984375, -5.9637451171875, -5.694091796875, -5.4244384765625, -5.15478515625, -4.8851318359375, -4.615478515625, -4.3458251953125, -4.076171875, -3.8065185546875, -3.536865234375, -3.2672119140625, -2.99755859375, -2.7279052734375, -2.458251953125, -2.1885986328125, -1.9189453125, -1.6492919921875, -1.379638671875, -1.1099853515625, -0.84033203125, -0.5706787109375, -0.301025390625, -0.0313720703125, 0.23828125, 0.5079345703125, 0.777587890625, 1.0472412109375, 1.31689453125, 1.5865478515625, 1.856201171875, 2.1258544921875, 2.3955078125, 2.6651611328125, 2.934814453125, 3.2044677734375, 3.47412109375, 3.7437744140625, 4.013427734375, 4.2830810546875, 4.552734375, 4.8223876953125, 5.092041015625, 5.3616943359375, 5.63134765625, 5.9010009765625, 6.170654296875, 6.4403076171875, 6.7099609375, 6.9796142578125, 7.249267578125, 7.5189208984375, 7.78857421875, 8.0582275390625, 8.327880859375, 8.5975341796875, 8.8671875]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 0.0, 1.0, 0.0, 4.0, 6.0, 4.0, 1.0, 8.0, 8.0, 7.0, 13.0, 8.0, 15.0, 17.0, 16.0, 26.0, 34.0, 37.0, 34.0, 42.0, 52.0, 68.0, 75.0, 80.0, 55.0, 70.0, 51.0, 56.0, 41.0, 31.0, 24.0, 30.0, 17.0, 10.0, 11.0, 12.0, 12.0, 6.0, 9.0, 4.0, 1.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-2.923828125, -2.8406982421875, -2.757568359375, -2.6744384765625, -2.59130859375, -2.5081787109375, -2.425048828125, -2.3419189453125, -2.2587890625, -2.1756591796875, -2.092529296875, -2.0093994140625, -1.92626953125, -1.8431396484375, -1.760009765625, -1.6768798828125, -1.59375, -1.5106201171875, -1.427490234375, -1.3443603515625, -1.26123046875, -1.1781005859375, -1.094970703125, -1.0118408203125, -0.9287109375, -0.8455810546875, -0.762451171875, -0.6793212890625, -0.59619140625, -0.5130615234375, -0.429931640625, -0.3468017578125, -0.263671875, -0.1805419921875, -0.097412109375, -0.0142822265625, 0.06884765625, 0.1519775390625, 0.235107421875, 0.3182373046875, 0.4013671875, 0.4844970703125, 0.567626953125, 0.6507568359375, 0.73388671875, 0.8170166015625, 0.900146484375, 0.9832763671875, 1.06640625, 1.1495361328125, 1.232666015625, 1.3157958984375, 1.39892578125, 1.4820556640625, 1.565185546875, 1.6483154296875, 1.7314453125, 1.8145751953125, 1.897705078125, 1.9808349609375, 2.06396484375, 2.1470947265625, 2.230224609375, 2.3133544921875, 2.396484375]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 5.0, 8.0, 6.0, 7.0, 20.0, 19.0, 21.0, 25.0, 38.0, 42.0, 70.0, 68.0, 80.0, 79.0, 94.0, 78.0, 64.0, 70.0, 53.0, 38.0, 22.0, 24.0, 16.0, 12.0, 10.0, 6.0, 7.0, 7.0, 2.0, 6.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.061565399169922, -25.35848045349121, -24.655397415161133, -23.952312469482422, -23.249229431152344, -22.546144485473633, -21.843059539794922, -21.139976501464844, -20.436893463134766, -19.733808517456055, -19.030725479125977, -18.327640533447266, -17.624557495117188, -16.921472549438477, -16.218387603759766, -15.515304565429688, -14.812219619750977, -14.109135627746582, -13.406051635742188, -12.702966690063477, -11.999883651733398, -11.296798706054688, -10.593714714050293, -9.890630722045898, -9.187546730041504, -8.48446273803711, -7.781378746032715, -7.078294277191162, -6.375210285186768, -5.672126293182373, -4.96904182434082, -4.265957832336426, -3.5628719329833984, -2.859787940979004, -2.1567037105560303, -1.4536194801330566, -0.7505354881286621, -0.04745149612426758, 0.6556329727172852, 1.3587169647216797, 2.061800956726074, 2.7648849487304688, 3.4679691791534424, 4.171053409576416, 4.8741374015808105, 5.577221393585205, 6.280305862426758, 6.983389854431152, 7.686473846435547, 8.389557838439941, 9.092641830444336, 9.795726776123047, 10.498809814453125, 11.201894760131836, 11.90497875213623, 12.608062744140625, 13.31114673614502, 14.014230728149414, 14.717314720153809, 15.420398712158203, 16.123483657836914, 16.826566696166992, 17.529651641845703, 18.23273468017578, 18.935819625854492]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 4.0, 6.0, 13.0, 14.0, 13.0, 19.0, 20.0, 16.0, 19.0, 27.0, 28.0, 47.0, 39.0, 37.0, 49.0, 39.0, 61.0, 37.0, 40.0, 58.0, 51.0, 58.0, 45.0, 43.0, 33.0, 28.0, 28.0, 26.0, 18.0, 12.0, 16.0, 16.0, 9.0, 8.0, 5.0, 6.0, 4.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.976397514343262, -13.553116798400879, -13.129836082458496, -12.70655632019043, -12.283275604248047, -11.859994888305664, -11.436714172363281, -11.013433456420898, -10.590153694152832, -10.16687297821045, -9.743592262268066, -9.3203125, -8.897031784057617, -8.473751068115234, -8.050470352172852, -7.627190113067627, -7.203909397125244, -6.780628681182861, -6.357348442077637, -5.934067726135254, -5.510787487030029, -5.0875067710876465, -4.664226531982422, -4.240945816040039, -3.8176653385162354, -3.3943848609924316, -2.971104383468628, -2.547823905944824, -2.1245431900024414, -1.7012627124786377, -1.277982234954834, -0.8547017574310303, -0.43142127990722656, -0.008140772581100464, 0.41513973474502563, 0.8384202718734741, 1.2617007493972778, 1.684981346130371, 2.108261823654175, 2.5315423011779785, 2.9548227787017822, 3.378103256225586, 3.8013837337493896, 4.224664211273193, 4.647944927215576, 5.071225166320801, 5.494505882263184, 5.917786598205566, 6.341066837310791, 6.764347553253174, 7.187627792358398, 7.610908508300781, 8.034189224243164, 8.457469940185547, 8.880749702453613, 9.304030418395996, 9.727311134338379, 10.150591850280762, 10.573872566223145, 10.997152328491211, 11.420433044433594, 11.843713760375977, 12.26699447631836, 12.690275192260742, 13.113554954528809]}, "gradients/decoder.bert.encoder.layer.13.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 8.0, 10.0, 17.0, 28.0, 52.0, 90.0, 179.0, 280.0, 547.0, 1088.0, 2446.0, 5311.0, 12701.0, 34321.0, 117322.0, 554860.0, 2081283.0, 1087009.0, 209395.0, 54538.0, 18415.0, 7324.0, 3307.0, 1634.0, 881.0, 484.0, 292.0, 151.0, 106.0, 71.0, 45.0, 31.0, 11.0, 18.0, 8.0, 6.0, 11.0, 2.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.453125, -23.463134765625, -22.47314453125, -21.483154296875, -20.4931640625, -19.503173828125, -18.51318359375, -17.523193359375, -16.533203125, -15.543212890625, -14.55322265625, -13.563232421875, -12.5732421875, -11.583251953125, -10.59326171875, -9.603271484375, -8.61328125, -7.623291015625, -6.63330078125, -5.643310546875, -4.6533203125, -3.663330078125, -2.67333984375, -1.683349609375, -0.693359375, 0.296630859375, 1.28662109375, 2.276611328125, 3.2666015625, 4.256591796875, 5.24658203125, 6.236572265625, 7.2265625, 8.216552734375, 9.20654296875, 10.196533203125, 11.1865234375, 12.176513671875, 13.16650390625, 14.156494140625, 15.146484375, 16.136474609375, 17.12646484375, 18.116455078125, 19.1064453125, 20.096435546875, 21.08642578125, 22.076416015625, 23.06640625, 24.056396484375, 25.04638671875, 26.036376953125, 27.0263671875, 28.016357421875, 29.00634765625, 29.996337890625, 30.986328125, 31.976318359375, 32.96630859375, 33.956298828125, 34.9462890625, 35.936279296875, 36.92626953125, 37.916259765625, 38.90625]}, "gradients/decoder.bert.encoder.layer.13.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 7.0, 13.0, 10.0, 10.0, 13.0, 19.0, 18.0, 26.0, 23.0, 33.0, 29.0, 35.0, 36.0, 47.0, 50.0, 53.0, 64.0, 51.0, 52.0, 50.0, 55.0, 41.0, 45.0, 28.0, 36.0, 25.0, 23.0, 19.0, 15.0, 11.0, 17.0, 18.0, 8.0, 6.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.21875, -9.919677734375, -9.62060546875, -9.321533203125, -9.0224609375, -8.723388671875, -8.42431640625, -8.125244140625, -7.826171875, -7.527099609375, -7.22802734375, -6.928955078125, -6.6298828125, -6.330810546875, -6.03173828125, -5.732666015625, -5.43359375, -5.134521484375, -4.83544921875, -4.536376953125, -4.2373046875, -3.938232421875, -3.63916015625, -3.340087890625, -3.041015625, -2.741943359375, -2.44287109375, -2.143798828125, -1.8447265625, -1.545654296875, -1.24658203125, -0.947509765625, -0.6484375, -0.349365234375, -0.05029296875, 0.248779296875, 0.5478515625, 0.846923828125, 1.14599609375, 1.445068359375, 1.744140625, 2.043212890625, 2.34228515625, 2.641357421875, 2.9404296875, 3.239501953125, 3.53857421875, 3.837646484375, 4.13671875, 4.435791015625, 4.73486328125, 5.033935546875, 5.3330078125, 5.632080078125, 5.93115234375, 6.230224609375, 6.529296875, 6.828369140625, 7.12744140625, 7.426513671875, 7.7255859375, 8.024658203125, 8.32373046875, 8.622802734375, 8.921875]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 5.0, 14.0, 13.0, 23.0, 34.0, 30.0, 67.0, 114.0, 163.0, 232.0, 363.0, 599.0, 960.0, 1565.0, 2549.0, 4277.0, 7362.0, 13273.0, 24438.0, 46810.0, 96179.0, 209579.0, 480952.0, 1025031.0, 1169337.0, 604605.0, 263613.0, 118769.0, 57140.0, 29325.0, 15526.0, 8739.0, 4886.0, 2984.0, 1812.0, 1074.0, 637.0, 433.0, 255.0, 177.0, 101.0, 83.0, 51.0, 41.0, 27.0, 17.0, 10.0, 6.0, 3.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.953125, -16.390625, -15.828125, -15.265625, -14.703125, -14.140625, -13.578125, -13.015625, -12.453125, -11.890625, -11.328125, -10.765625, -10.203125, -9.640625, -9.078125, -8.515625, -7.953125, -7.390625, -6.828125, -6.265625, -5.703125, -5.140625, -4.578125, -4.015625, -3.453125, -2.890625, -2.328125, -1.765625, -1.203125, -0.640625, -0.078125, 0.484375, 1.046875, 1.609375, 2.171875, 2.734375, 3.296875, 3.859375, 4.421875, 4.984375, 5.546875, 6.109375, 6.671875, 7.234375, 7.796875, 8.359375, 8.921875, 9.484375, 10.046875, 10.609375, 11.171875, 11.734375, 12.296875, 12.859375, 13.421875, 13.984375, 14.546875, 15.109375, 15.671875, 16.234375, 16.796875, 17.359375, 17.921875, 18.484375, 19.046875]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 4.0, 4.0, 3.0, 6.0, 6.0, 11.0, 13.0, 17.0, 22.0, 35.0, 33.0, 52.0, 56.0, 74.0, 118.0, 141.0, 185.0, 229.0, 303.0, 321.0, 357.0, 349.0, 296.0, 295.0, 248.0, 202.0, 164.0, 127.0, 90.0, 94.0, 54.0, 39.0, 25.0, 29.0, 24.0, 12.0, 7.0, 16.0, 9.0, 5.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.0859375, -5.90789794921875, -5.7298583984375, -5.55181884765625, -5.373779296875, -5.19573974609375, -5.0177001953125, -4.83966064453125, -4.66162109375, -4.48358154296875, -4.3055419921875, -4.12750244140625, -3.949462890625, -3.77142333984375, -3.5933837890625, -3.41534423828125, -3.2373046875, -3.05926513671875, -2.8812255859375, -2.70318603515625, -2.525146484375, -2.34710693359375, -2.1690673828125, -1.99102783203125, -1.81298828125, -1.63494873046875, -1.4569091796875, -1.27886962890625, -1.100830078125, -0.92279052734375, -0.7447509765625, -0.56671142578125, -0.388671875, -0.21063232421875, -0.0325927734375, 0.14544677734375, 0.323486328125, 0.50152587890625, 0.6795654296875, 0.85760498046875, 1.03564453125, 1.21368408203125, 1.3917236328125, 1.56976318359375, 1.747802734375, 1.92584228515625, 2.1038818359375, 2.28192138671875, 2.4599609375, 2.63800048828125, 2.8160400390625, 2.99407958984375, 3.172119140625, 3.35015869140625, 3.5281982421875, 3.70623779296875, 3.88427734375, 4.06231689453125, 4.2403564453125, 4.41839599609375, 4.596435546875, 4.77447509765625, 4.9525146484375, 5.13055419921875, 5.30859375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 7.0, 5.0, 3.0, 7.0, 10.0, 10.0, 26.0, 27.0, 29.0, 39.0, 59.0, 70.0, 70.0, 102.0, 88.0, 72.0, 83.0, 65.0, 58.0, 41.0, 19.0, 28.0, 15.0, 17.0, 8.0, 12.0, 6.0, 6.0, 4.0, 4.0, 0.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.464479446411133, -22.782136917114258, -22.099794387817383, -21.417451858520508, -20.735107421875, -20.052764892578125, -19.37042236328125, -18.688079833984375, -18.0057373046875, -17.323394775390625, -16.64105224609375, -15.958708763122559, -15.276366233825684, -14.594023704528809, -13.911680221557617, -13.229337692260742, -12.546995162963867, -11.864652633666992, -11.182310104370117, -10.499966621398926, -9.81762409210205, -9.135281562805176, -8.452938079833984, -7.770595550537109, -7.088253021240234, -6.405910491943359, -5.723567485809326, -5.041224479675293, -4.358881950378418, -3.676539182662964, -2.9941964149475098, -2.3118534088134766, -1.6295089721679688, -0.9471662044525146, -0.26482343673706055, 0.41751933097839355, 1.0998620986938477, 1.7822048664093018, 2.464547634124756, 3.146890640258789, 3.829233169555664, 4.511575698852539, 5.193918704986572, 5.8762617111206055, 6.5586042404174805, 7.2409467697143555, 7.923289775848389, 8.605632781982422, 9.287975311279297, 9.970317840576172, 10.652660369873047, 11.335003852844238, 12.017346382141113, 12.699688911437988, 13.38203239440918, 14.064374923706055, 14.74671745300293, 15.429059982299805, 16.11140251159668, 16.793745040893555, 17.476089477539062, 18.158432006835938, 18.840774536132812, 19.523117065429688, 20.205459594726562]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 4.0, 5.0, 3.0, 6.0, 10.0, 5.0, 11.0, 11.0, 7.0, 13.0, 20.0, 18.0, 25.0, 20.0, 23.0, 24.0, 39.0, 47.0, 49.0, 41.0, 38.0, 47.0, 46.0, 48.0, 44.0, 47.0, 43.0, 36.0, 44.0, 40.0, 30.0, 20.0, 24.0, 15.0, 18.0, 21.0, 13.0, 14.0, 7.0, 6.0, 5.0, 9.0, 5.0, 6.0, 3.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.00927734375, -11.652820587158203, -11.296363830566406, -10.93990707397461, -10.583450317382812, -10.226994514465332, -9.870537757873535, -9.514081001281738, -9.157624244689941, -8.801167488098145, -8.444710731506348, -8.08825397491455, -7.731797695159912, -7.375340938568115, -7.018884658813477, -6.66242790222168, -6.305971145629883, -5.949514389038086, -5.593057632446289, -5.23660135269165, -4.8801445960998535, -4.523687839508057, -4.167231559753418, -3.810774803161621, -3.454318046569824, -3.0978612899780273, -2.7414047718048096, -2.384948253631592, -2.028491497039795, -1.6720348596572876, -1.3155782222747803, -0.9591217041015625, -0.602665901184082, -0.2462092638015747, 0.11024737358093262, 0.46670401096343994, 0.8231606483459473, 1.1796172857284546, 1.536073923110962, 1.8925304412841797, 2.2489871978759766, 2.6054439544677734, 2.961900472640991, 3.318356990814209, 3.674813747406006, 4.031270503997803, 4.387726783752441, 4.744183540344238, 5.100640296936035, 5.457097053527832, 5.813553810119629, 6.170010089874268, 6.5264668464660645, 6.882923603057861, 7.2393798828125, 7.595836639404297, 7.952293395996094, 8.30875015258789, 8.665206909179688, 9.021663665771484, 9.378120422363281, 9.734576225280762, 10.091032981872559, 10.447489738464355, 10.803946495056152]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 3.0, 5.0, 8.0, 12.0, 9.0, 19.0, 15.0, 41.0, 36.0, 55.0, 78.0, 112.0, 184.0, 312.0, 418.0, 768.0, 1280.0, 2231.0, 3812.0, 7027.0, 13418.0, 28005.0, 60877.0, 134334.0, 256058.0, 265857.0, 145305.0, 66184.0, 30125.0, 14600.0, 7588.0, 4037.0, 2219.0, 1366.0, 790.0, 467.0, 273.0, 185.0, 119.0, 96.0, 58.0, 49.0, 40.0, 21.0, 21.0, 10.0, 12.0, 12.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-10.9296875, -10.5989990234375, -10.268310546875, -9.9376220703125, -9.60693359375, -9.2762451171875, -8.945556640625, -8.6148681640625, -8.2841796875, -7.9534912109375, -7.622802734375, -7.2921142578125, -6.96142578125, -6.6307373046875, -6.300048828125, -5.9693603515625, -5.638671875, -5.3079833984375, -4.977294921875, -4.6466064453125, -4.31591796875, -3.9852294921875, -3.654541015625, -3.3238525390625, -2.9931640625, -2.6624755859375, -2.331787109375, -2.0010986328125, -1.67041015625, -1.3397216796875, -1.009033203125, -0.6783447265625, -0.34765625, -0.0169677734375, 0.313720703125, 0.6444091796875, 0.97509765625, 1.3057861328125, 1.636474609375, 1.9671630859375, 2.2978515625, 2.6285400390625, 2.959228515625, 3.2899169921875, 3.62060546875, 3.9512939453125, 4.281982421875, 4.6126708984375, 4.943359375, 5.2740478515625, 5.604736328125, 5.9354248046875, 6.26611328125, 6.5968017578125, 6.927490234375, 7.2581787109375, 7.5888671875, 7.9195556640625, 8.250244140625, 8.5809326171875, 8.91162109375, 9.2423095703125, 9.572998046875, 9.9036865234375, 10.234375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 6.0, 7.0, 4.0, 10.0, 9.0, 11.0, 8.0, 10.0, 15.0, 17.0, 13.0, 23.0, 33.0, 17.0, 32.0, 36.0, 33.0, 42.0, 44.0, 54.0, 50.0, 47.0, 66.0, 37.0, 44.0, 28.0, 38.0, 42.0, 33.0, 29.0, 28.0, 19.0, 16.0, 19.0, 21.0, 12.0, 7.0, 5.0, 11.0, 6.0, 3.0, 6.0, 8.0, 7.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0], "bins": [-13.3125, -12.9403076171875, -12.568115234375, -12.1959228515625, -11.82373046875, -11.4515380859375, -11.079345703125, -10.7071533203125, -10.3349609375, -9.9627685546875, -9.590576171875, -9.2183837890625, -8.84619140625, -8.4739990234375, -8.101806640625, -7.7296142578125, -7.357421875, -6.9852294921875, -6.613037109375, -6.2408447265625, -5.86865234375, -5.4964599609375, -5.124267578125, -4.7520751953125, -4.3798828125, -4.0076904296875, -3.635498046875, -3.2633056640625, -2.89111328125, -2.5189208984375, -2.146728515625, -1.7745361328125, -1.40234375, -1.0301513671875, -0.657958984375, -0.2857666015625, 0.08642578125, 0.4586181640625, 0.830810546875, 1.2030029296875, 1.5751953125, 1.9473876953125, 2.319580078125, 2.6917724609375, 3.06396484375, 3.4361572265625, 3.808349609375, 4.1805419921875, 4.552734375, 4.9249267578125, 5.297119140625, 5.6693115234375, 6.04150390625, 6.4136962890625, 6.785888671875, 7.1580810546875, 7.5302734375, 7.9024658203125, 8.274658203125, 8.6468505859375, 9.01904296875, 9.3912353515625, 9.763427734375, 10.1356201171875, 10.5078125]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 5.0, 6.0, 12.0, 20.0, 15.0, 25.0, 38.0, 47.0, 86.0, 110.0, 178.0, 227.0, 371.0, 571.0, 934.0, 1487.0, 2593.0, 4607.0, 8908.0, 17868.0, 40172.0, 97612.0, 236540.0, 333131.0, 174031.0, 69861.0, 29301.0, 13711.0, 6897.0, 3652.0, 2083.0, 1261.0, 769.0, 494.0, 320.0, 190.0, 126.0, 82.0, 74.0, 45.0, 22.0, 17.0, 17.0, 16.0, 7.0, 10.0, 8.0, 2.0, 0.0, 2.0, 3.0, 0.0, 2.0], "bins": [-14.7578125, -14.3277587890625, -13.897705078125, -13.4676513671875, -13.03759765625, -12.6075439453125, -12.177490234375, -11.7474365234375, -11.3173828125, -10.8873291015625, -10.457275390625, -10.0272216796875, -9.59716796875, -9.1671142578125, -8.737060546875, -8.3070068359375, -7.876953125, -7.4468994140625, -7.016845703125, -6.5867919921875, -6.15673828125, -5.7266845703125, -5.296630859375, -4.8665771484375, -4.4365234375, -4.0064697265625, -3.576416015625, -3.1463623046875, -2.71630859375, -2.2862548828125, -1.856201171875, -1.4261474609375, -0.99609375, -0.5660400390625, -0.135986328125, 0.2940673828125, 0.72412109375, 1.1541748046875, 1.584228515625, 2.0142822265625, 2.4443359375, 2.8743896484375, 3.304443359375, 3.7344970703125, 4.16455078125, 4.5946044921875, 5.024658203125, 5.4547119140625, 5.884765625, 6.3148193359375, 6.744873046875, 7.1749267578125, 7.60498046875, 8.0350341796875, 8.465087890625, 8.8951416015625, 9.3251953125, 9.7552490234375, 10.185302734375, 10.6153564453125, 11.04541015625, 11.4754638671875, 11.905517578125, 12.3355712890625, 12.765625]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 4.0, 1.0, 3.0, 7.0, 8.0, 13.0, 8.0, 12.0, 11.0, 17.0, 20.0, 21.0, 31.0, 29.0, 25.0, 38.0, 29.0, 28.0, 41.0, 28.0, 41.0, 45.0, 35.0, 48.0, 44.0, 41.0, 27.0, 41.0, 44.0, 41.0, 34.0, 22.0, 19.0, 31.0, 19.0, 17.0, 20.0, 7.0, 10.0, 8.0, 11.0, 6.0, 8.0, 3.0, 8.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-6.9296875, -6.72015380859375, -6.5106201171875, -6.30108642578125, -6.091552734375, -5.88201904296875, -5.6724853515625, -5.46295166015625, -5.25341796875, -5.04388427734375, -4.8343505859375, -4.62481689453125, -4.415283203125, -4.20574951171875, -3.9962158203125, -3.78668212890625, -3.5771484375, -3.36761474609375, -3.1580810546875, -2.94854736328125, -2.739013671875, -2.52947998046875, -2.3199462890625, -2.11041259765625, -1.90087890625, -1.69134521484375, -1.4818115234375, -1.27227783203125, -1.062744140625, -0.85321044921875, -0.6436767578125, -0.43414306640625, -0.224609375, -0.01507568359375, 0.1944580078125, 0.40399169921875, 0.613525390625, 0.82305908203125, 1.0325927734375, 1.24212646484375, 1.45166015625, 1.66119384765625, 1.8707275390625, 2.08026123046875, 2.289794921875, 2.49932861328125, 2.7088623046875, 2.91839599609375, 3.1279296875, 3.33746337890625, 3.5469970703125, 3.75653076171875, 3.966064453125, 4.17559814453125, 4.3851318359375, 4.59466552734375, 4.80419921875, 5.01373291015625, 5.2232666015625, 5.43280029296875, 5.642333984375, 5.85186767578125, 6.0614013671875, 6.27093505859375, 6.48046875]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 9.0, 10.0, 14.0, 22.0, 19.0, 34.0, 53.0, 59.0, 78.0, 157.0, 247.0, 330.0, 536.0, 845.0, 1495.0, 2781.0, 5390.0, 10822.0, 25129.0, 63105.0, 172528.0, 373762.0, 240611.0, 87924.0, 33721.0, 14312.0, 6531.0, 3321.0, 1825.0, 1026.0, 651.0, 395.0, 268.0, 171.0, 117.0, 78.0, 53.0, 35.0, 18.0, 28.0, 18.0, 11.0, 4.0, 8.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.05078125, -4.89129638671875, -4.7318115234375, -4.57232666015625, -4.412841796875, -4.25335693359375, -4.0938720703125, -3.93438720703125, -3.77490234375, -3.61541748046875, -3.4559326171875, -3.29644775390625, -3.136962890625, -2.97747802734375, -2.8179931640625, -2.65850830078125, -2.4990234375, -2.33953857421875, -2.1800537109375, -2.02056884765625, -1.861083984375, -1.70159912109375, -1.5421142578125, -1.38262939453125, -1.22314453125, -1.06365966796875, -0.9041748046875, -0.74468994140625, -0.585205078125, -0.42572021484375, -0.2662353515625, -0.10675048828125, 0.052734375, 0.21221923828125, 0.3717041015625, 0.53118896484375, 0.690673828125, 0.85015869140625, 1.0096435546875, 1.16912841796875, 1.32861328125, 1.48809814453125, 1.6475830078125, 1.80706787109375, 1.966552734375, 2.12603759765625, 2.2855224609375, 2.44500732421875, 2.6044921875, 2.76397705078125, 2.9234619140625, 3.08294677734375, 3.242431640625, 3.40191650390625, 3.5614013671875, 3.72088623046875, 3.88037109375, 4.03985595703125, 4.1993408203125, 4.35882568359375, 4.518310546875, 4.67779541015625, 4.8372802734375, 4.99676513671875, 5.15625]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 4.0, 1.0, 3.0, 1.0, 3.0, 8.0, 4.0, 9.0, 12.0, 20.0, 22.0, 29.0, 40.0, 46.0, 59.0, 69.0, 103.0, 89.0, 89.0, 79.0, 77.0, 52.0, 46.0, 33.0, 26.0, 23.0, 9.0, 7.0, 9.0, 4.0, 5.0, 1.0, 4.0, 7.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0003216266632080078, -0.0003117993474006653, -0.00030197203159332275, -0.0002921447157859802, -0.0002823173999786377, -0.00027249008417129517, -0.00026266276836395264, -0.0002528354525566101, -0.00024300813674926758, -0.00023318082094192505, -0.00022335350513458252, -0.00021352618932724, -0.00020369887351989746, -0.00019387155771255493, -0.0001840442419052124, -0.00017421692609786987, -0.00016438961029052734, -0.00015456229448318481, -0.00014473497867584229, -0.00013490766286849976, -0.00012508034706115723, -0.0001152530312538147, -0.00010542571544647217, -9.559839963912964e-05, -8.577108383178711e-05, -7.594376802444458e-05, -6.611645221710205e-05, -5.628913640975952e-05, -4.646182060241699e-05, -3.663450479507446e-05, -2.6807188987731934e-05, -1.6979873180389404e-05, -7.152557373046875e-06, 2.6747584342956543e-06, 1.2502074241638184e-05, 2.2329390048980713e-05, 3.215670585632324e-05, 4.198402166366577e-05, 5.18113374710083e-05, 6.163865327835083e-05, 7.146596908569336e-05, 8.129328489303589e-05, 9.112060070037842e-05, 0.00010094791650772095, 0.00011077523231506348, 0.000120602548122406, 0.00013042986392974854, 0.00014025717973709106, 0.0001500844955444336, 0.00015991181135177612, 0.00016973912715911865, 0.00017956644296646118, 0.0001893937587738037, 0.00019922107458114624, 0.00020904839038848877, 0.0002188757061958313, 0.00022870302200317383, 0.00023853033781051636, 0.0002483576536178589, 0.0002581849694252014, 0.00026801228523254395, 0.0002778396010398865, 0.000287666916847229, 0.00029749423265457153, 0.00030732154846191406]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 0.0, 4.0, 3.0, 14.0, 20.0, 17.0, 22.0, 25.0, 33.0, 56.0, 52.0, 113.0, 114.0, 173.0, 229.0, 315.0, 411.0, 594.0, 912.0, 1470.0, 2445.0, 4652.0, 9602.0, 21253.0, 50508.0, 126737.0, 271195.0, 296039.0, 151386.0, 60822.0, 25280.0, 11113.0, 5303.0, 2724.0, 1571.0, 968.0, 668.0, 434.0, 322.0, 241.0, 202.0, 135.0, 113.0, 66.0, 52.0, 39.0, 42.0, 17.0, 19.0, 15.0, 11.0, 3.0, 3.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.65625, -4.50653076171875, -4.3568115234375, -4.20709228515625, -4.057373046875, -3.90765380859375, -3.7579345703125, -3.60821533203125, -3.45849609375, -3.30877685546875, -3.1590576171875, -3.00933837890625, -2.859619140625, -2.70989990234375, -2.5601806640625, -2.41046142578125, -2.2607421875, -2.11102294921875, -1.9613037109375, -1.81158447265625, -1.661865234375, -1.51214599609375, -1.3624267578125, -1.21270751953125, -1.06298828125, -0.91326904296875, -0.7635498046875, -0.61383056640625, -0.464111328125, -0.31439208984375, -0.1646728515625, -0.01495361328125, 0.134765625, 0.28448486328125, 0.4342041015625, 0.58392333984375, 0.733642578125, 0.88336181640625, 1.0330810546875, 1.18280029296875, 1.33251953125, 1.48223876953125, 1.6319580078125, 1.78167724609375, 1.931396484375, 2.08111572265625, 2.2308349609375, 2.38055419921875, 2.5302734375, 2.67999267578125, 2.8297119140625, 2.97943115234375, 3.129150390625, 3.27886962890625, 3.4285888671875, 3.57830810546875, 3.72802734375, 3.87774658203125, 4.0274658203125, 4.17718505859375, 4.326904296875, 4.47662353515625, 4.6263427734375, 4.77606201171875, 4.92578125]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 5.0, 10.0, 10.0, 21.0, 29.0, 43.0, 59.0, 85.0, 110.0, 114.0, 117.0, 115.0, 85.0, 66.0, 33.0, 39.0, 19.0, 12.0, 11.0, 5.0, 3.0, 5.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8974609375, -1.8362579345703125, -1.775054931640625, -1.7138519287109375, -1.65264892578125, -1.5914459228515625, -1.530242919921875, -1.4690399169921875, -1.4078369140625, -1.3466339111328125, -1.285430908203125, -1.2242279052734375, -1.16302490234375, -1.1018218994140625, -1.040618896484375, -0.9794158935546875, -0.918212890625, -0.8570098876953125, -0.795806884765625, -0.7346038818359375, -0.67340087890625, -0.6121978759765625, -0.550994873046875, -0.4897918701171875, -0.4285888671875, -0.3673858642578125, -0.306182861328125, -0.2449798583984375, -0.18377685546875, -0.1225738525390625, -0.061370849609375, -0.0001678466796875, 0.06103515625, 0.1222381591796875, 0.183441162109375, 0.2446441650390625, 0.30584716796875, 0.3670501708984375, 0.428253173828125, 0.4894561767578125, 0.5506591796875, 0.6118621826171875, 0.673065185546875, 0.7342681884765625, 0.79547119140625, 0.8566741943359375, 0.917877197265625, 0.9790802001953125, 1.040283203125, 1.1014862060546875, 1.162689208984375, 1.2238922119140625, 1.28509521484375, 1.3462982177734375, 1.407501220703125, 1.4687042236328125, 1.5299072265625, 1.5911102294921875, 1.652313232421875, 1.7135162353515625, 1.77471923828125, 1.8359222412109375, 1.897125244140625, 1.9583282470703125, 2.01953125]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 4.0, 4.0, 7.0, 3.0, 9.0, 15.0, 15.0, 31.0, 28.0, 33.0, 59.0, 67.0, 82.0, 89.0, 99.0, 87.0, 74.0, 73.0, 55.0, 35.0, 29.0, 24.0, 11.0, 23.0, 9.0, 8.0, 7.0, 8.0, 2.0, 1.0, 3.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.203750610351562, -24.492664337158203, -23.78157615661621, -23.07048988342285, -22.35940170288086, -21.6483154296875, -20.93722915649414, -20.22614097595215, -19.51505470275879, -18.80396842956543, -18.092880249023438, -17.381793975830078, -16.670705795288086, -15.959619522094727, -15.24853229522705, -14.537445068359375, -13.8263578414917, -13.115270614624023, -12.404183387756348, -11.693096160888672, -10.982009887695312, -10.270922660827637, -9.559835433959961, -8.848749160766602, -8.13766098022461, -7.426573753356934, -6.715487003326416, -6.00439977645874, -5.293313026428223, -4.582225799560547, -3.871138572692871, -3.1600518226623535, -2.448965072631836, -1.7378780841827393, -1.026790976524353, -0.3157038688659668, 0.3953831195831299, 1.1064701080322266, 1.8175573348999023, 2.52864408493042, 3.2397313117980957, 3.9508183002471924, 4.661905288696289, 5.372992515563965, 6.084079742431641, 6.795166492462158, 7.506253719329834, 8.217340469360352, 8.928427696228027, 9.639514923095703, 10.350602149963379, 11.061689376831055, 11.772775650024414, 12.48386287689209, 13.194950103759766, 13.906036376953125, 14.617124557495117, 15.328211784362793, 16.03929901123047, 16.750385284423828, 17.46147346496582, 18.17255973815918, 18.883647918701172, 19.59473419189453, 20.30582046508789]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 6.0, 4.0, 3.0, 7.0, 9.0, 8.0, 12.0, 7.0, 11.0, 16.0, 17.0, 17.0, 25.0, 21.0, 21.0, 25.0, 43.0, 40.0, 42.0, 45.0, 37.0, 48.0, 45.0, 42.0, 49.0, 51.0, 34.0, 46.0, 36.0, 39.0, 32.0, 23.0, 20.0, 16.0, 23.0, 17.0, 17.0, 12.0, 5.0, 9.0, 6.0, 6.0, 8.0, 2.0, 4.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.688831329345703, -11.343927383422852, -10.999024391174316, -10.654120445251465, -10.30921745300293, -9.964313507080078, -9.619409561157227, -9.274505615234375, -8.92960262298584, -8.584698677062988, -8.239795684814453, -7.894891738891602, -7.549988269805908, -7.205084800720215, -6.860180854797363, -6.51527738571167, -6.170373916625977, -5.825470447540283, -5.48056697845459, -5.135663032531738, -4.790759563446045, -4.445856094360352, -4.1009521484375, -3.7560486793518066, -3.4111452102661133, -3.06624174118042, -2.7213380336761475, -2.376434326171875, -2.0315308570861816, -1.6866272687911987, -1.3417236804962158, -0.9968199729919434, -0.6519174575805664, -0.3070138692855835, 0.037889719009399414, 0.3827933073043823, 0.7276968955993652, 1.0726004838943481, 1.417504072189331, 1.7624077796936035, 2.107311248779297, 2.4522147178649902, 2.7971184253692627, 3.142022132873535, 3.4869256019592285, 3.831829071044922, 4.176733016967773, 4.521636486053467, 4.86653995513916, 5.2114434242248535, 5.556346893310547, 5.901250839233398, 6.246154308319092, 6.591057777404785, 6.935961723327637, 7.28086519241333, 7.625768661499023, 7.970672130584717, 8.31557559967041, 8.660479545593262, 9.005382537841797, 9.350286483764648, 9.6951904296875, 10.040094375610352, 10.384997367858887]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 5.0, 5.0, 12.0, 7.0, 13.0, 20.0, 40.0, 41.0, 68.0, 119.0, 169.0, 280.0, 407.0, 679.0, 1065.0, 1701.0, 2879.0, 4736.0, 7924.0, 13978.0, 24311.0, 42409.0, 72150.0, 118963.0, 171616.0, 189690.0, 153105.0, 99673.0, 59650.0, 34689.0, 19721.0, 11425.0, 6817.0, 3986.0, 2291.0, 1471.0, 902.0, 531.0, 327.0, 233.0, 138.0, 110.0, 81.0, 41.0, 24.0, 21.0, 13.0, 3.0, 6.0, 3.0, 6.0, 2.0, 2.0, 4.0, 3.0], "bins": [-15.1015625, -14.6614990234375, -14.221435546875, -13.7813720703125, -13.34130859375, -12.9012451171875, -12.461181640625, -12.0211181640625, -11.5810546875, -11.1409912109375, -10.700927734375, -10.2608642578125, -9.82080078125, -9.3807373046875, -8.940673828125, -8.5006103515625, -8.060546875, -7.6204833984375, -7.180419921875, -6.7403564453125, -6.30029296875, -5.8602294921875, -5.420166015625, -4.9801025390625, -4.5400390625, -4.0999755859375, -3.659912109375, -3.2198486328125, -2.77978515625, -2.3397216796875, -1.899658203125, -1.4595947265625, -1.01953125, -0.5794677734375, -0.139404296875, 0.3006591796875, 0.74072265625, 1.1807861328125, 1.620849609375, 2.0609130859375, 2.5009765625, 2.9410400390625, 3.381103515625, 3.8211669921875, 4.26123046875, 4.7012939453125, 5.141357421875, 5.5814208984375, 6.021484375, 6.4615478515625, 6.901611328125, 7.3416748046875, 7.78173828125, 8.2218017578125, 8.661865234375, 9.1019287109375, 9.5419921875, 9.9820556640625, 10.422119140625, 10.8621826171875, 11.30224609375, 11.7423095703125, 12.182373046875, 12.6224365234375, 13.0625]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 8.0, 4.0, 9.0, 4.0, 7.0, 14.0, 15.0, 17.0, 21.0, 24.0, 21.0, 31.0, 44.0, 43.0, 50.0, 51.0, 49.0, 46.0, 45.0, 50.0, 56.0, 40.0, 58.0, 37.0, 44.0, 30.0, 34.0, 24.0, 24.0, 24.0, 17.0, 10.0, 8.0, 15.0, 5.0, 6.0, 9.0, 7.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.59375, -12.183837890625, -11.77392578125, -11.364013671875, -10.9541015625, -10.544189453125, -10.13427734375, -9.724365234375, -9.314453125, -8.904541015625, -8.49462890625, -8.084716796875, -7.6748046875, -7.264892578125, -6.85498046875, -6.445068359375, -6.03515625, -5.625244140625, -5.21533203125, -4.805419921875, -4.3955078125, -3.985595703125, -3.57568359375, -3.165771484375, -2.755859375, -2.345947265625, -1.93603515625, -1.526123046875, -1.1162109375, -0.706298828125, -0.29638671875, 0.113525390625, 0.5234375, 0.933349609375, 1.34326171875, 1.753173828125, 2.1630859375, 2.572998046875, 2.98291015625, 3.392822265625, 3.802734375, 4.212646484375, 4.62255859375, 5.032470703125, 5.4423828125, 5.852294921875, 6.26220703125, 6.672119140625, 7.08203125, 7.491943359375, 7.90185546875, 8.311767578125, 8.7216796875, 9.131591796875, 9.54150390625, 9.951416015625, 10.361328125, 10.771240234375, 11.18115234375, 11.591064453125, 12.0009765625, 12.410888671875, 12.82080078125, 13.230712890625, 13.640625]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 4.0, 0.0, 3.0, 4.0, 2.0, 6.0, 10.0, 16.0, 16.0, 31.0, 38.0, 70.0, 108.0, 130.0, 209.0, 297.0, 512.0, 840.0, 1385.0, 2353.0, 4073.0, 7239.0, 13249.0, 25557.0, 49297.0, 94381.0, 164703.0, 222726.0, 196780.0, 123594.0, 66357.0, 34520.0, 17776.0, 9555.0, 5230.0, 2913.0, 1713.0, 1069.0, 659.0, 381.0, 236.0, 168.0, 112.0, 70.0, 51.0, 36.0, 23.0, 21.0, 14.0, 8.0, 7.0, 3.0, 4.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-17.15625, -16.615478515625, -16.07470703125, -15.533935546875, -14.9931640625, -14.452392578125, -13.91162109375, -13.370849609375, -12.830078125, -12.289306640625, -11.74853515625, -11.207763671875, -10.6669921875, -10.126220703125, -9.58544921875, -9.044677734375, -8.50390625, -7.963134765625, -7.42236328125, -6.881591796875, -6.3408203125, -5.800048828125, -5.25927734375, -4.718505859375, -4.177734375, -3.636962890625, -3.09619140625, -2.555419921875, -2.0146484375, -1.473876953125, -0.93310546875, -0.392333984375, 0.1484375, 0.689208984375, 1.22998046875, 1.770751953125, 2.3115234375, 2.852294921875, 3.39306640625, 3.933837890625, 4.474609375, 5.015380859375, 5.55615234375, 6.096923828125, 6.6376953125, 7.178466796875, 7.71923828125, 8.260009765625, 8.80078125, 9.341552734375, 9.88232421875, 10.423095703125, 10.9638671875, 11.504638671875, 12.04541015625, 12.586181640625, 13.126953125, 13.667724609375, 14.20849609375, 14.749267578125, 15.2900390625, 15.830810546875, 16.37158203125, 16.912353515625, 17.453125]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 7.0, 6.0, 6.0, 3.0, 5.0, 5.0, 10.0, 11.0, 13.0, 7.0, 20.0, 29.0, 14.0, 27.0, 21.0, 23.0, 32.0, 25.0, 42.0, 39.0, 31.0, 30.0, 34.0, 44.0, 41.0, 35.0, 34.0, 35.0, 37.0, 37.0, 27.0, 28.0, 32.0, 22.0, 30.0, 21.0, 15.0, 16.0, 16.0, 15.0, 15.0, 14.0, 10.0, 9.0, 3.0, 8.0, 2.0, 6.0, 3.0, 4.0, 1.0, 5.0, 3.0, 4.0, 1.0, 0.0, 3.0], "bins": [-6.01953125, -5.82952880859375, -5.6395263671875, -5.44952392578125, -5.259521484375, -5.06951904296875, -4.8795166015625, -4.68951416015625, -4.49951171875, -4.30950927734375, -4.1195068359375, -3.92950439453125, -3.739501953125, -3.54949951171875, -3.3594970703125, -3.16949462890625, -2.9794921875, -2.78948974609375, -2.5994873046875, -2.40948486328125, -2.219482421875, -2.02947998046875, -1.8394775390625, -1.64947509765625, -1.45947265625, -1.26947021484375, -1.0794677734375, -0.88946533203125, -0.699462890625, -0.50946044921875, -0.3194580078125, -0.12945556640625, 0.060546875, 0.25054931640625, 0.4405517578125, 0.63055419921875, 0.820556640625, 1.01055908203125, 1.2005615234375, 1.39056396484375, 1.58056640625, 1.77056884765625, 1.9605712890625, 2.15057373046875, 2.340576171875, 2.53057861328125, 2.7205810546875, 2.91058349609375, 3.1005859375, 3.29058837890625, 3.4805908203125, 3.67059326171875, 3.860595703125, 4.05059814453125, 4.2406005859375, 4.43060302734375, 4.62060546875, 4.81060791015625, 5.0006103515625, 5.19061279296875, 5.380615234375, 5.57061767578125, 5.7606201171875, 5.95062255859375, 6.140625]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 5.0, 11.0, 10.0, 25.0, 35.0, 50.0, 101.0, 125.0, 209.0, 366.0, 640.0, 1035.0, 1816.0, 3086.0, 5288.0, 9748.0, 18050.0, 33747.0, 64932.0, 122252.0, 199199.0, 226885.0, 164458.0, 91694.0, 48467.0, 25113.0, 13586.0, 7469.0, 4183.0, 2388.0, 1412.0, 845.0, 498.0, 327.0, 196.0, 130.0, 58.0, 41.0, 28.0, 23.0, 10.0, 8.0, 5.0, 4.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.046875, -5.853515625, -5.66015625, -5.466796875, -5.2734375, -5.080078125, -4.88671875, -4.693359375, -4.5, -4.306640625, -4.11328125, -3.919921875, -3.7265625, -3.533203125, -3.33984375, -3.146484375, -2.953125, -2.759765625, -2.56640625, -2.373046875, -2.1796875, -1.986328125, -1.79296875, -1.599609375, -1.40625, -1.212890625, -1.01953125, -0.826171875, -0.6328125, -0.439453125, -0.24609375, -0.052734375, 0.140625, 0.333984375, 0.52734375, 0.720703125, 0.9140625, 1.107421875, 1.30078125, 1.494140625, 1.6875, 1.880859375, 2.07421875, 2.267578125, 2.4609375, 2.654296875, 2.84765625, 3.041015625, 3.234375, 3.427734375, 3.62109375, 3.814453125, 4.0078125, 4.201171875, 4.39453125, 4.587890625, 4.78125, 4.974609375, 5.16796875, 5.361328125, 5.5546875, 5.748046875, 5.94140625, 6.134765625, 6.328125]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 0.0, 4.0, 3.0, 9.0, 5.0, 7.0, 24.0, 28.0, 33.0, 31.0, 56.0, 55.0, 65.0, 87.0, 89.0, 114.0, 73.0, 61.0, 69.0, 47.0, 48.0, 23.0, 26.0, 13.0, 9.0, 11.0, 4.0, 3.0, 1.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0007867813110351562, -0.0007650107145309448, -0.0007432401180267334, -0.000721469521522522, -0.0006996989250183105, -0.0006779283285140991, -0.0006561577320098877, -0.0006343871355056763, -0.0006126165390014648, -0.0005908459424972534, -0.000569075345993042, -0.0005473047494888306, -0.0005255341529846191, -0.0005037635564804077, -0.0004819929599761963, -0.00046022236347198486, -0.00043845176696777344, -0.000416681170463562, -0.0003949105739593506, -0.00037313997745513916, -0.00035136938095092773, -0.0003295987844467163, -0.0003078281879425049, -0.00028605759143829346, -0.00026428699493408203, -0.0002425163984298706, -0.00022074580192565918, -0.00019897520542144775, -0.00017720460891723633, -0.0001554340124130249, -0.00013366341590881348, -0.00011189281940460205, -9.012222290039062e-05, -6.83516263961792e-05, -4.6581029891967773e-05, -2.4810433387756348e-05, -3.039836883544922e-06, 1.8730759620666504e-05, 4.050135612487793e-05, 6.227195262908936e-05, 8.404254913330078e-05, 0.00010581314563751221, 0.00012758374214172363, 0.00014935433864593506, 0.00017112493515014648, 0.0001928955316543579, 0.00021466612815856934, 0.00023643672466278076, 0.0002582073211669922, 0.0002799779176712036, 0.00030174851417541504, 0.00032351911067962646, 0.0003452897071838379, 0.0003670603036880493, 0.00038883090019226074, 0.00041060149669647217, 0.0004323720932006836, 0.000454142689704895, 0.00047591328620910645, 0.0004976838827133179, 0.0005194544792175293, 0.0005412250757217407, 0.0005629956722259521, 0.0005847662687301636, 0.000606536865234375]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 7.0, 10.0, 7.0, 25.0, 31.0, 41.0, 59.0, 99.0, 151.0, 223.0, 379.0, 623.0, 1097.0, 1682.0, 2824.0, 4824.0, 8138.0, 14275.0, 25776.0, 46251.0, 82568.0, 140457.0, 201650.0, 198523.0, 136420.0, 79832.0, 44303.0, 24591.0, 14080.0, 7965.0, 4527.0, 2691.0, 1675.0, 1014.0, 641.0, 406.0, 238.0, 148.0, 107.0, 72.0, 43.0, 22.0, 18.0, 21.0, 11.0, 4.0, 6.0, 2.0, 2.0, 2.0, 2.0], "bins": [-6.70703125, -6.52056884765625, -6.3341064453125, -6.14764404296875, -5.961181640625, -5.77471923828125, -5.5882568359375, -5.40179443359375, -5.21533203125, -5.02886962890625, -4.8424072265625, -4.65594482421875, -4.469482421875, -4.28302001953125, -4.0965576171875, -3.91009521484375, -3.7236328125, -3.53717041015625, -3.3507080078125, -3.16424560546875, -2.977783203125, -2.79132080078125, -2.6048583984375, -2.41839599609375, -2.23193359375, -2.04547119140625, -1.8590087890625, -1.67254638671875, -1.486083984375, -1.29962158203125, -1.1131591796875, -0.92669677734375, -0.740234375, -0.55377197265625, -0.3673095703125, -0.18084716796875, 0.005615234375, 0.19207763671875, 0.3785400390625, 0.56500244140625, 0.75146484375, 0.93792724609375, 1.1243896484375, 1.31085205078125, 1.497314453125, 1.68377685546875, 1.8702392578125, 2.05670166015625, 2.2431640625, 2.42962646484375, 2.6160888671875, 2.80255126953125, 2.989013671875, 3.17547607421875, 3.3619384765625, 3.54840087890625, 3.73486328125, 3.92132568359375, 4.1077880859375, 4.29425048828125, 4.480712890625, 4.66717529296875, 4.8536376953125, 5.04010009765625, 5.2265625]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 7.0, 1.0, 4.0, 5.0, 5.0, 6.0, 8.0, 10.0, 17.0, 10.0, 12.0, 16.0, 29.0, 32.0, 37.0, 39.0, 45.0, 55.0, 72.0, 53.0, 56.0, 58.0, 59.0, 48.0, 52.0, 40.0, 37.0, 35.0, 38.0, 22.0, 24.0, 11.0, 9.0, 19.0, 7.0, 10.0, 8.0, 9.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6767578125, -1.6244354248046875, -1.572113037109375, -1.5197906494140625, -1.46746826171875, -1.4151458740234375, -1.362823486328125, -1.3105010986328125, -1.2581787109375, -1.2058563232421875, -1.153533935546875, -1.1012115478515625, -1.04888916015625, -0.9965667724609375, -0.944244384765625, -0.8919219970703125, -0.839599609375, -0.7872772216796875, -0.734954833984375, -0.6826324462890625, -0.63031005859375, -0.5779876708984375, -0.525665283203125, -0.4733428955078125, -0.4210205078125, -0.3686981201171875, -0.316375732421875, -0.2640533447265625, -0.21173095703125, -0.1594085693359375, -0.107086181640625, -0.0547637939453125, -0.00244140625, 0.0498809814453125, 0.102203369140625, 0.1545257568359375, 0.20684814453125, 0.2591705322265625, 0.311492919921875, 0.3638153076171875, 0.4161376953125, 0.4684600830078125, 0.520782470703125, 0.5731048583984375, 0.62542724609375, 0.6777496337890625, 0.730072021484375, 0.7823944091796875, 0.834716796875, 0.8870391845703125, 0.939361572265625, 0.9916839599609375, 1.04400634765625, 1.0963287353515625, 1.148651123046875, 1.2009735107421875, 1.2532958984375, 1.3056182861328125, 1.357940673828125, 1.4102630615234375, 1.46258544921875, 1.5149078369140625, 1.567230224609375, 1.6195526123046875, 1.671875]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 9.0, 10.0, 6.0, 8.0, 10.0, 15.0, 34.0, 27.0, 35.0, 62.0, 72.0, 55.0, 106.0, 64.0, 85.0, 85.0, 58.0, 57.0, 40.0, 29.0, 30.0, 26.0, 12.0, 12.0, 12.0, 7.0, 7.0, 5.0, 3.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.424373626708984, -20.788061141967773, -20.151748657226562, -19.515438079833984, -18.879125595092773, -18.242813110351562, -17.60650062561035, -16.97018814086914, -16.333877563476562, -15.697565078735352, -15.061253547668457, -14.424941062927246, -13.788629531860352, -13.15231704711914, -12.51600456237793, -11.879693031311035, -11.243380546569824, -10.607068061828613, -9.970756530761719, -9.334444046020508, -8.698132514953613, -8.061820030212402, -7.42550802230835, -6.789196014404297, -6.152884006500244, -5.516571998596191, -4.880259990692139, -4.243947982788086, -3.607635736465454, -2.9713237285614014, -2.3350114822387695, -1.6986994743347168, -1.062387466430664, -0.42607539892196655, 0.21023666858673096, 0.8465487957000732, 1.482860803604126, 2.1191728115081787, 2.7554850578308105, 3.3917970657348633, 4.028109073638916, 4.664421081542969, 5.3007330894470215, 5.937045097351074, 6.573357582092285, 7.20966911315918, 7.845981597900391, 8.482294082641602, 9.118605613708496, 9.754918098449707, 10.391229629516602, 11.027542114257812, 11.663853645324707, 12.300166130065918, 12.936477661132812, 13.572790145874023, 14.209102630615234, 14.845415115356445, 15.48172664642334, 16.118038177490234, 16.754350662231445, 17.390663146972656, 18.026975631713867, 18.663288116455078, 19.299598693847656]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 5.0, 5.0, 6.0, 12.0, 15.0, 9.0, 10.0, 11.0, 15.0, 16.0, 25.0, 23.0, 36.0, 31.0, 23.0, 37.0, 38.0, 42.0, 42.0, 42.0, 43.0, 56.0, 41.0, 43.0, 38.0, 42.0, 29.0, 35.0, 32.0, 28.0, 20.0, 23.0, 24.0, 23.0, 18.0, 13.0, 11.0, 10.0, 6.0, 8.0, 5.0, 7.0, 2.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.103266716003418, -9.778627395629883, -9.453987121582031, -9.129347801208496, -8.804708480834961, -8.48006820678711, -8.155428886413574, -7.830789566040039, -7.506149768829346, -7.181509971618652, -6.856870651245117, -6.532230854034424, -6.2075910568237305, -5.882951736450195, -5.558311939239502, -5.233672142028809, -4.909032821655273, -4.58439302444458, -4.259753704071045, -3.9351139068603516, -3.6104743480682373, -3.285834789276123, -2.9611949920654297, -2.6365554332733154, -2.311915874481201, -1.987276315689087, -1.662636637687683, -1.3379969596862793, -1.013357400894165, -0.6887178421020508, -0.364078164100647, -0.039438486099243164, 0.2852001190185547, 0.6098397374153137, 0.9344793558120728, 1.2591190338134766, 1.5837585926055908, 1.908398151397705, 2.2330379486083984, 2.5576775074005127, 2.882317066192627, 3.206956624984741, 3.5315961837768555, 3.856235980987549, 4.180875778198242, 4.505515098571777, 4.830154895782471, 5.154794692993164, 5.479434013366699, 5.804073810577393, 6.128713130950928, 6.453352928161621, 6.777992248535156, 7.10263204574585, 7.427271842956543, 7.751911163330078, 8.07655143737793, 8.401190757751465, 8.725831031799316, 9.050470352172852, 9.375109672546387, 9.699748992919922, 10.024389266967773, 10.349028587341309, 10.673667907714844]}, "gradients/decoder.bert.encoder.layer.12.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 6.0, 7.0, 9.0, 11.0, 26.0, 39.0, 50.0, 83.0, 130.0, 221.0, 376.0, 526.0, 958.0, 1653.0, 2778.0, 4834.0, 9411.0, 18181.0, 37915.0, 89344.0, 246570.0, 767942.0, 1566736.0, 945965.0, 303975.0, 106057.0, 43982.0, 21002.0, 10853.0, 5911.0, 3449.0, 1949.0, 1220.0, 773.0, 455.0, 288.0, 191.0, 139.0, 81.0, 55.0, 33.0, 34.0, 26.0, 12.0, 11.0, 12.0, 5.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.796875, -17.174560546875, -16.55224609375, -15.929931640625, -15.3076171875, -14.685302734375, -14.06298828125, -13.440673828125, -12.818359375, -12.196044921875, -11.57373046875, -10.951416015625, -10.3291015625, -9.706787109375, -9.08447265625, -8.462158203125, -7.83984375, -7.217529296875, -6.59521484375, -5.972900390625, -5.3505859375, -4.728271484375, -4.10595703125, -3.483642578125, -2.861328125, -2.239013671875, -1.61669921875, -0.994384765625, -0.3720703125, 0.250244140625, 0.87255859375, 1.494873046875, 2.1171875, 2.739501953125, 3.36181640625, 3.984130859375, 4.6064453125, 5.228759765625, 5.85107421875, 6.473388671875, 7.095703125, 7.718017578125, 8.34033203125, 8.962646484375, 9.5849609375, 10.207275390625, 10.82958984375, 11.451904296875, 12.07421875, 12.696533203125, 13.31884765625, 13.941162109375, 14.5634765625, 15.185791015625, 15.80810546875, 16.430419921875, 17.052734375, 17.675048828125, 18.29736328125, 18.919677734375, 19.5419921875, 20.164306640625, 20.78662109375, 21.408935546875, 22.03125]}, "gradients/decoder.bert.encoder.layer.12.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 13.0, 9.0, 6.0, 9.0, 19.0, 15.0, 16.0, 13.0, 29.0, 23.0, 23.0, 37.0, 40.0, 28.0, 34.0, 41.0, 53.0, 47.0, 52.0, 46.0, 50.0, 31.0, 38.0, 36.0, 41.0, 44.0, 31.0, 23.0, 23.0, 18.0, 14.0, 14.0, 16.0, 18.0, 14.0, 7.0, 8.0, 1.0, 9.0, 6.0, 5.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-7.80078125, -7.5643310546875, -7.327880859375, -7.0914306640625, -6.85498046875, -6.6185302734375, -6.382080078125, -6.1456298828125, -5.9091796875, -5.6727294921875, -5.436279296875, -5.1998291015625, -4.96337890625, -4.7269287109375, -4.490478515625, -4.2540283203125, -4.017578125, -3.7811279296875, -3.544677734375, -3.3082275390625, -3.07177734375, -2.8353271484375, -2.598876953125, -2.3624267578125, -2.1259765625, -1.8895263671875, -1.653076171875, -1.4166259765625, -1.18017578125, -0.9437255859375, -0.707275390625, -0.4708251953125, -0.234375, 0.0020751953125, 0.238525390625, 0.4749755859375, 0.71142578125, 0.9478759765625, 1.184326171875, 1.4207763671875, 1.6572265625, 1.8936767578125, 2.130126953125, 2.3665771484375, 2.60302734375, 2.8394775390625, 3.075927734375, 3.3123779296875, 3.548828125, 3.7852783203125, 4.021728515625, 4.2581787109375, 4.49462890625, 4.7310791015625, 4.967529296875, 5.2039794921875, 5.4404296875, 5.6768798828125, 5.913330078125, 6.1497802734375, 6.38623046875, 6.6226806640625, 6.859130859375, 7.0955810546875, 7.33203125]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 1.0, 0.0, 6.0, 1.0, 2.0, 7.0, 15.0, 13.0, 27.0, 29.0, 58.0, 75.0, 131.0, 165.0, 294.0, 555.0, 828.0, 1336.0, 2496.0, 4316.0, 7730.0, 14799.0, 28969.0, 60967.0, 133080.0, 319203.0, 787922.0, 1337836.0, 861923.0, 352834.0, 146366.0, 65724.0, 31464.0, 15981.0, 8545.0, 4535.0, 2478.0, 1445.0, 813.0, 473.0, 310.0, 195.0, 120.0, 89.0, 43.0, 36.0, 17.0, 13.0, 9.0, 3.0, 8.0, 3.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-17.828125, -17.24462890625, -16.6611328125, -16.07763671875, -15.494140625, -14.91064453125, -14.3271484375, -13.74365234375, -13.16015625, -12.57666015625, -11.9931640625, -11.40966796875, -10.826171875, -10.24267578125, -9.6591796875, -9.07568359375, -8.4921875, -7.90869140625, -7.3251953125, -6.74169921875, -6.158203125, -5.57470703125, -4.9912109375, -4.40771484375, -3.82421875, -3.24072265625, -2.6572265625, -2.07373046875, -1.490234375, -0.90673828125, -0.3232421875, 0.26025390625, 0.84375, 1.42724609375, 2.0107421875, 2.59423828125, 3.177734375, 3.76123046875, 4.3447265625, 4.92822265625, 5.51171875, 6.09521484375, 6.6787109375, 7.26220703125, 7.845703125, 8.42919921875, 9.0126953125, 9.59619140625, 10.1796875, 10.76318359375, 11.3466796875, 11.93017578125, 12.513671875, 13.09716796875, 13.6806640625, 14.26416015625, 14.84765625, 15.43115234375, 16.0146484375, 16.59814453125, 17.181640625, 17.76513671875, 18.3486328125, 18.93212890625, 19.515625]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 7.0, 4.0, 7.0, 12.0, 13.0, 22.0, 33.0, 36.0, 48.0, 53.0, 60.0, 96.0, 108.0, 163.0, 216.0, 285.0, 310.0, 325.0, 387.0, 325.0, 349.0, 251.0, 221.0, 189.0, 120.0, 112.0, 76.0, 66.0, 47.0, 33.0, 39.0, 21.0, 10.0, 9.0, 8.0, 5.0, 5.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.94140625, -5.76904296875, -5.5966796875, -5.42431640625, -5.251953125, -5.07958984375, -4.9072265625, -4.73486328125, -4.5625, -4.39013671875, -4.2177734375, -4.04541015625, -3.873046875, -3.70068359375, -3.5283203125, -3.35595703125, -3.18359375, -3.01123046875, -2.8388671875, -2.66650390625, -2.494140625, -2.32177734375, -2.1494140625, -1.97705078125, -1.8046875, -1.63232421875, -1.4599609375, -1.28759765625, -1.115234375, -0.94287109375, -0.7705078125, -0.59814453125, -0.42578125, -0.25341796875, -0.0810546875, 0.09130859375, 0.263671875, 0.43603515625, 0.6083984375, 0.78076171875, 0.953125, 1.12548828125, 1.2978515625, 1.47021484375, 1.642578125, 1.81494140625, 1.9873046875, 2.15966796875, 2.33203125, 2.50439453125, 2.6767578125, 2.84912109375, 3.021484375, 3.19384765625, 3.3662109375, 3.53857421875, 3.7109375, 3.88330078125, 4.0556640625, 4.22802734375, 4.400390625, 4.57275390625, 4.7451171875, 4.91748046875, 5.08984375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 6.0, 7.0, 4.0, 7.0, 8.0, 6.0, 15.0, 30.0, 22.0, 45.0, 54.0, 64.0, 69.0, 80.0, 112.0, 86.0, 86.0, 65.0, 62.0, 32.0, 38.0, 27.0, 24.0, 12.0, 8.0, 7.0, 10.0, 7.0, 6.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-28.235580444335938, -27.558937072753906, -26.882291793823242, -26.20564842224121, -25.529003143310547, -24.852359771728516, -24.175716400146484, -23.499073028564453, -22.82242774963379, -22.145784378051758, -21.469139099121094, -20.792495727539062, -20.11585235595703, -19.439207077026367, -18.762563705444336, -18.085918426513672, -17.40927505493164, -16.73263168334961, -16.055986404418945, -15.379343032836914, -14.702698707580566, -14.026054382324219, -13.349411010742188, -12.67276668548584, -11.996122360229492, -11.319478034973145, -10.642833709716797, -9.966190338134766, -9.289546012878418, -8.61290168762207, -7.936257839202881, -7.259613990783691, -6.582969665527344, -5.906325340270996, -5.229681491851807, -4.553037643432617, -3.8763933181762695, -3.199749231338501, -2.5231051445007324, -1.846461296081543, -1.1698169708251953, -0.49317288398742676, 0.1834712028503418, 0.8601152896881104, 1.536759376525879, 2.2134034633636475, 2.890047550201416, 3.5666913986206055, 4.243335723876953, 4.919980049133301, 5.59662389755249, 6.27326774597168, 6.949912071228027, 7.626556396484375, 8.303199768066406, 8.979844093322754, 9.656488418579102, 10.33313274383545, 11.009777069091797, 11.686420440673828, 12.363064765930176, 13.039709091186523, 13.716352462768555, 14.392996788024902, 15.06964111328125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 8.0, 3.0, 2.0, 2.0, 8.0, 7.0, 13.0, 10.0, 14.0, 11.0, 16.0, 19.0, 26.0, 33.0, 31.0, 28.0, 29.0, 42.0, 34.0, 51.0, 41.0, 35.0, 35.0, 40.0, 32.0, 36.0, 33.0, 30.0, 37.0, 31.0, 27.0, 33.0, 33.0, 26.0, 23.0, 20.0, 22.0, 19.0, 16.0, 9.0, 5.0, 10.0, 2.0, 7.0, 4.0, 2.0, 3.0, 3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0], "bins": [-9.291252136230469, -9.004437446594238, -8.717622756958008, -8.430808067321777, -8.143993377685547, -7.857179164886475, -7.570364475250244, -7.283550262451172, -6.996735572814941, -6.709920883178711, -6.4231061935424805, -6.13629150390625, -5.849477291107178, -5.562662601470947, -5.275847911834717, -4.9890336990356445, -4.702218532562256, -4.415403842926025, -4.128589153289795, -3.8417747020721436, -3.554960250854492, -3.2681455612182617, -2.9813308715820312, -2.69451642036438, -2.4077017307281494, -2.120887041091919, -1.8340725898742676, -1.547257900238037, -1.2604433298110962, -0.9736287593841553, -0.6868140697479248, -0.39999961853027344, -0.11318492889404297, 0.17362967133522034, 0.46044427156448364, 0.7472589015960693, 1.0340734720230103, 1.3208880424499512, 1.6077027320861816, 1.894517183303833, 2.1813318729400635, 2.468146562576294, 2.7549610137939453, 3.041775703430176, 3.3285903930664062, 3.6154048442840576, 3.902219533920288, 4.1890339851379395, 4.47584867477417, 4.7626633644104, 5.049478054046631, 5.336292266845703, 5.623106956481934, 5.909921646118164, 6.1967363357543945, 6.483551025390625, 6.7703657150268555, 7.057180404663086, 7.343995094299316, 7.630809783935547, 7.917623996734619, 8.204439163208008, 8.491252899169922, 8.778067588806152, 9.064882278442383]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 7.0, 5.0, 7.0, 5.0, 7.0, 13.0, 20.0, 22.0, 43.0, 61.0, 97.0, 152.0, 245.0, 399.0, 602.0, 1031.0, 1702.0, 2763.0, 4874.0, 8141.0, 14762.0, 26435.0, 49547.0, 90515.0, 155806.0, 217254.0, 195821.0, 124256.0, 69010.0, 37480.0, 20310.0, 11357.0, 6449.0, 3686.0, 2199.0, 1311.0, 784.0, 519.0, 303.0, 187.0, 129.0, 82.0, 61.0, 35.0, 31.0, 14.0, 11.0, 9.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-8.46875, -8.218017578125, -7.96728515625, -7.716552734375, -7.4658203125, -7.215087890625, -6.96435546875, -6.713623046875, -6.462890625, -6.212158203125, -5.96142578125, -5.710693359375, -5.4599609375, -5.209228515625, -4.95849609375, -4.707763671875, -4.45703125, -4.206298828125, -3.95556640625, -3.704833984375, -3.4541015625, -3.203369140625, -2.95263671875, -2.701904296875, -2.451171875, -2.200439453125, -1.94970703125, -1.698974609375, -1.4482421875, -1.197509765625, -0.94677734375, -0.696044921875, -0.4453125, -0.194580078125, 0.05615234375, 0.306884765625, 0.5576171875, 0.808349609375, 1.05908203125, 1.309814453125, 1.560546875, 1.811279296875, 2.06201171875, 2.312744140625, 2.5634765625, 2.814208984375, 3.06494140625, 3.315673828125, 3.56640625, 3.817138671875, 4.06787109375, 4.318603515625, 4.5693359375, 4.820068359375, 5.07080078125, 5.321533203125, 5.572265625, 5.822998046875, 6.07373046875, 6.324462890625, 6.5751953125, 6.825927734375, 7.07666015625, 7.327392578125, 7.578125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 9.0, 5.0, 8.0, 4.0, 8.0, 10.0, 9.0, 15.0, 17.0, 24.0, 21.0, 23.0, 36.0, 25.0, 27.0, 43.0, 43.0, 46.0, 35.0, 44.0, 43.0, 43.0, 43.0, 37.0, 40.0, 44.0, 28.0, 34.0, 35.0, 29.0, 33.0, 13.0, 19.0, 31.0, 14.0, 13.0, 9.0, 12.0, 9.0, 6.0, 3.0, 8.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-10.953125, -10.61474609375, -10.2763671875, -9.93798828125, -9.599609375, -9.26123046875, -8.9228515625, -8.58447265625, -8.24609375, -7.90771484375, -7.5693359375, -7.23095703125, -6.892578125, -6.55419921875, -6.2158203125, -5.87744140625, -5.5390625, -5.20068359375, -4.8623046875, -4.52392578125, -4.185546875, -3.84716796875, -3.5087890625, -3.17041015625, -2.83203125, -2.49365234375, -2.1552734375, -1.81689453125, -1.478515625, -1.14013671875, -0.8017578125, -0.46337890625, -0.125, 0.21337890625, 0.5517578125, 0.89013671875, 1.228515625, 1.56689453125, 1.9052734375, 2.24365234375, 2.58203125, 2.92041015625, 3.2587890625, 3.59716796875, 3.935546875, 4.27392578125, 4.6123046875, 4.95068359375, 5.2890625, 5.62744140625, 5.9658203125, 6.30419921875, 6.642578125, 6.98095703125, 7.3193359375, 7.65771484375, 7.99609375, 8.33447265625, 8.6728515625, 9.01123046875, 9.349609375, 9.68798828125, 10.0263671875, 10.36474609375, 10.703125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 10.0, 11.0, 15.0, 26.0, 32.0, 45.0, 70.0, 109.0, 194.0, 258.0, 389.0, 596.0, 887.0, 1397.0, 2366.0, 4006.0, 6628.0, 12461.0, 23738.0, 47877.0, 101055.0, 207705.0, 285017.0, 180179.0, 85606.0, 40910.0, 20507.0, 11011.0, 6019.0, 3532.0, 2082.0, 1389.0, 803.0, 593.0, 333.0, 247.0, 151.0, 111.0, 61.0, 32.0, 38.0, 27.0, 16.0, 6.0, 7.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.3515625, -9.9993896484375, -9.647216796875, -9.2950439453125, -8.94287109375, -8.5906982421875, -8.238525390625, -7.8863525390625, -7.5341796875, -7.1820068359375, -6.829833984375, -6.4776611328125, -6.12548828125, -5.7733154296875, -5.421142578125, -5.0689697265625, -4.716796875, -4.3646240234375, -4.012451171875, -3.6602783203125, -3.30810546875, -2.9559326171875, -2.603759765625, -2.2515869140625, -1.8994140625, -1.5472412109375, -1.195068359375, -0.8428955078125, -0.49072265625, -0.1385498046875, 0.213623046875, 0.5657958984375, 0.91796875, 1.2701416015625, 1.622314453125, 1.9744873046875, 2.32666015625, 2.6788330078125, 3.031005859375, 3.3831787109375, 3.7353515625, 4.0875244140625, 4.439697265625, 4.7918701171875, 5.14404296875, 5.4962158203125, 5.848388671875, 6.2005615234375, 6.552734375, 6.9049072265625, 7.257080078125, 7.6092529296875, 7.96142578125, 8.3135986328125, 8.665771484375, 9.0179443359375, 9.3701171875, 9.7222900390625, 10.074462890625, 10.4266357421875, 10.77880859375, 11.1309814453125, 11.483154296875, 11.8353271484375, 12.1875]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 7.0, 7.0, 4.0, 8.0, 10.0, 14.0, 11.0, 13.0, 13.0, 16.0, 23.0, 24.0, 23.0, 29.0, 38.0, 44.0, 35.0, 39.0, 39.0, 30.0, 38.0, 42.0, 51.0, 35.0, 37.0, 50.0, 44.0, 29.0, 32.0, 29.0, 25.0, 25.0, 23.0, 20.0, 19.0, 13.0, 9.0, 13.0, 9.0, 4.0, 11.0, 6.0, 9.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.859375, -6.6636962890625, -6.468017578125, -6.2723388671875, -6.07666015625, -5.8809814453125, -5.685302734375, -5.4896240234375, -5.2939453125, -5.0982666015625, -4.902587890625, -4.7069091796875, -4.51123046875, -4.3155517578125, -4.119873046875, -3.9241943359375, -3.728515625, -3.5328369140625, -3.337158203125, -3.1414794921875, -2.94580078125, -2.7501220703125, -2.554443359375, -2.3587646484375, -2.1630859375, -1.9674072265625, -1.771728515625, -1.5760498046875, -1.38037109375, -1.1846923828125, -0.989013671875, -0.7933349609375, -0.59765625, -0.4019775390625, -0.206298828125, -0.0106201171875, 0.18505859375, 0.3807373046875, 0.576416015625, 0.7720947265625, 0.9677734375, 1.1634521484375, 1.359130859375, 1.5548095703125, 1.75048828125, 1.9461669921875, 2.141845703125, 2.3375244140625, 2.533203125, 2.7288818359375, 2.924560546875, 3.1202392578125, 3.31591796875, 3.5115966796875, 3.707275390625, 3.9029541015625, 4.0986328125, 4.2943115234375, 4.489990234375, 4.6856689453125, 4.88134765625, 5.0770263671875, 5.272705078125, 5.4683837890625, 5.6640625]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 7.0, 9.0, 11.0, 12.0, 20.0, 33.0, 28.0, 41.0, 55.0, 65.0, 112.0, 152.0, 198.0, 267.0, 402.0, 669.0, 954.0, 1647.0, 2659.0, 4605.0, 8798.0, 18342.0, 44058.0, 124305.0, 366112.0, 305867.0, 98450.0, 36071.0, 15669.0, 7947.0, 4180.0, 2498.0, 1471.0, 946.0, 590.0, 370.0, 271.0, 198.0, 129.0, 95.0, 69.0, 50.0, 39.0, 20.0, 19.0, 12.0, 14.0, 6.0, 6.0, 7.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.4609375, -5.28973388671875, -5.1185302734375, -4.94732666015625, -4.776123046875, -4.60491943359375, -4.4337158203125, -4.26251220703125, -4.09130859375, -3.92010498046875, -3.7489013671875, -3.57769775390625, -3.406494140625, -3.23529052734375, -3.0640869140625, -2.89288330078125, -2.7216796875, -2.55047607421875, -2.3792724609375, -2.20806884765625, -2.036865234375, -1.86566162109375, -1.6944580078125, -1.52325439453125, -1.35205078125, -1.18084716796875, -1.0096435546875, -0.83843994140625, -0.667236328125, -0.49603271484375, -0.3248291015625, -0.15362548828125, 0.017578125, 0.18878173828125, 0.3599853515625, 0.53118896484375, 0.702392578125, 0.87359619140625, 1.0447998046875, 1.21600341796875, 1.38720703125, 1.55841064453125, 1.7296142578125, 1.90081787109375, 2.072021484375, 2.24322509765625, 2.4144287109375, 2.58563232421875, 2.7568359375, 2.92803955078125, 3.0992431640625, 3.27044677734375, 3.441650390625, 3.61285400390625, 3.7840576171875, 3.95526123046875, 4.12646484375, 4.29766845703125, 4.4688720703125, 4.64007568359375, 4.811279296875, 4.98248291015625, 5.1536865234375, 5.32489013671875, 5.49609375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 6.0, 6.0, 8.0, 5.0, 6.0, 18.0, 25.0, 38.0, 69.0, 126.0, 136.0, 162.0, 154.0, 99.0, 45.0, 35.0, 14.0, 17.0, 7.0, 6.0, 5.0, 4.0, 4.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0005412101745605469, -0.0005239173769950867, -0.0005066245794296265, -0.0004893317818641663, -0.00047203898429870605, -0.00045474618673324585, -0.00043745338916778564, -0.00042016059160232544, -0.00040286779403686523, -0.00038557499647140503, -0.0003682821989059448, -0.0003509894013404846, -0.0003336966037750244, -0.0003164038062095642, -0.000299111008644104, -0.0002818182110786438, -0.0002645254135131836, -0.0002472326159477234, -0.00022993981838226318, -0.00021264702081680298, -0.00019535422325134277, -0.00017806142568588257, -0.00016076862812042236, -0.00014347583055496216, -0.00012618303298950195, -0.00010889023542404175, -9.159743785858154e-05, -7.430464029312134e-05, -5.701184272766113e-05, -3.971904516220093e-05, -2.2426247596740723e-05, -5.133450031280518e-06, 1.2159347534179688e-05, 2.9452145099639893e-05, 4.67449426651001e-05, 6.40377402305603e-05, 8.133053779602051e-05, 9.862333536148071e-05, 0.00011591613292694092, 0.00013320893049240112, 0.00015050172805786133, 0.00016779452562332153, 0.00018508732318878174, 0.00020238012075424194, 0.00021967291831970215, 0.00023696571588516235, 0.00025425851345062256, 0.00027155131101608276, 0.00028884410858154297, 0.0003061369061470032, 0.0003234297037124634, 0.0003407225012779236, 0.0003580152988433838, 0.000375308096408844, 0.0003926008939743042, 0.0004098936915397644, 0.0004271864891052246, 0.0004444792866706848, 0.000461772084236145, 0.0004790648818016052, 0.0004963576793670654, 0.0005136504769325256, 0.0005309432744979858, 0.000548236072063446, 0.0005655288696289062]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 6.0, 5.0, 11.0, 15.0, 16.0, 22.0, 42.0, 82.0, 87.0, 142.0, 190.0, 309.0, 501.0, 781.0, 1297.0, 2263.0, 3841.0, 7277.0, 14032.0, 29037.0, 68265.0, 169363.0, 315911.0, 244777.0, 104837.0, 43362.0, 19831.0, 9749.0, 5312.0, 2846.0, 1648.0, 950.0, 641.0, 382.0, 252.0, 137.0, 119.0, 88.0, 46.0, 30.0, 24.0, 12.0, 9.0, 10.0, 7.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-5.0078125, -4.859375, -4.7109375, -4.5625, -4.4140625, -4.265625, -4.1171875, -3.96875, -3.8203125, -3.671875, -3.5234375, -3.375, -3.2265625, -3.078125, -2.9296875, -2.78125, -2.6328125, -2.484375, -2.3359375, -2.1875, -2.0390625, -1.890625, -1.7421875, -1.59375, -1.4453125, -1.296875, -1.1484375, -1.0, -0.8515625, -0.703125, -0.5546875, -0.40625, -0.2578125, -0.109375, 0.0390625, 0.1875, 0.3359375, 0.484375, 0.6328125, 0.78125, 0.9296875, 1.078125, 1.2265625, 1.375, 1.5234375, 1.671875, 1.8203125, 1.96875, 2.1171875, 2.265625, 2.4140625, 2.5625, 2.7109375, 2.859375, 3.0078125, 3.15625, 3.3046875, 3.453125, 3.6015625, 3.75, 3.8984375, 4.046875, 4.1953125, 4.34375, 4.4921875]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 2.0, 6.0, 4.0, 4.0, 1.0, 3.0, 0.0, 7.0, 6.0, 10.0, 8.0, 12.0, 18.0, 10.0, 11.0, 27.0, 28.0, 28.0, 37.0, 52.0, 50.0, 64.0, 62.0, 64.0, 73.0, 65.0, 43.0, 52.0, 34.0, 35.0, 44.0, 22.0, 21.0, 22.0, 15.0, 15.0, 6.0, 10.0, 6.0, 5.0, 5.0, 2.0, 6.0, 3.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.9990234375, -0.9684524536132812, -0.9378814697265625, -0.9073104858398438, -0.876739501953125, -0.8461685180664062, -0.8155975341796875, -0.7850265502929688, -0.75445556640625, -0.7238845825195312, -0.6933135986328125, -0.6627426147460938, -0.632171630859375, -0.6016006469726562, -0.5710296630859375, -0.5404586791992188, -0.5098876953125, -0.47931671142578125, -0.4487457275390625, -0.41817474365234375, -0.387603759765625, -0.35703277587890625, -0.3264617919921875, -0.29589080810546875, -0.26531982421875, -0.23474884033203125, -0.2041778564453125, -0.17360687255859375, -0.143035888671875, -0.11246490478515625, -0.0818939208984375, -0.05132293701171875, -0.020751953125, 0.00981903076171875, 0.0403900146484375, 0.07096099853515625, 0.101531982421875, 0.13210296630859375, 0.1626739501953125, 0.19324493408203125, 0.22381591796875, 0.25438690185546875, 0.2849578857421875, 0.31552886962890625, 0.346099853515625, 0.37667083740234375, 0.4072418212890625, 0.43781280517578125, 0.4683837890625, 0.49895477294921875, 0.5295257568359375, 0.5600967407226562, 0.590667724609375, 0.6212387084960938, 0.6518096923828125, 0.6823806762695312, 0.71295166015625, 0.7435226440429688, 0.7740936279296875, 0.8046646118164062, 0.835235595703125, 0.8658065795898438, 0.8963775634765625, 0.9269485473632812, 0.95751953125]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 1.0, 9.0, 13.0, 7.0, 13.0, 15.0, 32.0, 35.0, 38.0, 72.0, 79.0, 92.0, 89.0, 92.0, 91.0, 73.0, 52.0, 53.0, 36.0, 30.0, 17.0, 19.0, 9.0, 3.0, 12.0, 7.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-29.266084671020508, -28.569189071655273, -27.872295379638672, -27.175399780273438, -26.478504180908203, -25.7816104888916, -25.084714889526367, -24.387821197509766, -23.69092559814453, -22.994029998779297, -22.297136306762695, -21.60024070739746, -20.90334701538086, -20.206451416015625, -19.50955581665039, -18.812660217285156, -18.115766525268555, -17.41887092590332, -16.72197723388672, -16.025081634521484, -15.328186988830566, -14.631292343139648, -13.934396743774414, -13.237502098083496, -12.540607452392578, -11.84371280670166, -11.146818161010742, -10.449922561645508, -9.75302791595459, -9.056133270263672, -8.359237670898438, -7.6623430252075195, -6.965449333190918, -6.2685546875, -5.571659564971924, -4.874764442443848, -4.17786979675293, -3.4809749126434326, -2.7840800285339355, -2.0871849060058594, -1.3902902603149414, -0.6933953762054443, 0.0034995079040527344, 0.7003943920135498, 1.3972892761230469, 2.094184160232544, 2.791079044342041, 3.487974166870117, 4.184868812561035, 4.881763458251953, 5.578658580780029, 6.2755537033081055, 6.972448348999023, 7.669342994689941, 8.36623764038086, 9.063133239746094, 9.760027885437012, 10.45692253112793, 11.153818130493164, 11.850712776184082, 12.547607421875, 13.244502067565918, 13.941396713256836, 14.63829231262207, 15.335186958312988]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 4.0, 5.0, 6.0, 0.0, 2.0, 9.0, 8.0, 13.0, 13.0, 10.0, 7.0, 21.0, 27.0, 30.0, 26.0, 31.0, 27.0, 33.0, 39.0, 45.0, 40.0, 39.0, 40.0, 35.0, 41.0, 42.0, 36.0, 27.0, 32.0, 35.0, 38.0, 23.0, 33.0, 29.0, 28.0, 17.0, 25.0, 19.0, 17.0, 10.0, 9.0, 5.0, 6.0, 7.0, 3.0, 4.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0], "bins": [-9.192453384399414, -8.90573501586914, -8.61901569366455, -8.332297325134277, -8.045578002929688, -7.758859634399414, -7.472140789031982, -7.185421943664551, -6.898703098297119, -6.6119842529296875, -6.325265407562256, -6.038546562194824, -5.751828193664551, -5.465108871459961, -5.1783905029296875, -4.891671657562256, -4.604952812194824, -4.318233966827393, -4.031515121459961, -3.7447965145111084, -3.4580776691436768, -3.171358823776245, -2.8846402168273926, -2.597921371459961, -2.3112025260925293, -2.0244836807250977, -1.7377649545669556, -1.4510462284088135, -1.1643273830413818, -0.8776085376739502, -0.5908898115158081, -0.304171085357666, -0.017452239990234375, 0.2692665457725525, 0.5559853315353394, 0.8427041172981262, 1.129422903060913, 1.4161417484283447, 1.7028604745864868, 1.989579200744629, 2.2762980461120605, 2.563016891479492, 2.849735736846924, 3.1364543437957764, 3.423173189163208, 3.7098920345306396, 3.996610641479492, 4.283329486846924, 4.5700483322143555, 4.856767177581787, 5.143486022949219, 5.43020486831665, 5.716923713684082, 6.0036420822143555, 6.290360927581787, 6.577079772949219, 6.86379861831665, 7.150517463684082, 7.437236309051514, 7.723955154418945, 8.010673522949219, 8.297392845153809, 8.584111213684082, 8.870830535888672, 9.157548904418945]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 12.0, 6.0, 12.0, 13.0, 23.0, 33.0, 64.0, 92.0, 124.0, 229.0, 386.0, 595.0, 1093.0, 2045.0, 3571.0, 6764.0, 12645.0, 24790.0, 49223.0, 94410.0, 164942.0, 223707.0, 199922.0, 125215.0, 67159.0, 34202.0, 17390.0, 9163.0, 4789.0, 2543.0, 1412.0, 791.0, 473.0, 281.0, 133.0, 102.0, 55.0, 47.0, 31.0, 20.0, 14.0, 12.0, 5.0, 9.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-15.84375, -15.3597412109375, -14.875732421875, -14.3917236328125, -13.90771484375, -13.4237060546875, -12.939697265625, -12.4556884765625, -11.9716796875, -11.4876708984375, -11.003662109375, -10.5196533203125, -10.03564453125, -9.5516357421875, -9.067626953125, -8.5836181640625, -8.099609375, -7.6156005859375, -7.131591796875, -6.6475830078125, -6.16357421875, -5.6795654296875, -5.195556640625, -4.7115478515625, -4.2275390625, -3.7435302734375, -3.259521484375, -2.7755126953125, -2.29150390625, -1.8074951171875, -1.323486328125, -0.8394775390625, -0.35546875, 0.1285400390625, 0.612548828125, 1.0965576171875, 1.58056640625, 2.0645751953125, 2.548583984375, 3.0325927734375, 3.5166015625, 4.0006103515625, 4.484619140625, 4.9686279296875, 5.45263671875, 5.9366455078125, 6.420654296875, 6.9046630859375, 7.388671875, 7.8726806640625, 8.356689453125, 8.8406982421875, 9.32470703125, 9.8087158203125, 10.292724609375, 10.7767333984375, 11.2607421875, 11.7447509765625, 12.228759765625, 12.7127685546875, 13.19677734375, 13.6807861328125, 14.164794921875, 14.6488037109375, 15.1328125]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 5.0, 6.0, 7.0, 3.0, 5.0, 8.0, 7.0, 11.0, 6.0, 25.0, 23.0, 25.0, 24.0, 34.0, 29.0, 28.0, 35.0, 36.0, 34.0, 50.0, 40.0, 34.0, 48.0, 43.0, 35.0, 33.0, 31.0, 32.0, 36.0, 25.0, 36.0, 26.0, 25.0, 22.0, 16.0, 18.0, 23.0, 18.0, 17.0, 10.0, 7.0, 7.0, 4.0, 6.0, 3.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-9.1640625, -8.865234375, -8.56640625, -8.267578125, -7.96875, -7.669921875, -7.37109375, -7.072265625, -6.7734375, -6.474609375, -6.17578125, -5.876953125, -5.578125, -5.279296875, -4.98046875, -4.681640625, -4.3828125, -4.083984375, -3.78515625, -3.486328125, -3.1875, -2.888671875, -2.58984375, -2.291015625, -1.9921875, -1.693359375, -1.39453125, -1.095703125, -0.796875, -0.498046875, -0.19921875, 0.099609375, 0.3984375, 0.697265625, 0.99609375, 1.294921875, 1.59375, 1.892578125, 2.19140625, 2.490234375, 2.7890625, 3.087890625, 3.38671875, 3.685546875, 3.984375, 4.283203125, 4.58203125, 4.880859375, 5.1796875, 5.478515625, 5.77734375, 6.076171875, 6.375, 6.673828125, 6.97265625, 7.271484375, 7.5703125, 7.869140625, 8.16796875, 8.466796875, 8.765625, 9.064453125, 9.36328125, 9.662109375, 9.9609375]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 6.0, 5.0, 9.0, 16.0, 14.0, 31.0, 38.0, 58.0, 87.0, 101.0, 158.0, 239.0, 360.0, 591.0, 1046.0, 1801.0, 3528.0, 7262.0, 15189.0, 34124.0, 77476.0, 165722.0, 262636.0, 236566.0, 131533.0, 59839.0, 25996.0, 11744.0, 5628.0, 2848.0, 1522.0, 883.0, 517.0, 326.0, 220.0, 132.0, 97.0, 51.0, 46.0, 32.0, 18.0, 17.0, 17.0, 12.0, 8.0, 2.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-20.59375, -19.985107421875, -19.37646484375, -18.767822265625, -18.1591796875, -17.550537109375, -16.94189453125, -16.333251953125, -15.724609375, -15.115966796875, -14.50732421875, -13.898681640625, -13.2900390625, -12.681396484375, -12.07275390625, -11.464111328125, -10.85546875, -10.246826171875, -9.63818359375, -9.029541015625, -8.4208984375, -7.812255859375, -7.20361328125, -6.594970703125, -5.986328125, -5.377685546875, -4.76904296875, -4.160400390625, -3.5517578125, -2.943115234375, -2.33447265625, -1.725830078125, -1.1171875, -0.508544921875, 0.10009765625, 0.708740234375, 1.3173828125, 1.926025390625, 2.53466796875, 3.143310546875, 3.751953125, 4.360595703125, 4.96923828125, 5.577880859375, 6.1865234375, 6.795166015625, 7.40380859375, 8.012451171875, 8.62109375, 9.229736328125, 9.83837890625, 10.447021484375, 11.0556640625, 11.664306640625, 12.27294921875, 12.881591796875, 13.490234375, 14.098876953125, 14.70751953125, 15.316162109375, 15.9248046875, 16.533447265625, 17.14208984375, 17.750732421875, 18.359375]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 7.0, 7.0, 11.0, 14.0, 10.0, 17.0, 17.0, 21.0, 27.0, 30.0, 31.0, 33.0, 44.0, 39.0, 52.0, 44.0, 41.0, 56.0, 46.0, 55.0, 38.0, 48.0, 44.0, 37.0, 32.0, 30.0, 29.0, 24.0, 33.0, 14.0, 22.0, 11.0, 8.0, 7.0, 7.0, 4.0, 5.0, 4.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.61328125, -5.40606689453125, -5.1988525390625, -4.99163818359375, -4.784423828125, -4.57720947265625, -4.3699951171875, -4.16278076171875, -3.95556640625, -3.74835205078125, -3.5411376953125, -3.33392333984375, -3.126708984375, -2.91949462890625, -2.7122802734375, -2.50506591796875, -2.2978515625, -2.09063720703125, -1.8834228515625, -1.67620849609375, -1.468994140625, -1.26177978515625, -1.0545654296875, -0.84735107421875, -0.64013671875, -0.43292236328125, -0.2257080078125, -0.01849365234375, 0.188720703125, 0.39593505859375, 0.6031494140625, 0.81036376953125, 1.017578125, 1.22479248046875, 1.4320068359375, 1.63922119140625, 1.846435546875, 2.05364990234375, 2.2608642578125, 2.46807861328125, 2.67529296875, 2.88250732421875, 3.0897216796875, 3.29693603515625, 3.504150390625, 3.71136474609375, 3.9185791015625, 4.12579345703125, 4.3330078125, 4.54022216796875, 4.7474365234375, 4.95465087890625, 5.161865234375, 5.36907958984375, 5.5762939453125, 5.78350830078125, 5.99072265625, 6.19793701171875, 6.4051513671875, 6.61236572265625, 6.819580078125, 7.02679443359375, 7.2340087890625, 7.44122314453125, 7.6484375]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 1.0, 6.0, 6.0, 8.0, 16.0, 21.0, 32.0, 42.0, 80.0, 105.0, 122.0, 182.0, 290.0, 483.0, 621.0, 1000.0, 1668.0, 2887.0, 5355.0, 11363.0, 27406.0, 79215.0, 232230.0, 381140.0, 194350.0, 64866.0, 23346.0, 9948.0, 4870.0, 2626.0, 1547.0, 903.0, 575.0, 421.0, 252.0, 186.0, 126.0, 81.0, 54.0, 45.0, 29.0, 16.0, 18.0, 10.0, 6.0, 5.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.2890625, -7.9752197265625, -7.661376953125, -7.3475341796875, -7.03369140625, -6.7198486328125, -6.406005859375, -6.0921630859375, -5.7783203125, -5.4644775390625, -5.150634765625, -4.8367919921875, -4.52294921875, -4.2091064453125, -3.895263671875, -3.5814208984375, -3.267578125, -2.9537353515625, -2.639892578125, -2.3260498046875, -2.01220703125, -1.6983642578125, -1.384521484375, -1.0706787109375, -0.7568359375, -0.4429931640625, -0.129150390625, 0.1846923828125, 0.49853515625, 0.8123779296875, 1.126220703125, 1.4400634765625, 1.75390625, 2.0677490234375, 2.381591796875, 2.6954345703125, 3.00927734375, 3.3231201171875, 3.636962890625, 3.9508056640625, 4.2646484375, 4.5784912109375, 4.892333984375, 5.2061767578125, 5.52001953125, 5.8338623046875, 6.147705078125, 6.4615478515625, 6.775390625, 7.0892333984375, 7.403076171875, 7.7169189453125, 8.03076171875, 8.3446044921875, 8.658447265625, 8.9722900390625, 9.2861328125, 9.5999755859375, 9.913818359375, 10.2276611328125, 10.54150390625, 10.8553466796875, 11.169189453125, 11.4830322265625, 11.796875]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 2.0, 6.0, 12.0, 13.0, 22.0, 34.0, 40.0, 51.0, 54.0, 62.0, 96.0, 109.0, 124.0, 104.0, 79.0, 56.0, 34.0, 31.0, 24.0, 14.0, 9.0, 7.0, 7.0, 2.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010318756103515625, -0.0010039210319519043, -0.0009759664535522461, -0.0009480118751525879, -0.0009200572967529297, -0.0008921027183532715, -0.0008641481399536133, -0.0008361935615539551, -0.0008082389831542969, -0.0007802844047546387, -0.0007523298263549805, -0.0007243752479553223, -0.0006964206695556641, -0.0006684660911560059, -0.0006405115127563477, -0.0006125569343566895, -0.0005846023559570312, -0.000556647777557373, -0.0005286931991577148, -0.0005007386207580566, -0.00047278404235839844, -0.00044482946395874023, -0.00041687488555908203, -0.00038892030715942383, -0.0003609657287597656, -0.0003330111503601074, -0.0003050565719604492, -0.000277101993560791, -0.0002491474151611328, -0.0002211928367614746, -0.0001932382583618164, -0.0001652836799621582, -0.0001373291015625, -0.0001093745231628418, -8.14199447631836e-05, -5.346536636352539e-05, -2.5510787963867188e-05, 2.4437904357910156e-06, 3.039836883544922e-05, 5.835294723510742e-05, 8.630752563476562e-05, 0.00011426210403442383, 0.00014221668243408203, 0.00017017126083374023, 0.00019812583923339844, 0.00022608041763305664, 0.00025403499603271484, 0.00028198957443237305, 0.00030994415283203125, 0.00033789873123168945, 0.00036585330963134766, 0.00039380788803100586, 0.00042176246643066406, 0.00044971704483032227, 0.00047767162322998047, 0.0005056262016296387, 0.0005335807800292969, 0.0005615353584289551, 0.0005894899368286133, 0.0006174445152282715, 0.0006453990936279297, 0.0006733536720275879, 0.0007013082504272461, 0.0007292628288269043, 0.0007572174072265625]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.weight": {"_type": "histogram", "values": [5.0, 2.0, 3.0, 4.0, 5.0, 10.0, 16.0, 17.0, 20.0, 27.0, 27.0, 56.0, 64.0, 66.0, 112.0, 173.0, 225.0, 351.0, 512.0, 772.0, 1192.0, 1795.0, 3057.0, 5040.0, 8829.0, 16441.0, 30709.0, 62295.0, 123674.0, 219309.0, 247141.0, 157876.0, 80147.0, 40489.0, 20792.0, 11042.0, 6151.0, 3606.0, 2221.0, 1377.0, 924.0, 604.0, 411.0, 278.0, 213.0, 146.0, 101.0, 72.0, 54.0, 38.0, 28.0, 16.0, 9.0, 6.0, 8.0, 3.0, 5.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-6.4453125, -6.2318115234375, -6.018310546875, -5.8048095703125, -5.59130859375, -5.3778076171875, -5.164306640625, -4.9508056640625, -4.7373046875, -4.5238037109375, -4.310302734375, -4.0968017578125, -3.88330078125, -3.6697998046875, -3.456298828125, -3.2427978515625, -3.029296875, -2.8157958984375, -2.602294921875, -2.3887939453125, -2.17529296875, -1.9617919921875, -1.748291015625, -1.5347900390625, -1.3212890625, -1.1077880859375, -0.894287109375, -0.6807861328125, -0.46728515625, -0.2537841796875, -0.040283203125, 0.1732177734375, 0.38671875, 0.6002197265625, 0.813720703125, 1.0272216796875, 1.24072265625, 1.4542236328125, 1.667724609375, 1.8812255859375, 2.0947265625, 2.3082275390625, 2.521728515625, 2.7352294921875, 2.94873046875, 3.1622314453125, 3.375732421875, 3.5892333984375, 3.802734375, 4.0162353515625, 4.229736328125, 4.4432373046875, 4.65673828125, 4.8702392578125, 5.083740234375, 5.2972412109375, 5.5107421875, 5.7242431640625, 5.937744140625, 6.1512451171875, 6.36474609375, 6.5782470703125, 6.791748046875, 7.0052490234375, 7.21875]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 10.0, 5.0, 9.0, 14.0, 11.0, 21.0, 35.0, 40.0, 50.0, 48.0, 74.0, 60.0, 93.0, 76.0, 72.0, 67.0, 67.0, 58.0, 41.0, 39.0, 33.0, 13.0, 15.0, 9.0, 10.0, 5.0, 7.0, 4.0, 5.0, 6.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.76171875, -1.6949462890625, -1.628173828125, -1.5614013671875, -1.49462890625, -1.4278564453125, -1.361083984375, -1.2943115234375, -1.2275390625, -1.1607666015625, -1.093994140625, -1.0272216796875, -0.96044921875, -0.8936767578125, -0.826904296875, -0.7601318359375, -0.693359375, -0.6265869140625, -0.559814453125, -0.4930419921875, -0.42626953125, -0.3594970703125, -0.292724609375, -0.2259521484375, -0.1591796875, -0.0924072265625, -0.025634765625, 0.0411376953125, 0.10791015625, 0.1746826171875, 0.241455078125, 0.3082275390625, 0.375, 0.4417724609375, 0.508544921875, 0.5753173828125, 0.64208984375, 0.7088623046875, 0.775634765625, 0.8424072265625, 0.9091796875, 0.9759521484375, 1.042724609375, 1.1094970703125, 1.17626953125, 1.2430419921875, 1.309814453125, 1.3765869140625, 1.443359375, 1.5101318359375, 1.576904296875, 1.6436767578125, 1.71044921875, 1.7772216796875, 1.843994140625, 1.9107666015625, 1.9775390625, 2.0443115234375, 2.111083984375, 2.1778564453125, 2.24462890625, 2.3114013671875, 2.378173828125, 2.4449462890625, 2.51171875]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 7.0, 17.0, 19.0, 17.0, 35.0, 42.0, 46.0, 74.0, 84.0, 84.0, 99.0, 86.0, 85.0, 67.0, 54.0, 44.0, 42.0, 23.0, 18.0, 13.0, 6.0, 8.0, 11.0, 3.0, 4.0, 4.0, 0.0, 2.0, 3.0, 2.0, 2.0], "bins": [-31.046098709106445, -30.335796356201172, -29.6254940032959, -28.915191650390625, -28.204891204833984, -27.49458885192871, -26.784286499023438, -26.073984146118164, -25.36368179321289, -24.653379440307617, -23.943077087402344, -23.232776641845703, -22.52247428894043, -21.812171936035156, -21.101869583129883, -20.39156723022461, -19.68126678466797, -18.970964431762695, -18.260662078857422, -17.55036163330078, -16.840059280395508, -16.129756927490234, -15.419454574584961, -14.709152221679688, -13.99885082244873, -13.288548469543457, -12.5782470703125, -11.867944717407227, -11.157642364501953, -10.447340965270996, -9.737038612365723, -9.026737213134766, -8.31643295288086, -7.606131076812744, -6.895829200744629, -6.1855268478393555, -5.47522497177124, -4.764923095703125, -4.054620742797852, -3.3443188667297363, -2.634016990661621, -1.9237149953842163, -1.2134130001068115, -0.5031108856201172, 0.20719099044799805, 0.9174928665161133, 1.6277952194213867, 2.338097095489502, 3.048398971557617, 3.7587008476257324, 4.469002723693848, 5.179305076599121, 5.889606952667236, 6.599908828735352, 7.310211181640625, 8.020513534545898, 8.730814933776855, 9.441117286682129, 10.151418685913086, 10.86172103881836, 11.572023391723633, 12.28232479095459, 12.992627143859863, 13.70292854309082, 14.413230895996094]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 3.0, 4.0, 2.0, 4.0, 0.0, 5.0, 3.0, 8.0, 6.0, 6.0, 17.0, 10.0, 11.0, 21.0, 10.0, 23.0, 21.0, 25.0, 27.0, 35.0, 30.0, 43.0, 44.0, 32.0, 49.0, 33.0, 46.0, 51.0, 33.0, 45.0, 34.0, 36.0, 27.0, 34.0, 27.0, 34.0, 19.0, 14.0, 20.0, 14.0, 19.0, 21.0, 16.0, 7.0, 13.0, 7.0, 6.0, 6.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-8.479201316833496, -8.194890022277832, -7.910579204559326, -7.626267910003662, -7.341957092285156, -7.057645797729492, -6.773334503173828, -6.489023208618164, -6.204712390899658, -5.920401096343994, -5.636090278625488, -5.351778984069824, -5.06746768951416, -4.783156871795654, -4.49884557723999, -4.214534759521484, -3.9302234649658203, -3.6459124088287354, -3.3616013526916504, -3.0772900581359863, -2.7929790019989014, -2.5086679458618164, -2.2243566513061523, -1.9400455951690674, -1.6557345390319824, -1.3714234828948975, -1.087112307548523, -0.8028011918067932, -0.5184900760650635, -0.23417901992797852, 0.050132155418395996, 0.3344433307647705, 0.6187534332275391, 0.9030645489692688, 1.1873756647109985, 1.471686840057373, 1.755997896194458, 2.040308952331543, 2.324620246887207, 2.608931303024292, 2.893242359161377, 3.177553415298462, 3.461864471435547, 3.746175765991211, 4.030487060546875, 4.314797878265381, 4.599109172821045, 4.883419990539551, 5.167731285095215, 5.452042579650879, 5.736353397369385, 6.020664691925049, 6.304975509643555, 6.589286804199219, 6.873598098754883, 7.157909393310547, 7.442220211029053, 7.726531505584717, 8.010842323303223, 8.295153617858887, 8.57946491241455, 8.863775253295898, 9.148086547851562, 9.432397842407227, 9.71670913696289]}, "gradients/decoder.bert.encoder.layer.11.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 7.0, 12.0, 24.0, 19.0, 43.0, 52.0, 114.0, 159.0, 220.0, 387.0, 670.0, 1053.0, 1923.0, 3327.0, 5780.0, 10622.0, 20739.0, 44174.0, 104670.0, 282464.0, 846967.0, 1550583.0, 845542.0, 278880.0, 103811.0, 44640.0, 21682.0, 11209.0, 5968.0, 3350.0, 1924.0, 1199.0, 730.0, 450.0, 280.0, 178.0, 140.0, 82.0, 63.0, 45.0, 31.0, 25.0, 13.0, 11.0, 5.0, 6.0, 4.0, 8.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-18.09375, -17.48046875, -16.8671875, -16.25390625, -15.640625, -15.02734375, -14.4140625, -13.80078125, -13.1875, -12.57421875, -11.9609375, -11.34765625, -10.734375, -10.12109375, -9.5078125, -8.89453125, -8.28125, -7.66796875, -7.0546875, -6.44140625, -5.828125, -5.21484375, -4.6015625, -3.98828125, -3.375, -2.76171875, -2.1484375, -1.53515625, -0.921875, -0.30859375, 0.3046875, 0.91796875, 1.53125, 2.14453125, 2.7578125, 3.37109375, 3.984375, 4.59765625, 5.2109375, 5.82421875, 6.4375, 7.05078125, 7.6640625, 8.27734375, 8.890625, 9.50390625, 10.1171875, 10.73046875, 11.34375, 11.95703125, 12.5703125, 13.18359375, 13.796875, 14.41015625, 15.0234375, 15.63671875, 16.25, 16.86328125, 17.4765625, 18.08984375, 18.703125, 19.31640625, 19.9296875, 20.54296875, 21.15625]}, "gradients/decoder.bert.encoder.layer.11.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 2.0, 3.0, 7.0, 7.0, 10.0, 16.0, 15.0, 22.0, 27.0, 19.0, 33.0, 34.0, 34.0, 29.0, 44.0, 47.0, 41.0, 42.0, 60.0, 32.0, 58.0, 58.0, 45.0, 31.0, 34.0, 33.0, 38.0, 30.0, 18.0, 16.0, 25.0, 18.0, 16.0, 13.0, 15.0, 1.0, 3.0, 7.0, 2.0, 0.0, 4.0, 4.0, 3.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.74609375, -7.506103515625, -7.26611328125, -7.026123046875, -6.7861328125, -6.546142578125, -6.30615234375, -6.066162109375, -5.826171875, -5.586181640625, -5.34619140625, -5.106201171875, -4.8662109375, -4.626220703125, -4.38623046875, -4.146240234375, -3.90625, -3.666259765625, -3.42626953125, -3.186279296875, -2.9462890625, -2.706298828125, -2.46630859375, -2.226318359375, -1.986328125, -1.746337890625, -1.50634765625, -1.266357421875, -1.0263671875, -0.786376953125, -0.54638671875, -0.306396484375, -0.06640625, 0.173583984375, 0.41357421875, 0.653564453125, 0.8935546875, 1.133544921875, 1.37353515625, 1.613525390625, 1.853515625, 2.093505859375, 2.33349609375, 2.573486328125, 2.8134765625, 3.053466796875, 3.29345703125, 3.533447265625, 3.7734375, 4.013427734375, 4.25341796875, 4.493408203125, 4.7333984375, 4.973388671875, 5.21337890625, 5.453369140625, 5.693359375, 5.933349609375, 6.17333984375, 6.413330078125, 6.6533203125, 6.893310546875, 7.13330078125, 7.373291015625, 7.61328125]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 10.0, 16.0, 15.0, 26.0, 38.0, 74.0, 101.0, 163.0, 244.0, 447.0, 817.0, 1252.0, 2228.0, 3961.0, 7499.0, 14258.0, 29449.0, 63394.0, 148652.0, 379294.0, 980095.0, 1395510.0, 698977.0, 266398.0, 107184.0, 47493.0, 22408.0, 11121.0, 5843.0, 3113.0, 1756.0, 955.0, 588.0, 347.0, 218.0, 123.0, 96.0, 45.0, 27.0, 22.0, 18.0, 6.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.8125, -20.187744140625, -19.56298828125, -18.938232421875, -18.3134765625, -17.688720703125, -17.06396484375, -16.439208984375, -15.814453125, -15.189697265625, -14.56494140625, -13.940185546875, -13.3154296875, -12.690673828125, -12.06591796875, -11.441162109375, -10.81640625, -10.191650390625, -9.56689453125, -8.942138671875, -8.3173828125, -7.692626953125, -7.06787109375, -6.443115234375, -5.818359375, -5.193603515625, -4.56884765625, -3.944091796875, -3.3193359375, -2.694580078125, -2.06982421875, -1.445068359375, -0.8203125, -0.195556640625, 0.42919921875, 1.053955078125, 1.6787109375, 2.303466796875, 2.92822265625, 3.552978515625, 4.177734375, 4.802490234375, 5.42724609375, 6.052001953125, 6.6767578125, 7.301513671875, 7.92626953125, 8.551025390625, 9.17578125, 9.800537109375, 10.42529296875, 11.050048828125, 11.6748046875, 12.299560546875, 12.92431640625, 13.549072265625, 14.173828125, 14.798583984375, 15.42333984375, 16.048095703125, 16.6728515625, 17.297607421875, 17.92236328125, 18.547119140625, 19.171875]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 2.0, 4.0, 4.0, 9.0, 8.0, 9.0, 17.0, 20.0, 25.0, 20.0, 34.0, 45.0, 82.0, 97.0, 117.0, 133.0, 191.0, 260.0, 277.0, 300.0, 372.0, 351.0, 325.0, 270.0, 224.0, 208.0, 163.0, 136.0, 85.0, 72.0, 46.0, 51.0, 36.0, 27.0, 25.0, 12.0, 7.0, 5.0, 5.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4296875, -5.26519775390625, -5.1007080078125, -4.93621826171875, -4.771728515625, -4.60723876953125, -4.4427490234375, -4.27825927734375, -4.11376953125, -3.94927978515625, -3.7847900390625, -3.62030029296875, -3.455810546875, -3.29132080078125, -3.1268310546875, -2.96234130859375, -2.7978515625, -2.63336181640625, -2.4688720703125, -2.30438232421875, -2.139892578125, -1.97540283203125, -1.8109130859375, -1.64642333984375, -1.48193359375, -1.31744384765625, -1.1529541015625, -0.98846435546875, -0.823974609375, -0.65948486328125, -0.4949951171875, -0.33050537109375, -0.166015625, -0.00152587890625, 0.1629638671875, 0.32745361328125, 0.491943359375, 0.65643310546875, 0.8209228515625, 0.98541259765625, 1.14990234375, 1.31439208984375, 1.4788818359375, 1.64337158203125, 1.807861328125, 1.97235107421875, 2.1368408203125, 2.30133056640625, 2.4658203125, 2.63031005859375, 2.7947998046875, 2.95928955078125, 3.123779296875, 3.28826904296875, 3.4527587890625, 3.61724853515625, 3.78173828125, 3.94622802734375, 4.1107177734375, 4.27520751953125, 4.439697265625, 4.60418701171875, 4.7686767578125, 4.93316650390625, 5.09765625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 4.0, 1.0, 7.0, 3.0, 11.0, 6.0, 21.0, 15.0, 28.0, 50.0, 52.0, 84.0, 87.0, 99.0, 93.0, 113.0, 71.0, 74.0, 49.0, 34.0, 27.0, 18.0, 16.0, 17.0, 7.0, 5.0, 4.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.92160415649414, -29.140708923339844, -28.359813690185547, -27.57891845703125, -26.798023223876953, -26.017127990722656, -25.23623275756836, -24.455337524414062, -23.674442291259766, -22.89354705810547, -22.112651824951172, -21.331756591796875, -20.550861358642578, -19.76996612548828, -18.989070892333984, -18.208175659179688, -17.42728042602539, -16.646385192871094, -15.865489959716797, -15.0845947265625, -14.303699493408203, -13.522804260253906, -12.74190902709961, -11.961013793945312, -11.180118560791016, -10.399223327636719, -9.618328094482422, -8.837432861328125, -8.056537628173828, -7.275642395019531, -6.494747161865234, -5.7138519287109375, -4.932958602905273, -4.152063369750977, -3.3711681365966797, -2.590272903442383, -1.809377670288086, -1.028482437133789, -0.2475872039794922, 0.5333080291748047, 1.3142032623291016, 2.0950984954833984, 2.8759937286376953, 3.656888961791992, 4.437784194946289, 5.218679428100586, 5.999574661254883, 6.78046989440918, 7.561365127563477, 8.342260360717773, 9.12315559387207, 9.904050827026367, 10.684946060180664, 11.465841293334961, 12.246736526489258, 13.027631759643555, 13.808526992797852, 14.589422225952148, 15.370317459106445, 16.151212692260742, 16.93210792541504, 17.713003158569336, 18.493898391723633, 19.27479362487793, 20.055688858032227]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 5.0, 8.0, 10.0, 13.0, 11.0, 14.0, 13.0, 23.0, 29.0, 27.0, 24.0, 32.0, 30.0, 51.0, 52.0, 43.0, 47.0, 58.0, 51.0, 37.0, 45.0, 50.0, 36.0, 38.0, 25.0, 40.0, 35.0, 23.0, 26.0, 29.0, 21.0, 13.0, 9.0, 4.0, 11.0, 10.0, 4.0, 1.0, 2.0, 5.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-10.636570930480957, -10.317435264587402, -9.998299598693848, -9.679163932800293, -9.360027313232422, -9.040891647338867, -8.721755981445312, -8.402620315551758, -8.083484649658203, -7.764348983764648, -7.445213317871094, -7.126077175140381, -6.806941509246826, -6.4878058433532715, -6.168669700622559, -5.849534034729004, -5.530398368835449, -5.2112627029418945, -4.89212703704834, -4.572990894317627, -4.253855228424072, -3.9347195625305176, -3.615583658218384, -3.29644775390625, -2.9773120880126953, -2.6581764221191406, -2.339040517807007, -2.019904613494873, -1.7007689476013184, -1.3816331624984741, -1.0624973773956299, -0.7433614730834961, -0.4242267608642578, -0.10509097576141357, 0.21404480934143066, 0.5331805944442749, 0.8523163795471191, 1.1714521646499634, 1.4905879497528076, 1.8097238540649414, 2.128859519958496, 2.447995185852051, 2.7671310901641846, 3.0862669944763184, 3.405402660369873, 3.7245383262634277, 4.043674468994141, 4.362810134887695, 4.68194580078125, 5.001081466674805, 5.320217132568359, 5.639353275299072, 5.958488941192627, 6.277624607086182, 6.5967607498168945, 6.915896415710449, 7.235032081604004, 7.554167747497559, 7.873303413391113, 8.192439079284668, 8.511575698852539, 8.830711364746094, 9.149847030639648, 9.468982696533203, 9.788118362426758]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 6.0, 8.0, 11.0, 12.0, 19.0, 28.0, 43.0, 56.0, 99.0, 143.0, 252.0, 406.0, 704.0, 1124.0, 2045.0, 3863.0, 7021.0, 13825.0, 27538.0, 55535.0, 110359.0, 198017.0, 248079.0, 182114.0, 97338.0, 48753.0, 24475.0, 12220.0, 6507.0, 3356.0, 1904.0, 1078.0, 635.0, 386.0, 208.0, 143.0, 90.0, 58.0, 37.0, 31.0, 12.0, 11.0, 5.0, 7.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.91796875, -6.69049072265625, -6.4630126953125, -6.23553466796875, -6.008056640625, -5.78057861328125, -5.5531005859375, -5.32562255859375, -5.09814453125, -4.87066650390625, -4.6431884765625, -4.41571044921875, -4.188232421875, -3.96075439453125, -3.7332763671875, -3.50579833984375, -3.2783203125, -3.05084228515625, -2.8233642578125, -2.59588623046875, -2.368408203125, -2.14093017578125, -1.9134521484375, -1.68597412109375, -1.45849609375, -1.23101806640625, -1.0035400390625, -0.77606201171875, -0.548583984375, -0.32110595703125, -0.0936279296875, 0.13385009765625, 0.361328125, 0.58880615234375, 0.8162841796875, 1.04376220703125, 1.271240234375, 1.49871826171875, 1.7261962890625, 1.95367431640625, 2.18115234375, 2.40863037109375, 2.6361083984375, 2.86358642578125, 3.091064453125, 3.31854248046875, 3.5460205078125, 3.77349853515625, 4.0009765625, 4.22845458984375, 4.4559326171875, 4.68341064453125, 4.910888671875, 5.13836669921875, 5.3658447265625, 5.59332275390625, 5.82080078125, 6.04827880859375, 6.2757568359375, 6.50323486328125, 6.730712890625, 6.95819091796875, 7.1856689453125, 7.41314697265625, 7.640625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 7.0, 6.0, 13.0, 3.0, 16.0, 21.0, 25.0, 19.0, 25.0, 22.0, 26.0, 55.0, 46.0, 51.0, 58.0, 55.0, 52.0, 63.0, 46.0, 54.0, 51.0, 43.0, 36.0, 35.0, 26.0, 25.0, 21.0, 25.0, 17.0, 16.0, 7.0, 11.0, 6.0, 4.0, 3.0, 2.0, 1.0, 6.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.1328125, -10.7611083984375, -10.389404296875, -10.0177001953125, -9.64599609375, -9.2742919921875, -8.902587890625, -8.5308837890625, -8.1591796875, -7.7874755859375, -7.415771484375, -7.0440673828125, -6.67236328125, -6.3006591796875, -5.928955078125, -5.5572509765625, -5.185546875, -4.8138427734375, -4.442138671875, -4.0704345703125, -3.69873046875, -3.3270263671875, -2.955322265625, -2.5836181640625, -2.2119140625, -1.8402099609375, -1.468505859375, -1.0968017578125, -0.72509765625, -0.3533935546875, 0.018310546875, 0.3900146484375, 0.76171875, 1.1334228515625, 1.505126953125, 1.8768310546875, 2.24853515625, 2.6202392578125, 2.991943359375, 3.3636474609375, 3.7353515625, 4.1070556640625, 4.478759765625, 4.8504638671875, 5.22216796875, 5.5938720703125, 5.965576171875, 6.3372802734375, 6.708984375, 7.0806884765625, 7.452392578125, 7.8240966796875, 8.19580078125, 8.5675048828125, 8.939208984375, 9.3109130859375, 9.6826171875, 10.0543212890625, 10.426025390625, 10.7977294921875, 11.16943359375, 11.5411376953125, 11.912841796875, 12.2845458984375, 12.65625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 4.0, 10.0, 7.0, 12.0, 18.0, 34.0, 35.0, 50.0, 100.0, 108.0, 125.0, 213.0, 287.0, 378.0, 546.0, 793.0, 1089.0, 1563.0, 2230.0, 3284.0, 5009.0, 7914.0, 12558.0, 20082.0, 33487.0, 56356.0, 94729.0, 150515.0, 198292.0, 172163.0, 112091.0, 67612.0, 40598.0, 24006.0, 14575.0, 9110.0, 5988.0, 3939.0, 2624.0, 1723.0, 1237.0, 869.0, 643.0, 435.0, 314.0, 215.0, 195.0, 125.0, 89.0, 62.0, 42.0, 28.0, 21.0, 13.0, 8.0, 6.0, 2.0, 5.0, 3.0, 2.0], "bins": [-6.42578125, -6.2291259765625, -6.032470703125, -5.8358154296875, -5.63916015625, -5.4425048828125, -5.245849609375, -5.0491943359375, -4.8525390625, -4.6558837890625, -4.459228515625, -4.2625732421875, -4.06591796875, -3.8692626953125, -3.672607421875, -3.4759521484375, -3.279296875, -3.0826416015625, -2.885986328125, -2.6893310546875, -2.49267578125, -2.2960205078125, -2.099365234375, -1.9027099609375, -1.7060546875, -1.5093994140625, -1.312744140625, -1.1160888671875, -0.91943359375, -0.7227783203125, -0.526123046875, -0.3294677734375, -0.1328125, 0.0638427734375, 0.260498046875, 0.4571533203125, 0.65380859375, 0.8504638671875, 1.047119140625, 1.2437744140625, 1.4404296875, 1.6370849609375, 1.833740234375, 2.0303955078125, 2.22705078125, 2.4237060546875, 2.620361328125, 2.8170166015625, 3.013671875, 3.2103271484375, 3.406982421875, 3.6036376953125, 3.80029296875, 3.9969482421875, 4.193603515625, 4.3902587890625, 4.5869140625, 4.7835693359375, 4.980224609375, 5.1768798828125, 5.37353515625, 5.5701904296875, 5.766845703125, 5.9635009765625, 6.16015625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 5.0, 3.0, 6.0, 6.0, 9.0, 4.0, 12.0, 6.0, 10.0, 14.0, 19.0, 20.0, 28.0, 21.0, 20.0, 26.0, 30.0, 29.0, 25.0, 35.0, 33.0, 42.0, 37.0, 36.0, 31.0, 39.0, 44.0, 42.0, 41.0, 29.0, 34.0, 36.0, 32.0, 25.0, 30.0, 22.0, 18.0, 16.0, 19.0, 12.0, 13.0, 5.0, 7.0, 6.0, 7.0, 12.0, 6.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.8046875, -4.6480712890625, -4.491455078125, -4.3348388671875, -4.17822265625, -4.0216064453125, -3.864990234375, -3.7083740234375, -3.5517578125, -3.3951416015625, -3.238525390625, -3.0819091796875, -2.92529296875, -2.7686767578125, -2.612060546875, -2.4554443359375, -2.298828125, -2.1422119140625, -1.985595703125, -1.8289794921875, -1.67236328125, -1.5157470703125, -1.359130859375, -1.2025146484375, -1.0458984375, -0.8892822265625, -0.732666015625, -0.5760498046875, -0.41943359375, -0.2628173828125, -0.106201171875, 0.0504150390625, 0.20703125, 0.3636474609375, 0.520263671875, 0.6768798828125, 0.83349609375, 0.9901123046875, 1.146728515625, 1.3033447265625, 1.4599609375, 1.6165771484375, 1.773193359375, 1.9298095703125, 2.08642578125, 2.2430419921875, 2.399658203125, 2.5562744140625, 2.712890625, 2.8695068359375, 3.026123046875, 3.1827392578125, 3.33935546875, 3.4959716796875, 3.652587890625, 3.8092041015625, 3.9658203125, 4.1224365234375, 4.279052734375, 4.4356689453125, 4.59228515625, 4.7489013671875, 4.905517578125, 5.0621337890625, 5.21875]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 7.0, 5.0, 9.0, 10.0, 21.0, 36.0, 43.0, 65.0, 99.0, 158.0, 225.0, 344.0, 534.0, 861.0, 1354.0, 2160.0, 3801.0, 6597.0, 11866.0, 22169.0, 41866.0, 82045.0, 158307.0, 253006.0, 215267.0, 117992.0, 60035.0, 31234.0, 16367.0, 9066.0, 5129.0, 3065.0, 1776.0, 1066.0, 688.0, 421.0, 290.0, 198.0, 111.0, 76.0, 64.0, 33.0, 25.0, 27.0, 12.0, 7.0, 4.0, 6.0, 5.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-2.697265625, -2.614959716796875, -2.53265380859375, -2.450347900390625, -2.3680419921875, -2.285736083984375, -2.20343017578125, -2.121124267578125, -2.038818359375, -1.956512451171875, -1.87420654296875, -1.791900634765625, -1.7095947265625, -1.627288818359375, -1.54498291015625, -1.462677001953125, -1.38037109375, -1.298065185546875, -1.21575927734375, -1.133453369140625, -1.0511474609375, -0.968841552734375, -0.88653564453125, -0.804229736328125, -0.721923828125, -0.639617919921875, -0.55731201171875, -0.475006103515625, -0.3927001953125, -0.310394287109375, -0.22808837890625, -0.145782470703125, -0.0634765625, 0.018829345703125, 0.10113525390625, 0.183441162109375, 0.2657470703125, 0.348052978515625, 0.43035888671875, 0.512664794921875, 0.594970703125, 0.677276611328125, 0.75958251953125, 0.841888427734375, 0.9241943359375, 1.006500244140625, 1.08880615234375, 1.171112060546875, 1.25341796875, 1.335723876953125, 1.41802978515625, 1.500335693359375, 1.5826416015625, 1.664947509765625, 1.74725341796875, 1.829559326171875, 1.911865234375, 1.994171142578125, 2.07647705078125, 2.158782958984375, 2.2410888671875, 2.323394775390625, 2.40570068359375, 2.488006591796875, 2.5703125]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 2.0, 7.0, 9.0, 9.0, 6.0, 8.0, 19.0, 14.0, 25.0, 22.0, 34.0, 55.0, 44.0, 51.0, 60.0, 81.0, 59.0, 70.0, 52.0, 54.0, 53.0, 44.0, 37.0, 29.0, 30.0, 27.0, 19.0, 11.0, 14.0, 11.0, 17.0, 7.0, 4.0, 6.0, 1.0, 3.0, 1.0, 5.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0002396106719970703, -0.00023347511887550354, -0.00022733956575393677, -0.00022120401263237, -0.00021506845951080322, -0.00020893290638923645, -0.00020279735326766968, -0.0001966618001461029, -0.00019052624702453613, -0.00018439069390296936, -0.0001782551407814026, -0.00017211958765983582, -0.00016598403453826904, -0.00015984848141670227, -0.0001537129282951355, -0.00014757737517356873, -0.00014144182205200195, -0.00013530626893043518, -0.0001291707158088684, -0.00012303516268730164, -0.00011689960956573486, -0.00011076405644416809, -0.00010462850332260132, -9.849295020103455e-05, -9.235739707946777e-05, -8.6221843957901e-05, -8.008629083633423e-05, -7.395073771476746e-05, -6.781518459320068e-05, -6.167963147163391e-05, -5.554407835006714e-05, -4.9408525228500366e-05, -4.3272972106933594e-05, -3.713741898536682e-05, -3.100186586380005e-05, -2.4866312742233276e-05, -1.8730759620666504e-05, -1.2595206499099731e-05, -6.459653377532959e-06, -3.241002559661865e-07, 5.811452865600586e-06, 1.1947005987167358e-05, 1.808255910873413e-05, 2.4218112230300903e-05, 3.0353665351867676e-05, 3.648921847343445e-05, 4.262477159500122e-05, 4.876032471656799e-05, 5.4895877838134766e-05, 6.103143095970154e-05, 6.716698408126831e-05, 7.330253720283508e-05, 7.943809032440186e-05, 8.557364344596863e-05, 9.17091965675354e-05, 9.784474968910217e-05, 0.00010398030281066895, 0.00011011585593223572, 0.00011625140905380249, 0.00012238696217536926, 0.00012852251529693604, 0.0001346580684185028, 0.00014079362154006958, 0.00014692917466163635, 0.00015306472778320312]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 7.0, 7.0, 10.0, 22.0, 18.0, 41.0, 55.0, 93.0, 112.0, 171.0, 283.0, 422.0, 627.0, 990.0, 1476.0, 2314.0, 3856.0, 6311.0, 10955.0, 18810.0, 32914.0, 57295.0, 97763.0, 153220.0, 191815.0, 174302.0, 121283.0, 72621.0, 42126.0, 23791.0, 13790.0, 8046.0, 4851.0, 2862.0, 1903.0, 1128.0, 783.0, 510.0, 342.0, 192.0, 152.0, 98.0, 71.0, 33.0, 36.0, 24.0, 12.0, 8.0, 5.0, 7.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.15234375, -2.082275390625, -2.01220703125, -1.942138671875, -1.8720703125, -1.802001953125, -1.73193359375, -1.661865234375, -1.591796875, -1.521728515625, -1.45166015625, -1.381591796875, -1.3115234375, -1.241455078125, -1.17138671875, -1.101318359375, -1.03125, -0.961181640625, -0.89111328125, -0.821044921875, -0.7509765625, -0.680908203125, -0.61083984375, -0.540771484375, -0.470703125, -0.400634765625, -0.33056640625, -0.260498046875, -0.1904296875, -0.120361328125, -0.05029296875, 0.019775390625, 0.08984375, 0.159912109375, 0.22998046875, 0.300048828125, 0.3701171875, 0.440185546875, 0.51025390625, 0.580322265625, 0.650390625, 0.720458984375, 0.79052734375, 0.860595703125, 0.9306640625, 1.000732421875, 1.07080078125, 1.140869140625, 1.2109375, 1.281005859375, 1.35107421875, 1.421142578125, 1.4912109375, 1.561279296875, 1.63134765625, 1.701416015625, 1.771484375, 1.841552734375, 1.91162109375, 1.981689453125, 2.0517578125, 2.121826171875, 2.19189453125, 2.261962890625, 2.33203125]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 5.0, 7.0, 8.0, 5.0, 12.0, 9.0, 16.0, 12.0, 26.0, 20.0, 26.0, 33.0, 29.0, 39.0, 36.0, 26.0, 49.0, 41.0, 53.0, 44.0, 42.0, 50.0, 44.0, 47.0, 40.0, 41.0, 36.0, 32.0, 25.0, 27.0, 18.0, 13.0, 12.0, 14.0, 12.0, 7.0, 11.0, 9.0, 6.0, 3.0, 3.0, 2.0, 1.0, 2.0, 3.0, 4.0, 0.0, 1.0, 3.0, 2.0], "bins": [-0.58349609375, -0.5662384033203125, -0.548980712890625, -0.5317230224609375, -0.51446533203125, -0.4972076416015625, -0.479949951171875, -0.4626922607421875, -0.4454345703125, -0.4281768798828125, -0.410919189453125, -0.3936614990234375, -0.37640380859375, -0.3591461181640625, -0.341888427734375, -0.3246307373046875, -0.307373046875, -0.2901153564453125, -0.272857666015625, -0.2555999755859375, -0.23834228515625, -0.2210845947265625, -0.203826904296875, -0.1865692138671875, -0.1693115234375, -0.1520538330078125, -0.134796142578125, -0.1175384521484375, -0.10028076171875, -0.0830230712890625, -0.065765380859375, -0.0485076904296875, -0.03125, -0.0139923095703125, 0.003265380859375, 0.0205230712890625, 0.03778076171875, 0.0550384521484375, 0.072296142578125, 0.0895538330078125, 0.1068115234375, 0.1240692138671875, 0.141326904296875, 0.1585845947265625, 0.17584228515625, 0.1930999755859375, 0.210357666015625, 0.2276153564453125, 0.244873046875, 0.2621307373046875, 0.279388427734375, 0.2966461181640625, 0.31390380859375, 0.3311614990234375, 0.348419189453125, 0.3656768798828125, 0.3829345703125, 0.4001922607421875, 0.417449951171875, 0.4347076416015625, 0.45196533203125, 0.4692230224609375, 0.486480712890625, 0.5037384033203125, 0.52099609375]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 5.0, 1.0, 5.0, 8.0, 9.0, 9.0, 17.0, 22.0, 33.0, 46.0, 49.0, 96.0, 87.0, 92.0, 111.0, 91.0, 80.0, 66.0, 48.0, 32.0, 28.0, 20.0, 11.0, 11.0, 11.0, 3.0, 2.0, 5.0, 2.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.20969581604004, -28.44330406188965, -27.676910400390625, -26.910518646240234, -26.144126892089844, -25.37773323059082, -24.61134147644043, -23.844947814941406, -23.078556060791016, -22.312164306640625, -21.5457706451416, -20.77937889099121, -20.012985229492188, -19.246593475341797, -18.480201721191406, -17.713809967041016, -16.947416305541992, -16.1810245513916, -15.414630889892578, -14.648239135742188, -13.88184642791748, -13.115453720092773, -12.349061965942383, -11.582669258117676, -10.816276550292969, -10.049883842468262, -9.283491134643555, -8.517099380493164, -7.750706672668457, -6.98431396484375, -6.217921733856201, -5.451529502868652, -4.685136795043945, -3.9187443256378174, -3.1523518562316895, -2.3859593868255615, -1.6195669174194336, -0.8531744480133057, -0.08678197860717773, 0.6796102523803711, 1.4460029602050781, 2.212395429611206, 2.978787899017334, 3.745180368423462, 4.51157283782959, 5.277965545654297, 6.044357776641846, 6.8107500076293945, 7.577142715454102, 8.343535423278809, 9.109928131103516, 9.876319885253906, 10.642712593078613, 11.40910530090332, 12.175497055053711, 12.941889762878418, 13.708282470703125, 14.474675178527832, 15.241067886352539, 16.00745964050293, 16.773853302001953, 17.540245056152344, 18.306636810302734, 19.073028564453125, 19.83942222595215]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 6.0, 9.0, 9.0, 14.0, 8.0, 17.0, 15.0, 26.0, 27.0, 25.0, 25.0, 34.0, 39.0, 44.0, 56.0, 46.0, 52.0, 55.0, 44.0, 40.0, 57.0, 34.0, 45.0, 31.0, 40.0, 30.0, 30.0, 26.0, 28.0, 23.0, 21.0, 5.0, 13.0, 6.0, 13.0, 2.0, 3.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-10.59731388092041, -10.278158187866211, -9.959001541137695, -9.639845848083496, -9.320690155029297, -9.001534461975098, -8.682378768920898, -8.363222122192383, -8.044066429138184, -7.724910736083984, -7.405754566192627, -7.0865983963012695, -6.76744270324707, -6.448287010192871, -6.129130840301514, -5.809974670410156, -5.490818977355957, -5.171663284301758, -4.8525071144104, -4.533350944519043, -4.214195251464844, -3.8950393199920654, -3.575883388519287, -3.256727457046509, -2.9375715255737305, -2.618415594100952, -2.299259662628174, -1.9801037311553955, -1.6609477996826172, -1.3417918682098389, -1.0226359367370605, -0.7034800052642822, -0.3843231201171875, -0.06516718864440918, 0.25398874282836914, 0.5731446743011475, 0.8923006057739258, 1.211456537246704, 1.5306124687194824, 1.8497684001922607, 2.168924331665039, 2.4880802631378174, 2.8072361946105957, 3.126392126083374, 3.4455480575561523, 3.7647039890289307, 4.083859920501709, 4.403016090393066, 4.722171783447266, 5.041327476501465, 5.360483646392822, 5.67963981628418, 5.998795509338379, 6.317951202392578, 6.6371073722839355, 6.956263542175293, 7.275419235229492, 7.594574928283691, 7.913731098175049, 8.232887268066406, 8.552042961120605, 8.871198654174805, 9.19035530090332, 9.50951099395752, 9.828666687011719]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 2.0, 4.0, 4.0, 8.0, 11.0, 12.0, 24.0, 42.0, 58.0, 82.0, 143.0, 186.0, 313.0, 492.0, 808.0, 1279.0, 2214.0, 3587.0, 5819.0, 9926.0, 17075.0, 28856.0, 50085.0, 84116.0, 131007.0, 173593.0, 177320.0, 139069.0, 90285.0, 54760.0, 32108.0, 18317.0, 10717.0, 6291.0, 3804.0, 2268.0, 1408.0, 952.0, 565.0, 317.0, 228.0, 137.0, 97.0, 59.0, 42.0, 28.0, 17.0, 13.0, 9.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.578125, -10.21435546875, -9.8505859375, -9.48681640625, -9.123046875, -8.75927734375, -8.3955078125, -8.03173828125, -7.66796875, -7.30419921875, -6.9404296875, -6.57666015625, -6.212890625, -5.84912109375, -5.4853515625, -5.12158203125, -4.7578125, -4.39404296875, -4.0302734375, -3.66650390625, -3.302734375, -2.93896484375, -2.5751953125, -2.21142578125, -1.84765625, -1.48388671875, -1.1201171875, -0.75634765625, -0.392578125, -0.02880859375, 0.3349609375, 0.69873046875, 1.0625, 1.42626953125, 1.7900390625, 2.15380859375, 2.517578125, 2.88134765625, 3.2451171875, 3.60888671875, 3.97265625, 4.33642578125, 4.7001953125, 5.06396484375, 5.427734375, 5.79150390625, 6.1552734375, 6.51904296875, 6.8828125, 7.24658203125, 7.6103515625, 7.97412109375, 8.337890625, 8.70166015625, 9.0654296875, 9.42919921875, 9.79296875, 10.15673828125, 10.5205078125, 10.88427734375, 11.248046875, 11.61181640625, 11.9755859375, 12.33935546875, 12.703125]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 1.0, 2.0, 6.0, 5.0, 9.0, 17.0, 13.0, 20.0, 14.0, 23.0, 26.0, 18.0, 35.0, 40.0, 41.0, 41.0, 51.0, 39.0, 49.0, 48.0, 41.0, 38.0, 39.0, 33.0, 34.0, 38.0, 34.0, 34.0, 34.0, 23.0, 25.0, 13.0, 18.0, 15.0, 20.0, 15.0, 11.0, 8.0, 9.0, 4.0, 4.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-9.5859375, -9.2713623046875, -8.956787109375, -8.6422119140625, -8.32763671875, -8.0130615234375, -7.698486328125, -7.3839111328125, -7.0693359375, -6.7547607421875, -6.440185546875, -6.1256103515625, -5.81103515625, -5.4964599609375, -5.181884765625, -4.8673095703125, -4.552734375, -4.2381591796875, -3.923583984375, -3.6090087890625, -3.29443359375, -2.9798583984375, -2.665283203125, -2.3507080078125, -2.0361328125, -1.7215576171875, -1.406982421875, -1.0924072265625, -0.77783203125, -0.4632568359375, -0.148681640625, 0.1658935546875, 0.48046875, 0.7950439453125, 1.109619140625, 1.4241943359375, 1.73876953125, 2.0533447265625, 2.367919921875, 2.6824951171875, 2.9970703125, 3.3116455078125, 3.626220703125, 3.9407958984375, 4.25537109375, 4.5699462890625, 4.884521484375, 5.1990966796875, 5.513671875, 5.8282470703125, 6.142822265625, 6.4573974609375, 6.77197265625, 7.0865478515625, 7.401123046875, 7.7156982421875, 8.0302734375, 8.3448486328125, 8.659423828125, 8.9739990234375, 9.28857421875, 9.6031494140625, 9.917724609375, 10.2322998046875, 10.546875]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 8.0, 6.0, 13.0, 19.0, 36.0, 37.0, 79.0, 80.0, 138.0, 235.0, 345.0, 515.0, 892.0, 1378.0, 2393.0, 3931.0, 6619.0, 11244.0, 20420.0, 37016.0, 64431.0, 108105.0, 158392.0, 186891.0, 166467.0, 115884.0, 70571.0, 39905.0, 21932.0, 12500.0, 7260.0, 4162.0, 2444.0, 1545.0, 943.0, 596.0, 379.0, 267.0, 158.0, 92.0, 78.0, 57.0, 35.0, 19.0, 13.0, 9.0, 8.0, 7.0, 3.0, 4.0, 1.0, 1.0, 1.0], "bins": [-13.421875, -13.03369140625, -12.6455078125, -12.25732421875, -11.869140625, -11.48095703125, -11.0927734375, -10.70458984375, -10.31640625, -9.92822265625, -9.5400390625, -9.15185546875, -8.763671875, -8.37548828125, -7.9873046875, -7.59912109375, -7.2109375, -6.82275390625, -6.4345703125, -6.04638671875, -5.658203125, -5.27001953125, -4.8818359375, -4.49365234375, -4.10546875, -3.71728515625, -3.3291015625, -2.94091796875, -2.552734375, -2.16455078125, -1.7763671875, -1.38818359375, -1.0, -0.61181640625, -0.2236328125, 0.16455078125, 0.552734375, 0.94091796875, 1.3291015625, 1.71728515625, 2.10546875, 2.49365234375, 2.8818359375, 3.27001953125, 3.658203125, 4.04638671875, 4.4345703125, 4.82275390625, 5.2109375, 5.59912109375, 5.9873046875, 6.37548828125, 6.763671875, 7.15185546875, 7.5400390625, 7.92822265625, 8.31640625, 8.70458984375, 9.0927734375, 9.48095703125, 9.869140625, 10.25732421875, 10.6455078125, 11.03369140625, 11.421875]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 4.0, 3.0, 7.0, 6.0, 7.0, 8.0, 15.0, 11.0, 10.0, 16.0, 18.0, 18.0, 17.0, 31.0, 26.0, 51.0, 31.0, 30.0, 40.0, 41.0, 26.0, 46.0, 35.0, 39.0, 43.0, 41.0, 42.0, 43.0, 28.0, 43.0, 30.0, 32.0, 33.0, 23.0, 19.0, 12.0, 16.0, 11.0, 10.0, 9.0, 9.0, 8.0, 9.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.796875, -5.62530517578125, -5.4537353515625, -5.28216552734375, -5.110595703125, -4.93902587890625, -4.7674560546875, -4.59588623046875, -4.42431640625, -4.25274658203125, -4.0811767578125, -3.90960693359375, -3.738037109375, -3.56646728515625, -3.3948974609375, -3.22332763671875, -3.0517578125, -2.88018798828125, -2.7086181640625, -2.53704833984375, -2.365478515625, -2.19390869140625, -2.0223388671875, -1.85076904296875, -1.67919921875, -1.50762939453125, -1.3360595703125, -1.16448974609375, -0.992919921875, -0.82135009765625, -0.6497802734375, -0.47821044921875, -0.306640625, -0.13507080078125, 0.0364990234375, 0.20806884765625, 0.379638671875, 0.55120849609375, 0.7227783203125, 0.89434814453125, 1.06591796875, 1.23748779296875, 1.4090576171875, 1.58062744140625, 1.752197265625, 1.92376708984375, 2.0953369140625, 2.26690673828125, 2.4384765625, 2.61004638671875, 2.7816162109375, 2.95318603515625, 3.124755859375, 3.29632568359375, 3.4678955078125, 3.63946533203125, 3.81103515625, 3.98260498046875, 4.1541748046875, 4.32574462890625, 4.497314453125, 4.66888427734375, 4.8404541015625, 5.01202392578125, 5.18359375]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 4.0, 5.0, 12.0, 9.0, 27.0, 42.0, 65.0, 74.0, 127.0, 179.0, 277.0, 409.0, 641.0, 927.0, 1480.0, 2371.0, 3925.0, 6438.0, 10634.0, 17975.0, 31224.0, 54709.0, 92261.0, 146311.0, 189532.0, 178464.0, 125698.0, 76640.0, 44830.0, 25504.0, 15000.0, 8732.0, 5320.0, 3159.0, 2003.0, 1232.0, 844.0, 474.0, 338.0, 214.0, 137.0, 85.0, 78.0, 41.0, 40.0, 21.0, 12.0, 11.0, 8.0, 3.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0], "bins": [-4.47265625, -4.33636474609375, -4.2000732421875, -4.06378173828125, -3.927490234375, -3.79119873046875, -3.6549072265625, -3.51861572265625, -3.38232421875, -3.24603271484375, -3.1097412109375, -2.97344970703125, -2.837158203125, -2.70086669921875, -2.5645751953125, -2.42828369140625, -2.2919921875, -2.15570068359375, -2.0194091796875, -1.88311767578125, -1.746826171875, -1.61053466796875, -1.4742431640625, -1.33795166015625, -1.20166015625, -1.06536865234375, -0.9290771484375, -0.79278564453125, -0.656494140625, -0.52020263671875, -0.3839111328125, -0.24761962890625, -0.111328125, 0.02496337890625, 0.1612548828125, 0.29754638671875, 0.433837890625, 0.57012939453125, 0.7064208984375, 0.84271240234375, 0.97900390625, 1.11529541015625, 1.2515869140625, 1.38787841796875, 1.524169921875, 1.66046142578125, 1.7967529296875, 1.93304443359375, 2.0693359375, 2.20562744140625, 2.3419189453125, 2.47821044921875, 2.614501953125, 2.75079345703125, 2.8870849609375, 3.02337646484375, 3.15966796875, 3.29595947265625, 3.4322509765625, 3.56854248046875, 3.704833984375, 3.84112548828125, 3.9774169921875, 4.11370849609375, 4.25]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 2.0, 0.0, 0.0, 5.0, 6.0, 6.0, 9.0, 6.0, 8.0, 11.0, 14.0, 18.0, 17.0, 17.0, 31.0, 36.0, 27.0, 40.0, 58.0, 44.0, 62.0, 44.0, 50.0, 63.0, 56.0, 66.0, 44.0, 42.0, 32.0, 39.0, 34.0, 30.0, 21.0, 12.0, 13.0, 14.0, 11.0, 4.0, 3.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00038814544677734375, -0.000374622642993927, -0.00036109983921051025, -0.0003475770354270935, -0.00033405423164367676, -0.00032053142786026, -0.00030700862407684326, -0.0002934858202934265, -0.00027996301651000977, -0.000266440212726593, -0.00025291740894317627, -0.00023939460515975952, -0.00022587180137634277, -0.00021234899759292603, -0.00019882619380950928, -0.00018530339002609253, -0.00017178058624267578, -0.00015825778245925903, -0.00014473497867584229, -0.00013121217489242554, -0.00011768937110900879, -0.00010416656732559204, -9.064376354217529e-05, -7.712095975875854e-05, -6.35981559753418e-05, -5.007535219192505e-05, -3.65525484085083e-05, -2.3029744625091553e-05, -9.506940841674805e-06, 4.015862941741943e-06, 1.753866672515869e-05, 3.106147050857544e-05, 4.458427429199219e-05, 5.8107078075408936e-05, 7.162988185882568e-05, 8.515268564224243e-05, 9.867548942565918e-05, 0.00011219829320907593, 0.00012572109699249268, 0.00013924390077590942, 0.00015276670455932617, 0.00016628950834274292, 0.00017981231212615967, 0.00019333511590957642, 0.00020685791969299316, 0.0002203807234764099, 0.00023390352725982666, 0.0002474263310432434, 0.00026094913482666016, 0.0002744719386100769, 0.00028799474239349365, 0.0003015175461769104, 0.00031504034996032715, 0.0003285631537437439, 0.00034208595752716064, 0.0003556087613105774, 0.00036913156509399414, 0.0003826543688774109, 0.00039617717266082764, 0.0004096999764442444, 0.00042322278022766113, 0.0004367455840110779, 0.00045026838779449463, 0.0004637911915779114, 0.0004773139953613281]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 4.0, 2.0, 8.0, 11.0, 18.0, 15.0, 32.0, 33.0, 50.0, 73.0, 106.0, 216.0, 288.0, 439.0, 693.0, 1085.0, 1716.0, 2744.0, 4262.0, 7263.0, 12056.0, 20013.0, 33542.0, 56154.0, 91997.0, 141120.0, 181245.0, 171559.0, 124038.0, 78497.0, 47707.0, 28031.0, 16813.0, 10306.0, 6131.0, 3761.0, 2362.0, 1494.0, 913.0, 608.0, 392.0, 258.0, 145.0, 101.0, 77.0, 52.0, 47.0, 37.0, 15.0, 14.0, 10.0, 7.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.296875, -4.15753173828125, -4.0181884765625, -3.87884521484375, -3.739501953125, -3.60015869140625, -3.4608154296875, -3.32147216796875, -3.18212890625, -3.04278564453125, -2.9034423828125, -2.76409912109375, -2.624755859375, -2.48541259765625, -2.3460693359375, -2.20672607421875, -2.0673828125, -1.92803955078125, -1.7886962890625, -1.64935302734375, -1.510009765625, -1.37066650390625, -1.2313232421875, -1.09197998046875, -0.95263671875, -0.81329345703125, -0.6739501953125, -0.53460693359375, -0.395263671875, -0.25592041015625, -0.1165771484375, 0.02276611328125, 0.162109375, 0.30145263671875, 0.4407958984375, 0.58013916015625, 0.719482421875, 0.85882568359375, 0.9981689453125, 1.13751220703125, 1.27685546875, 1.41619873046875, 1.5555419921875, 1.69488525390625, 1.834228515625, 1.97357177734375, 2.1129150390625, 2.25225830078125, 2.3916015625, 2.53094482421875, 2.6702880859375, 2.80963134765625, 2.948974609375, 3.08831787109375, 3.2276611328125, 3.36700439453125, 3.50634765625, 3.64569091796875, 3.7850341796875, 3.92437744140625, 4.063720703125, 4.20306396484375, 4.3424072265625, 4.48175048828125, 4.62109375]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 5.0, 4.0, 6.0, 5.0, 9.0, 20.0, 16.0, 25.0, 20.0, 31.0, 28.0, 30.0, 36.0, 43.0, 40.0, 44.0, 57.0, 54.0, 52.0, 59.0, 44.0, 54.0, 42.0, 42.0, 41.0, 34.0, 33.0, 30.0, 18.0, 13.0, 18.0, 11.0, 13.0, 10.0, 3.0, 3.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.3525390625, -1.3134613037109375, -1.274383544921875, -1.2353057861328125, -1.19622802734375, -1.1571502685546875, -1.118072509765625, -1.0789947509765625, -1.0399169921875, -1.0008392333984375, -0.961761474609375, -0.9226837158203125, -0.88360595703125, -0.8445281982421875, -0.805450439453125, -0.7663726806640625, -0.727294921875, -0.6882171630859375, -0.649139404296875, -0.6100616455078125, -0.57098388671875, -0.5319061279296875, -0.492828369140625, -0.4537506103515625, -0.4146728515625, -0.3755950927734375, -0.336517333984375, -0.2974395751953125, -0.25836181640625, -0.2192840576171875, -0.180206298828125, -0.1411285400390625, -0.10205078125, -0.0629730224609375, -0.023895263671875, 0.0151824951171875, 0.05426025390625, 0.0933380126953125, 0.132415771484375, 0.1714935302734375, 0.2105712890625, 0.2496490478515625, 0.288726806640625, 0.3278045654296875, 0.36688232421875, 0.4059600830078125, 0.445037841796875, 0.4841156005859375, 0.523193359375, 0.5622711181640625, 0.601348876953125, 0.6404266357421875, 0.67950439453125, 0.7185821533203125, 0.757659912109375, 0.7967376708984375, 0.8358154296875, 0.8748931884765625, 0.913970947265625, 0.9530487060546875, 0.99212646484375, 1.0312042236328125, 1.070281982421875, 1.1093597412109375, 1.1484375]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 4.0, 8.0, 7.0, 17.0, 12.0, 14.0, 24.0, 37.0, 63.0, 71.0, 91.0, 109.0, 100.0, 97.0, 98.0, 66.0, 46.0, 38.0, 21.0, 19.0, 15.0, 13.0, 9.0, 8.0, 6.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-28.74650001525879, -27.978233337402344, -27.2099666595459, -26.441699981689453, -25.673431396484375, -24.90516471862793, -24.136898040771484, -23.36863136291504, -22.600364685058594, -21.83209800720215, -21.063831329345703, -20.295562744140625, -19.52729606628418, -18.759029388427734, -17.99076271057129, -17.222496032714844, -16.454227447509766, -15.68596076965332, -14.917693138122559, -14.149426460266113, -13.381158828735352, -12.612892150878906, -11.844625473022461, -11.076358795166016, -10.308091163635254, -9.539824485778809, -8.771556854248047, -8.003290176391602, -7.235023021697998, -6.4667558670043945, -5.698489189147949, -4.930222034454346, -4.161952972412109, -3.393685817718506, -2.6254189014434814, -1.857151985168457, -1.0888848304748535, -0.32061767578125, 0.4476490020751953, 1.2159161567687988, 1.9841833114624023, 2.752450466156006, 3.5207173824310303, 4.288984298706055, 5.057251453399658, 5.825518608093262, 6.593785285949707, 7.3620524406433105, 8.130319595336914, 8.89858627319336, 9.666853904724121, 10.435120582580566, 11.203388214111328, 11.971654891967773, 12.739921569824219, 13.508188247680664, 14.276455879211426, 15.044722557067871, 15.812990188598633, 16.581256866455078, 17.349523544311523, 18.11779022216797, 18.886058807373047, 19.654325485229492, 20.422592163085938]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 2.0, 0.0, 2.0, 3.0, 8.0, 7.0, 10.0, 8.0, 11.0, 4.0, 16.0, 15.0, 26.0, 29.0, 36.0, 22.0, 43.0, 44.0, 44.0, 44.0, 37.0, 37.0, 46.0, 53.0, 47.0, 39.0, 41.0, 50.0, 32.0, 39.0, 33.0, 33.0, 21.0, 23.0, 27.0, 16.0, 10.0, 8.0, 15.0, 6.0, 8.0, 5.0, 4.0, 0.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-10.555373191833496, -10.253592491149902, -9.951812744140625, -9.650032043457031, -9.348251342773438, -9.04647159576416, -8.744690895080566, -8.442911148071289, -8.141130447387695, -7.83935022354126, -7.537569999694824, -7.2357892990112305, -6.934009075164795, -6.632228851318359, -6.330448150634766, -6.02866792678833, -5.7268877029418945, -5.425107479095459, -5.123327255249023, -4.82154655456543, -4.519766330718994, -4.217986106872559, -3.916205644607544, -3.6144251823425293, -3.3126449584960938, -3.010864734649658, -2.7090842723846436, -2.407303810119629, -2.1055235862731934, -1.8037432432174683, -1.5019629001617432, -1.2001824378967285, -0.8984012603759766, -0.5966209173202515, -0.29484057426452637, 0.0069397687911987305, 0.30872011184692383, 0.6105004549026489, 0.912280797958374, 1.2140612602233887, 1.5158414840698242, 1.8176218271255493, 2.1194021701812744, 2.421182632446289, 2.7229628562927246, 3.02474308013916, 3.326523542404175, 3.6283040046691895, 3.930084228515625, 4.2318644523620605, 4.533644676208496, 4.83542537689209, 5.137205600738525, 5.438985824584961, 5.740766525268555, 6.04254674911499, 6.344326972961426, 6.646107196807861, 6.947887420654297, 7.249668121337891, 7.551448345184326, 7.853228569030762, 8.155009269714355, 8.456789016723633, 8.758569717407227]}, "gradients/decoder.bert.encoder.layer.10.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 10.0, 13.0, 16.0, 19.0, 39.0, 60.0, 89.0, 120.0, 208.0, 321.0, 535.0, 769.0, 1321.0, 2223.0, 3808.0, 6954.0, 13364.0, 26885.0, 59025.0, 140947.0, 387492.0, 1072273.0, 1433278.0, 650378.0, 224835.0, 87404.0, 38934.0, 19056.0, 9979.0, 5403.0, 3157.0, 1949.0, 1171.0, 762.0, 483.0, 310.0, 223.0, 158.0, 96.0, 58.0, 41.0, 35.0, 30.0, 19.0, 10.0, 6.0, 3.0, 5.0, 7.0, 4.0, 5.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.140625, -15.569091796875, -14.99755859375, -14.426025390625, -13.8544921875, -13.282958984375, -12.71142578125, -12.139892578125, -11.568359375, -10.996826171875, -10.42529296875, -9.853759765625, -9.2822265625, -8.710693359375, -8.13916015625, -7.567626953125, -6.99609375, -6.424560546875, -5.85302734375, -5.281494140625, -4.7099609375, -4.138427734375, -3.56689453125, -2.995361328125, -2.423828125, -1.852294921875, -1.28076171875, -0.709228515625, -0.1376953125, 0.433837890625, 1.00537109375, 1.576904296875, 2.1484375, 2.719970703125, 3.29150390625, 3.863037109375, 4.4345703125, 5.006103515625, 5.57763671875, 6.149169921875, 6.720703125, 7.292236328125, 7.86376953125, 8.435302734375, 9.0068359375, 9.578369140625, 10.14990234375, 10.721435546875, 11.29296875, 11.864501953125, 12.43603515625, 13.007568359375, 13.5791015625, 14.150634765625, 14.72216796875, 15.293701171875, 15.865234375, 16.436767578125, 17.00830078125, 17.579833984375, 18.1513671875, 18.722900390625, 19.29443359375, 19.865966796875, 20.4375]}, "gradients/decoder.bert.encoder.layer.10.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 5.0, 11.0, 9.0, 6.0, 14.0, 11.0, 12.0, 20.0, 24.0, 27.0, 26.0, 25.0, 37.0, 40.0, 37.0, 40.0, 44.0, 42.0, 44.0, 34.0, 35.0, 45.0, 37.0, 42.0, 55.0, 32.0, 38.0, 38.0, 20.0, 25.0, 22.0, 22.0, 21.0, 9.0, 8.0, 7.0, 9.0, 7.0, 8.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.01171875, -6.7952880859375, -6.578857421875, -6.3624267578125, -6.14599609375, -5.9295654296875, -5.713134765625, -5.4967041015625, -5.2802734375, -5.0638427734375, -4.847412109375, -4.6309814453125, -4.41455078125, -4.1981201171875, -3.981689453125, -3.7652587890625, -3.548828125, -3.3323974609375, -3.115966796875, -2.8995361328125, -2.68310546875, -2.4666748046875, -2.250244140625, -2.0338134765625, -1.8173828125, -1.6009521484375, -1.384521484375, -1.1680908203125, -0.95166015625, -0.7352294921875, -0.518798828125, -0.3023681640625, -0.0859375, 0.1304931640625, 0.346923828125, 0.5633544921875, 0.77978515625, 0.9962158203125, 1.212646484375, 1.4290771484375, 1.6455078125, 1.8619384765625, 2.078369140625, 2.2947998046875, 2.51123046875, 2.7276611328125, 2.944091796875, 3.1605224609375, 3.376953125, 3.5933837890625, 3.809814453125, 4.0262451171875, 4.24267578125, 4.4591064453125, 4.675537109375, 4.8919677734375, 5.1083984375, 5.3248291015625, 5.541259765625, 5.7576904296875, 5.97412109375, 6.1905517578125, 6.406982421875, 6.6234130859375, 6.83984375]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 6.0, 3.0, 6.0, 13.0, 20.0, 24.0, 42.0, 49.0, 77.0, 122.0, 188.0, 242.0, 476.0, 713.0, 1178.0, 2001.0, 3234.0, 5850.0, 10503.0, 20184.0, 41310.0, 90135.0, 216389.0, 550684.0, 1230338.0, 1159887.0, 498878.0, 198077.0, 83200.0, 38242.0, 18807.0, 9873.0, 5449.0, 3128.0, 1918.0, 1190.0, 682.0, 431.0, 235.0, 188.0, 116.0, 66.0, 49.0, 21.0, 28.0, 16.0, 10.0, 4.0, 2.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.421875, -18.81396484375, -18.2060546875, -17.59814453125, -16.990234375, -16.38232421875, -15.7744140625, -15.16650390625, -14.55859375, -13.95068359375, -13.3427734375, -12.73486328125, -12.126953125, -11.51904296875, -10.9111328125, -10.30322265625, -9.6953125, -9.08740234375, -8.4794921875, -7.87158203125, -7.263671875, -6.65576171875, -6.0478515625, -5.43994140625, -4.83203125, -4.22412109375, -3.6162109375, -3.00830078125, -2.400390625, -1.79248046875, -1.1845703125, -0.57666015625, 0.03125, 0.63916015625, 1.2470703125, 1.85498046875, 2.462890625, 3.07080078125, 3.6787109375, 4.28662109375, 4.89453125, 5.50244140625, 6.1103515625, 6.71826171875, 7.326171875, 7.93408203125, 8.5419921875, 9.14990234375, 9.7578125, 10.36572265625, 10.9736328125, 11.58154296875, 12.189453125, 12.79736328125, 13.4052734375, 14.01318359375, 14.62109375, 15.22900390625, 15.8369140625, 16.44482421875, 17.052734375, 17.66064453125, 18.2685546875, 18.87646484375, 19.484375]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 5.0, 6.0, 7.0, 9.0, 11.0, 23.0, 23.0, 33.0, 48.0, 58.0, 60.0, 109.0, 131.0, 148.0, 188.0, 223.0, 290.0, 339.0, 350.0, 336.0, 310.0, 278.0, 238.0, 195.0, 160.0, 129.0, 88.0, 49.0, 46.0, 45.0, 35.0, 25.0, 20.0, 11.0, 10.0, 14.0, 4.0, 6.0, 6.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.55859375, -5.399658203125, -5.24072265625, -5.081787109375, -4.9228515625, -4.763916015625, -4.60498046875, -4.446044921875, -4.287109375, -4.128173828125, -3.96923828125, -3.810302734375, -3.6513671875, -3.492431640625, -3.33349609375, -3.174560546875, -3.015625, -2.856689453125, -2.69775390625, -2.538818359375, -2.3798828125, -2.220947265625, -2.06201171875, -1.903076171875, -1.744140625, -1.585205078125, -1.42626953125, -1.267333984375, -1.1083984375, -0.949462890625, -0.79052734375, -0.631591796875, -0.47265625, -0.313720703125, -0.15478515625, 0.004150390625, 0.1630859375, 0.322021484375, 0.48095703125, 0.639892578125, 0.798828125, 0.957763671875, 1.11669921875, 1.275634765625, 1.4345703125, 1.593505859375, 1.75244140625, 1.911376953125, 2.0703125, 2.229248046875, 2.38818359375, 2.547119140625, 2.7060546875, 2.864990234375, 3.02392578125, 3.182861328125, 3.341796875, 3.500732421875, 3.65966796875, 3.818603515625, 3.9775390625, 4.136474609375, 4.29541015625, 4.454345703125, 4.61328125]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 2.0, 5.0, 6.0, 12.0, 27.0, 31.0, 27.0, 35.0, 61.0, 68.0, 93.0, 106.0, 97.0, 98.0, 87.0, 59.0, 50.0, 38.0, 24.0, 21.0, 11.0, 5.0, 8.0, 6.0, 5.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.156291961669922, -27.379981994628906, -26.60367202758789, -25.827362060546875, -25.051050186157227, -24.27474021911621, -23.498430252075195, -22.72212028503418, -21.94580841064453, -21.169498443603516, -20.3931884765625, -19.616878509521484, -18.840566635131836, -18.06425666809082, -17.287946701049805, -16.51163673400879, -15.735326766967773, -14.959016799926758, -14.182705879211426, -13.40639591217041, -12.630084991455078, -11.853775024414062, -11.077465057373047, -10.301155090332031, -9.5248441696167, -8.748534202575684, -7.972223281860352, -7.195913314819336, -6.419602870941162, -5.643292427062988, -4.866982460021973, -4.090672016143799, -3.314361572265625, -2.538051128387451, -1.7617409229278564, -0.9854307174682617, -0.2091202735900879, 0.5671901702880859, 1.3435001373291016, 2.1198105812072754, 2.896121025085449, 3.672431468963623, 4.448741912841797, 5.2250518798828125, 6.001362323760986, 6.77767276763916, 7.553982734680176, 8.330293655395508, 9.106603622436523, 9.882913589477539, 10.659224510192871, 11.435534477233887, 12.211845397949219, 12.988155364990234, 13.76446533203125, 14.540775299072266, 15.317086219787598, 16.09339714050293, 16.869707107543945, 17.64601707458496, 18.422327041625977, 19.198638916015625, 19.97494888305664, 20.751258850097656, 21.527568817138672]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 8.0, 4.0, 11.0, 12.0, 10.0, 12.0, 15.0, 31.0, 25.0, 24.0, 18.0, 23.0, 25.0, 49.0, 47.0, 43.0, 35.0, 53.0, 53.0, 45.0, 42.0, 37.0, 48.0, 49.0, 35.0, 39.0, 26.0, 32.0, 27.0, 27.0, 25.0, 17.0, 10.0, 8.0, 11.0, 7.0, 5.0, 4.0, 3.0, 3.0, 2.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.673925399780273, -9.38236141204834, -9.090797424316406, -8.799233436584473, -8.507669448852539, -8.216106414794922, -7.924542427062988, -7.632978439331055, -7.341414451599121, -7.0498504638671875, -6.758286476135254, -6.4667229652404785, -6.175158977508545, -5.883594989776611, -5.592031478881836, -5.300467491149902, -5.008903503417969, -4.717339515686035, -4.425775527954102, -4.134212017059326, -3.8426480293273926, -3.551084041595459, -3.2595202922821045, -2.96795654296875, -2.6763925552368164, -2.384828567504883, -2.0932648181915283, -1.8017009496688843, -1.5101370811462402, -1.2185732126235962, -0.9270093441009521, -0.6354455947875977, -0.34388256072998047, -0.052318692207336426, 0.23924517631530762, 0.5308090448379517, 0.8223729133605957, 1.1139367818832397, 1.4055006504058838, 1.6970643997192383, 1.9886283874511719, 2.2801923751831055, 2.57175612449646, 2.8633198738098145, 3.154883861541748, 3.4464478492736816, 3.738011598587036, 4.029575347900391, 4.321139335632324, 4.612703323364258, 4.904267311096191, 5.195830821990967, 5.4873948097229, 5.778958797454834, 6.070522308349609, 6.362086296081543, 6.653650283813477, 6.94521427154541, 7.236778259277344, 7.528341770172119, 7.819905757904053, 8.111469268798828, 8.403033256530762, 8.694597244262695, 8.986161231994629]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 9.0, 19.0, 10.0, 18.0, 30.0, 70.0, 67.0, 133.0, 196.0, 292.0, 456.0, 787.0, 1341.0, 2365.0, 4223.0, 8062.0, 15797.0, 31183.0, 63709.0, 128020.0, 223267.0, 247390.0, 158639.0, 81154.0, 39573.0, 19630.0, 9979.0, 5179.0, 2917.0, 1585.0, 950.0, 539.0, 348.0, 213.0, 130.0, 99.0, 60.0, 36.0, 17.0, 25.0, 12.0, 12.0, 4.0, 8.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.48046875, -7.2479248046875, -7.015380859375, -6.7828369140625, -6.55029296875, -6.3177490234375, -6.085205078125, -5.8526611328125, -5.6201171875, -5.3875732421875, -5.155029296875, -4.9224853515625, -4.68994140625, -4.4573974609375, -4.224853515625, -3.9923095703125, -3.759765625, -3.5272216796875, -3.294677734375, -3.0621337890625, -2.82958984375, -2.5970458984375, -2.364501953125, -2.1319580078125, -1.8994140625, -1.6668701171875, -1.434326171875, -1.2017822265625, -0.96923828125, -0.7366943359375, -0.504150390625, -0.2716064453125, -0.0390625, 0.1934814453125, 0.426025390625, 0.6585693359375, 0.89111328125, 1.1236572265625, 1.356201171875, 1.5887451171875, 1.8212890625, 2.0538330078125, 2.286376953125, 2.5189208984375, 2.75146484375, 2.9840087890625, 3.216552734375, 3.4490966796875, 3.681640625, 3.9141845703125, 4.146728515625, 4.3792724609375, 4.61181640625, 4.8443603515625, 5.076904296875, 5.3094482421875, 5.5419921875, 5.7745361328125, 6.007080078125, 6.2396240234375, 6.47216796875, 6.7047119140625, 6.937255859375, 7.1697998046875, 7.40234375]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 10.0, 5.0, 4.0, 11.0, 15.0, 9.0, 18.0, 20.0, 23.0, 38.0, 34.0, 33.0, 52.0, 39.0, 47.0, 55.0, 56.0, 51.0, 54.0, 54.0, 44.0, 43.0, 36.0, 41.0, 34.0, 31.0, 31.0, 19.0, 13.0, 23.0, 9.0, 10.0, 11.0, 7.0, 11.0, 2.0, 4.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.7890625, -11.4381103515625, -11.087158203125, -10.7362060546875, -10.38525390625, -10.0343017578125, -9.683349609375, -9.3323974609375, -8.9814453125, -8.6304931640625, -8.279541015625, -7.9285888671875, -7.57763671875, -7.2266845703125, -6.875732421875, -6.5247802734375, -6.173828125, -5.8228759765625, -5.471923828125, -5.1209716796875, -4.77001953125, -4.4190673828125, -4.068115234375, -3.7171630859375, -3.3662109375, -3.0152587890625, -2.664306640625, -2.3133544921875, -1.96240234375, -1.6114501953125, -1.260498046875, -0.9095458984375, -0.55859375, -0.2076416015625, 0.143310546875, 0.4942626953125, 0.84521484375, 1.1961669921875, 1.547119140625, 1.8980712890625, 2.2490234375, 2.5999755859375, 2.950927734375, 3.3018798828125, 3.65283203125, 4.0037841796875, 4.354736328125, 4.7056884765625, 5.056640625, 5.4075927734375, 5.758544921875, 6.1094970703125, 6.46044921875, 6.8114013671875, 7.162353515625, 7.5133056640625, 7.8642578125, 8.2152099609375, 8.566162109375, 8.9171142578125, 9.26806640625, 9.6190185546875, 9.969970703125, 10.3209228515625, 10.671875]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 4.0, 5.0, 4.0, 8.0, 16.0, 17.0, 36.0, 42.0, 62.0, 79.0, 140.0, 154.0, 251.0, 384.0, 560.0, 789.0, 1203.0, 1851.0, 2855.0, 4453.0, 7397.0, 12135.0, 20294.0, 36648.0, 64542.0, 115678.0, 190663.0, 222377.0, 155925.0, 89627.0, 49881.0, 28060.0, 16186.0, 9570.0, 5941.0, 3707.0, 2338.0, 1494.0, 1054.0, 684.0, 461.0, 305.0, 219.0, 145.0, 109.0, 76.0, 45.0, 29.0, 17.0, 16.0, 13.0, 4.0, 5.0, 6.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-6.90625, -6.67816162109375, -6.4500732421875, -6.22198486328125, -5.993896484375, -5.76580810546875, -5.5377197265625, -5.30963134765625, -5.08154296875, -4.85345458984375, -4.6253662109375, -4.39727783203125, -4.169189453125, -3.94110107421875, -3.7130126953125, -3.48492431640625, -3.2568359375, -3.02874755859375, -2.8006591796875, -2.57257080078125, -2.344482421875, -2.11639404296875, -1.8883056640625, -1.66021728515625, -1.43212890625, -1.20404052734375, -0.9759521484375, -0.74786376953125, -0.519775390625, -0.29168701171875, -0.0635986328125, 0.16448974609375, 0.392578125, 0.62066650390625, 0.8487548828125, 1.07684326171875, 1.304931640625, 1.53302001953125, 1.7611083984375, 1.98919677734375, 2.21728515625, 2.44537353515625, 2.6734619140625, 2.90155029296875, 3.129638671875, 3.35772705078125, 3.5858154296875, 3.81390380859375, 4.0419921875, 4.27008056640625, 4.4981689453125, 4.72625732421875, 4.954345703125, 5.18243408203125, 5.4105224609375, 5.63861083984375, 5.86669921875, 6.09478759765625, 6.3228759765625, 6.55096435546875, 6.779052734375, 7.00714111328125, 7.2352294921875, 7.46331787109375, 7.69140625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 0.0, 3.0, 4.0, 3.0, 7.0, 4.0, 10.0, 18.0, 11.0, 14.0, 13.0, 16.0, 24.0, 18.0, 26.0, 26.0, 19.0, 32.0, 32.0, 30.0, 41.0, 42.0, 33.0, 35.0, 39.0, 28.0, 26.0, 46.0, 36.0, 26.0, 35.0, 39.0, 25.0, 35.0, 31.0, 26.0, 20.0, 22.0, 12.0, 18.0, 13.0, 17.0, 9.0, 12.0, 9.0, 10.0, 3.0, 2.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.703125, -4.5478515625, -4.392578125, -4.2373046875, -4.08203125, -3.9267578125, -3.771484375, -3.6162109375, -3.4609375, -3.3056640625, -3.150390625, -2.9951171875, -2.83984375, -2.6845703125, -2.529296875, -2.3740234375, -2.21875, -2.0634765625, -1.908203125, -1.7529296875, -1.59765625, -1.4423828125, -1.287109375, -1.1318359375, -0.9765625, -0.8212890625, -0.666015625, -0.5107421875, -0.35546875, -0.2001953125, -0.044921875, 0.1103515625, 0.265625, 0.4208984375, 0.576171875, 0.7314453125, 0.88671875, 1.0419921875, 1.197265625, 1.3525390625, 1.5078125, 1.6630859375, 1.818359375, 1.9736328125, 2.12890625, 2.2841796875, 2.439453125, 2.5947265625, 2.75, 2.9052734375, 3.060546875, 3.2158203125, 3.37109375, 3.5263671875, 3.681640625, 3.8369140625, 3.9921875, 4.1474609375, 4.302734375, 4.4580078125, 4.61328125, 4.7685546875, 4.923828125, 5.0791015625, 5.234375]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 1.0, 8.0, 5.0, 6.0, 19.0, 21.0, 34.0, 43.0, 61.0, 124.0, 198.0, 322.0, 550.0, 885.0, 1641.0, 3033.0, 5552.0, 10782.0, 21843.0, 47423.0, 108229.0, 240895.0, 310862.0, 161990.0, 70684.0, 31723.0, 14973.0, 7605.0, 3904.0, 2136.0, 1267.0, 699.0, 403.0, 261.0, 151.0, 98.0, 43.0, 35.0, 21.0, 8.0, 13.0, 1.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-3.892578125, -3.788055419921875, -3.68353271484375, -3.579010009765625, -3.4744873046875, -3.369964599609375, -3.26544189453125, -3.160919189453125, -3.056396484375, -2.951873779296875, -2.84735107421875, -2.742828369140625, -2.6383056640625, -2.533782958984375, -2.42926025390625, -2.324737548828125, -2.22021484375, -2.115692138671875, -2.01116943359375, -1.906646728515625, -1.8021240234375, -1.697601318359375, -1.59307861328125, -1.488555908203125, -1.384033203125, -1.279510498046875, -1.17498779296875, -1.070465087890625, -0.9659423828125, -0.861419677734375, -0.75689697265625, -0.652374267578125, -0.5478515625, -0.443328857421875, -0.33880615234375, -0.234283447265625, -0.1297607421875, -0.025238037109375, 0.07928466796875, 0.183807373046875, 0.288330078125, 0.392852783203125, 0.49737548828125, 0.601898193359375, 0.7064208984375, 0.810943603515625, 0.91546630859375, 1.019989013671875, 1.12451171875, 1.229034423828125, 1.33355712890625, 1.438079833984375, 1.5426025390625, 1.647125244140625, 1.75164794921875, 1.856170654296875, 1.960693359375, 2.065216064453125, 2.16973876953125, 2.274261474609375, 2.3787841796875, 2.483306884765625, 2.58782958984375, 2.692352294921875, 2.796875]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 0.0, 2.0, 4.0, 1.0, 6.0, 12.0, 7.0, 16.0, 29.0, 28.0, 38.0, 38.0, 59.0, 66.0, 67.0, 68.0, 75.0, 81.0, 76.0, 69.0, 49.0, 48.0, 32.0, 32.0, 14.0, 16.0, 23.0, 16.0, 9.0, 12.0, 1.0, 3.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0002593994140625, -0.00025214627385139465, -0.0002448931336402893, -0.00023763999342918396, -0.0002303868532180786, -0.00022313371300697327, -0.00021588057279586792, -0.00020862743258476257, -0.00020137429237365723, -0.00019412115216255188, -0.00018686801195144653, -0.0001796148717403412, -0.00017236173152923584, -0.0001651085913181305, -0.00015785545110702515, -0.0001506023108959198, -0.00014334917068481445, -0.0001360960304737091, -0.00012884289026260376, -0.00012158975005149841, -0.00011433660984039307, -0.00010708346962928772, -9.983032941818237e-05, -9.257718920707703e-05, -8.532404899597168e-05, -7.807090878486633e-05, -7.081776857376099e-05, -6.356462836265564e-05, -5.631148815155029e-05, -4.9058347940444946e-05, -4.18052077293396e-05, -3.455206751823425e-05, -2.7298927307128906e-05, -2.004578709602356e-05, -1.2792646884918213e-05, -5.539506673812866e-06, 1.7136335372924805e-06, 8.966773748397827e-06, 1.6219913959503174e-05, 2.347305417060852e-05, 3.072619438171387e-05, 3.7979334592819214e-05, 4.523247480392456e-05, 5.248561501502991e-05, 5.9738755226135254e-05, 6.69918954372406e-05, 7.424503564834595e-05, 8.14981758594513e-05, 8.875131607055664e-05, 9.600445628166199e-05, 0.00010325759649276733, 0.00011051073670387268, 0.00011776387691497803, 0.00012501701712608337, 0.00013227015733718872, 0.00013952329754829407, 0.00014677643775939941, 0.00015402957797050476, 0.0001612827181816101, 0.00016853585839271545, 0.0001757889986038208, 0.00018304213881492615, 0.0001902952790260315, 0.00019754841923713684, 0.0002048015594482422]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 8.0, 18.0, 18.0, 24.0, 28.0, 46.0, 56.0, 93.0, 141.0, 187.0, 287.0, 454.0, 679.0, 1056.0, 1744.0, 2793.0, 4808.0, 8116.0, 13860.0, 24592.0, 43747.0, 78082.0, 130524.0, 186441.0, 195446.0, 146644.0, 89654.0, 51224.0, 28324.0, 16046.0, 9287.0, 5340.0, 3280.0, 2061.0, 1233.0, 783.0, 479.0, 316.0, 221.0, 119.0, 105.0, 59.0, 41.0, 28.0, 28.0, 18.0, 6.0, 3.0, 7.0, 3.0, 2.0, 0.0, 1.0, 3.0], "bins": [-2.599609375, -2.5234375, -2.447265625, -2.37109375, -2.294921875, -2.21875, -2.142578125, -2.06640625, -1.990234375, -1.9140625, -1.837890625, -1.76171875, -1.685546875, -1.609375, -1.533203125, -1.45703125, -1.380859375, -1.3046875, -1.228515625, -1.15234375, -1.076171875, -1.0, -0.923828125, -0.84765625, -0.771484375, -0.6953125, -0.619140625, -0.54296875, -0.466796875, -0.390625, -0.314453125, -0.23828125, -0.162109375, -0.0859375, -0.009765625, 0.06640625, 0.142578125, 0.21875, 0.294921875, 0.37109375, 0.447265625, 0.5234375, 0.599609375, 0.67578125, 0.751953125, 0.828125, 0.904296875, 0.98046875, 1.056640625, 1.1328125, 1.208984375, 1.28515625, 1.361328125, 1.4375, 1.513671875, 1.58984375, 1.666015625, 1.7421875, 1.818359375, 1.89453125, 1.970703125, 2.046875, 2.123046875, 2.19921875, 2.275390625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 6.0, 7.0, 3.0, 8.0, 8.0, 14.0, 10.0, 11.0, 9.0, 13.0, 20.0, 28.0, 15.0, 25.0, 25.0, 39.0, 33.0, 34.0, 48.0, 42.0, 38.0, 49.0, 50.0, 56.0, 50.0, 45.0, 50.0, 29.0, 36.0, 29.0, 23.0, 18.0, 22.0, 20.0, 11.0, 7.0, 7.0, 11.0, 13.0, 4.0, 3.0, 13.0, 9.0, 3.0, 2.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.477783203125, -0.4606971740722656, -0.44361114501953125, -0.4265251159667969, -0.4094390869140625, -0.3923530578613281, -0.37526702880859375, -0.3581809997558594, -0.341094970703125, -0.3240089416503906, -0.30692291259765625, -0.2898368835449219, -0.2727508544921875, -0.2556648254394531, -0.23857879638671875, -0.22149276733398438, -0.20440673828125, -0.18732070922851562, -0.17023468017578125, -0.15314865112304688, -0.1360626220703125, -0.11897659301757812, -0.10189056396484375, -0.08480453491210938, -0.067718505859375, -0.050632476806640625, -0.03354644775390625, -0.016460418701171875, 0.0006256103515625, 0.017711639404296875, 0.03479766845703125, 0.051883697509765625, 0.0689697265625, 0.08605575561523438, 0.10314178466796875, 0.12022781372070312, 0.1373138427734375, 0.15439987182617188, 0.17148590087890625, 0.18857192993164062, 0.205657958984375, 0.22274398803710938, 0.23983001708984375, 0.2569160461425781, 0.2740020751953125, 0.2910881042480469, 0.30817413330078125, 0.3252601623535156, 0.34234619140625, 0.3594322204589844, 0.37651824951171875, 0.3936042785644531, 0.4106903076171875, 0.4277763366699219, 0.44486236572265625, 0.4619483947753906, 0.479034423828125, 0.4961204528808594, 0.5132064819335938, 0.5302925109863281, 0.5473785400390625, 0.5644645690917969, 0.5815505981445312, 0.5986366271972656, 0.61572265625]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 9.0, 8.0, 16.0, 22.0, 32.0, 30.0, 29.0, 58.0, 79.0, 100.0, 100.0, 99.0, 103.0, 92.0, 43.0, 51.0, 32.0, 24.0, 17.0, 10.0, 8.0, 9.0, 5.0, 7.0, 4.0, 5.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.03840446472168, -27.26146125793457, -26.48451805114746, -25.70757484436035, -24.930631637573242, -24.153688430786133, -23.37674331665039, -22.59980010986328, -21.822856903076172, -21.045913696289062, -20.268970489501953, -19.492027282714844, -18.715084075927734, -17.938140869140625, -17.161197662353516, -16.384254455566406, -15.607311248779297, -14.830368041992188, -14.053424835205078, -13.276481628417969, -12.49953842163086, -11.72259521484375, -10.945651054382324, -10.168707847595215, -9.391764640808105, -8.614821434020996, -7.837878227233887, -7.060934543609619, -6.28399133682251, -5.5070481300354, -4.730104446411133, -3.9531612396240234, -3.176219940185547, -2.3992767333984375, -1.622333288192749, -0.8453898429870605, -0.06844663619995117, 0.7084965705871582, 1.4854402542114258, 2.262383460998535, 3.0393266677856445, 3.816269874572754, 4.593213081359863, 5.370156764984131, 6.14709997177124, 6.92404317855835, 7.700986862182617, 8.477930068969727, 9.254873275756836, 10.031816482543945, 10.808759689331055, 11.585702896118164, 12.362646102905273, 13.139589309692383, 13.916533470153809, 14.693476676940918, 15.470419883728027, 16.247364044189453, 17.024307250976562, 17.801250457763672, 18.57819366455078, 19.35513687133789, 20.132080078125, 20.90902328491211, 21.68596649169922]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 9.0, 4.0, 8.0, 16.0, 7.0, 13.0, 13.0, 27.0, 28.0, 23.0, 20.0, 23.0, 26.0, 43.0, 47.0, 45.0, 35.0, 52.0, 51.0, 39.0, 51.0, 39.0, 51.0, 44.0, 40.0, 40.0, 23.0, 31.0, 24.0, 30.0, 30.0, 14.0, 12.0, 9.0, 11.0, 4.0, 7.0, 5.0, 2.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.641823768615723, -9.352274894714355, -9.062726020812988, -8.773177146911621, -8.483628273010254, -8.194079399108887, -7.904531002044678, -7.6149821281433105, -7.325433254241943, -7.035884380340576, -6.746335506439209, -6.456786632537842, -6.167238235473633, -5.877689361572266, -5.588140487670898, -5.298591613769531, -5.009042739868164, -4.719493865966797, -4.42994499206543, -4.1403961181640625, -3.8508474826812744, -3.5612986087799072, -3.271749973297119, -2.982201099395752, -2.6926522254943848, -2.4031033515930176, -2.1135544776916504, -1.8240058422088623, -1.5344569683074951, -1.244908094406128, -0.9553593397140503, -0.6658105850219727, -0.3762626647949219, -0.08671385049819946, 0.20283496379852295, 0.49238377809524536, 0.7819325923919678, 1.071481466293335, 1.3610302209854126, 1.6505789756774902, 1.9401278495788574, 2.2296767234802246, 2.519225597381592, 2.80877423286438, 3.098323106765747, 3.3878719806671143, 3.6774206161499023, 3.9669694900512695, 4.256518363952637, 4.546067237854004, 4.835616111755371, 5.125164985656738, 5.4147138595581055, 5.704262733459473, 5.993811130523682, 6.283360004425049, 6.572908878326416, 6.862457752227783, 7.15200662612915, 7.441555500030518, 7.731103897094727, 8.020652770996094, 8.310201644897461, 8.599750518798828, 8.889299392700195]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 3.0, 12.0, 7.0, 15.0, 27.0, 30.0, 40.0, 64.0, 93.0, 139.0, 182.0, 301.0, 451.0, 693.0, 1084.0, 1605.0, 2479.0, 3905.0, 6266.0, 10201.0, 17068.0, 27889.0, 44955.0, 70278.0, 105351.0, 142008.0, 160607.0, 145726.0, 109481.0, 73783.0, 47446.0, 29269.0, 17934.0, 10816.0, 6698.0, 4210.0, 2627.0, 1639.0, 1074.0, 674.0, 468.0, 316.0, 211.0, 120.0, 90.0, 72.0, 52.0, 28.0, 26.0, 18.0, 11.0, 8.0, 5.0, 5.0, 2.0, 3.0, 3.0], "bins": [-11.21875, -10.8843994140625, -10.550048828125, -10.2156982421875, -9.88134765625, -9.5469970703125, -9.212646484375, -8.8782958984375, -8.5439453125, -8.2095947265625, -7.875244140625, -7.5408935546875, -7.20654296875, -6.8721923828125, -6.537841796875, -6.2034912109375, -5.869140625, -5.5347900390625, -5.200439453125, -4.8660888671875, -4.53173828125, -4.1973876953125, -3.863037109375, -3.5286865234375, -3.1943359375, -2.8599853515625, -2.525634765625, -2.1912841796875, -1.85693359375, -1.5225830078125, -1.188232421875, -0.8538818359375, -0.51953125, -0.1851806640625, 0.149169921875, 0.4835205078125, 0.81787109375, 1.1522216796875, 1.486572265625, 1.8209228515625, 2.1552734375, 2.4896240234375, 2.823974609375, 3.1583251953125, 3.49267578125, 3.8270263671875, 4.161376953125, 4.4957275390625, 4.830078125, 5.1644287109375, 5.498779296875, 5.8331298828125, 6.16748046875, 6.5018310546875, 6.836181640625, 7.1705322265625, 7.5048828125, 7.8392333984375, 8.173583984375, 8.5079345703125, 8.84228515625, 9.1766357421875, 9.510986328125, 9.8453369140625, 10.1796875]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 4.0, 7.0, 5.0, 6.0, 9.0, 9.0, 15.0, 15.0, 21.0, 18.0, 18.0, 14.0, 29.0, 31.0, 44.0, 42.0, 40.0, 32.0, 46.0, 43.0, 56.0, 58.0, 42.0, 42.0, 40.0, 34.0, 32.0, 33.0, 28.0, 31.0, 36.0, 20.0, 21.0, 20.0, 16.0, 9.0, 12.0, 4.0, 6.0, 5.0, 7.0, 2.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.8671875, -9.5587158203125, -9.250244140625, -8.9417724609375, -8.63330078125, -8.3248291015625, -8.016357421875, -7.7078857421875, -7.3994140625, -7.0909423828125, -6.782470703125, -6.4739990234375, -6.16552734375, -5.8570556640625, -5.548583984375, -5.2401123046875, -4.931640625, -4.6231689453125, -4.314697265625, -4.0062255859375, -3.69775390625, -3.3892822265625, -3.080810546875, -2.7723388671875, -2.4638671875, -2.1553955078125, -1.846923828125, -1.5384521484375, -1.22998046875, -0.9215087890625, -0.613037109375, -0.3045654296875, 0.00390625, 0.3123779296875, 0.620849609375, 0.9293212890625, 1.23779296875, 1.5462646484375, 1.854736328125, 2.1632080078125, 2.4716796875, 2.7801513671875, 3.088623046875, 3.3970947265625, 3.70556640625, 4.0140380859375, 4.322509765625, 4.6309814453125, 4.939453125, 5.2479248046875, 5.556396484375, 5.8648681640625, 6.17333984375, 6.4818115234375, 6.790283203125, 7.0987548828125, 7.4072265625, 7.7156982421875, 8.024169921875, 8.3326416015625, 8.64111328125, 8.9495849609375, 9.258056640625, 9.5665283203125, 9.875]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 9.0, 12.0, 7.0, 14.0, 16.0, 31.0, 39.0, 68.0, 118.0, 171.0, 285.0, 452.0, 671.0, 1183.0, 2034.0, 3446.0, 6058.0, 10641.0, 19299.0, 34190.0, 59740.0, 99504.0, 147613.0, 180085.0, 169759.0, 125797.0, 80045.0, 46706.0, 26137.0, 14771.0, 8109.0, 4645.0, 2733.0, 1651.0, 935.0, 599.0, 356.0, 219.0, 143.0, 90.0, 65.0, 43.0, 29.0, 19.0, 14.0, 6.0, 4.0, 3.0, 1.0, 2.0], "bins": [-14.8984375, -14.5040283203125, -14.109619140625, -13.7152099609375, -13.32080078125, -12.9263916015625, -12.531982421875, -12.1375732421875, -11.7431640625, -11.3487548828125, -10.954345703125, -10.5599365234375, -10.16552734375, -9.7711181640625, -9.376708984375, -8.9822998046875, -8.587890625, -8.1934814453125, -7.799072265625, -7.4046630859375, -7.01025390625, -6.6158447265625, -6.221435546875, -5.8270263671875, -5.4326171875, -5.0382080078125, -4.643798828125, -4.2493896484375, -3.85498046875, -3.4605712890625, -3.066162109375, -2.6717529296875, -2.27734375, -1.8829345703125, -1.488525390625, -1.0941162109375, -0.69970703125, -0.3052978515625, 0.089111328125, 0.4835205078125, 0.8779296875, 1.2723388671875, 1.666748046875, 2.0611572265625, 2.45556640625, 2.8499755859375, 3.244384765625, 3.6387939453125, 4.033203125, 4.4276123046875, 4.822021484375, 5.2164306640625, 5.61083984375, 6.0052490234375, 6.399658203125, 6.7940673828125, 7.1884765625, 7.5828857421875, 7.977294921875, 8.3717041015625, 8.76611328125, 9.1605224609375, 9.554931640625, 9.9493408203125, 10.34375]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 4.0, 4.0, 2.0, 5.0, 4.0, 5.0, 9.0, 6.0, 9.0, 12.0, 14.0, 15.0, 17.0, 20.0, 32.0, 22.0, 22.0, 27.0, 29.0, 34.0, 42.0, 45.0, 43.0, 37.0, 53.0, 26.0, 39.0, 36.0, 49.0, 45.0, 31.0, 25.0, 28.0, 35.0, 31.0, 27.0, 30.0, 18.0, 21.0, 9.0, 6.0, 9.0, 10.0, 6.0, 8.0, 4.0, 0.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.140625, -4.9735107421875, -4.806396484375, -4.6392822265625, -4.47216796875, -4.3050537109375, -4.137939453125, -3.9708251953125, -3.8037109375, -3.6365966796875, -3.469482421875, -3.3023681640625, -3.13525390625, -2.9681396484375, -2.801025390625, -2.6339111328125, -2.466796875, -2.2996826171875, -2.132568359375, -1.9654541015625, -1.79833984375, -1.6312255859375, -1.464111328125, -1.2969970703125, -1.1298828125, -0.9627685546875, -0.795654296875, -0.6285400390625, -0.46142578125, -0.2943115234375, -0.127197265625, 0.0399169921875, 0.20703125, 0.3741455078125, 0.541259765625, 0.7083740234375, 0.87548828125, 1.0426025390625, 1.209716796875, 1.3768310546875, 1.5439453125, 1.7110595703125, 1.878173828125, 2.0452880859375, 2.21240234375, 2.3795166015625, 2.546630859375, 2.7137451171875, 2.880859375, 3.0479736328125, 3.215087890625, 3.3822021484375, 3.54931640625, 3.7164306640625, 3.883544921875, 4.0506591796875, 4.2177734375, 4.3848876953125, 4.552001953125, 4.7191162109375, 4.88623046875, 5.0533447265625, 5.220458984375, 5.3875732421875, 5.5546875]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 3.0, 9.0, 8.0, 15.0, 30.0, 46.0, 65.0, 105.0, 112.0, 193.0, 281.0, 468.0, 745.0, 1080.0, 1677.0, 2725.0, 4547.0, 7626.0, 13142.0, 23409.0, 42881.0, 81503.0, 147718.0, 218323.0, 206998.0, 132915.0, 72534.0, 38669.0, 20974.0, 11828.0, 6904.0, 4148.0, 2441.0, 1577.0, 1002.0, 599.0, 456.0, 247.0, 191.0, 114.0, 92.0, 54.0, 46.0, 19.0, 11.0, 10.0, 9.0, 5.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.33203125, -5.1649169921875, -4.997802734375, -4.8306884765625, -4.66357421875, -4.4964599609375, -4.329345703125, -4.1622314453125, -3.9951171875, -3.8280029296875, -3.660888671875, -3.4937744140625, -3.32666015625, -3.1595458984375, -2.992431640625, -2.8253173828125, -2.658203125, -2.4910888671875, -2.323974609375, -2.1568603515625, -1.98974609375, -1.8226318359375, -1.655517578125, -1.4884033203125, -1.3212890625, -1.1541748046875, -0.987060546875, -0.8199462890625, -0.65283203125, -0.4857177734375, -0.318603515625, -0.1514892578125, 0.015625, 0.1827392578125, 0.349853515625, 0.5169677734375, 0.68408203125, 0.8511962890625, 1.018310546875, 1.1854248046875, 1.3525390625, 1.5196533203125, 1.686767578125, 1.8538818359375, 2.02099609375, 2.1881103515625, 2.355224609375, 2.5223388671875, 2.689453125, 2.8565673828125, 3.023681640625, 3.1907958984375, 3.35791015625, 3.5250244140625, 3.692138671875, 3.8592529296875, 4.0263671875, 4.1934814453125, 4.360595703125, 4.5277099609375, 4.69482421875, 4.8619384765625, 5.029052734375, 5.1961669921875, 5.36328125]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 8.0, 3.0, 9.0, 9.0, 18.0, 17.0, 21.0, 27.0, 28.0, 39.0, 46.0, 55.0, 67.0, 74.0, 60.0, 71.0, 65.0, 57.0, 65.0, 46.0, 41.0, 34.0, 15.0, 20.0, 21.0, 20.0, 8.0, 9.0, 13.0, 5.0, 7.0, 7.0, 5.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004773139953613281, -0.000460110604763031, -0.0004429072141647339, -0.00042570382356643677, -0.00040850043296813965, -0.00039129704236984253, -0.0003740936517715454, -0.0003568902611732483, -0.00033968687057495117, -0.00032248347997665405, -0.00030528008937835693, -0.0002880766987800598, -0.0002708733081817627, -0.0002536699175834656, -0.00023646652698516846, -0.00021926313638687134, -0.00020205974578857422, -0.0001848563551902771, -0.00016765296459197998, -0.00015044957399368286, -0.00013324618339538574, -0.00011604279279708862, -9.88394021987915e-05, -8.163601160049438e-05, -6.443262100219727e-05, -4.7229230403900146e-05, -3.0025839805603027e-05, -1.2822449207305908e-05, 4.380941390991211e-06, 2.158433198928833e-05, 3.878772258758545e-05, 5.599111318588257e-05, 7.319450378417969e-05, 9.03978943824768e-05, 0.00010760128498077393, 0.00012480467557907104, 0.00014200806617736816, 0.00015921145677566528, 0.0001764148473739624, 0.00019361823797225952, 0.00021082162857055664, 0.00022802501916885376, 0.0002452284097671509, 0.000262431800365448, 0.0002796351909637451, 0.00029683858156204224, 0.00031404197216033936, 0.0003312453627586365, 0.0003484487533569336, 0.0003656521439552307, 0.00038285553455352783, 0.00040005892515182495, 0.00041726231575012207, 0.0004344657063484192, 0.0004516690969467163, 0.00046887248754501343, 0.00048607587814331055, 0.0005032792687416077, 0.0005204826593399048, 0.0005376860499382019, 0.000554889440536499, 0.0005720928311347961, 0.0005892962217330933, 0.0006064996123313904, 0.0006237030029296875]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 7.0, 7.0, 8.0, 7.0, 14.0, 17.0, 16.0, 36.0, 48.0, 74.0, 113.0, 148.0, 204.0, 296.0, 425.0, 625.0, 895.0, 1336.0, 1959.0, 2927.0, 4640.0, 7194.0, 11654.0, 18945.0, 32408.0, 55556.0, 93714.0, 149239.0, 192570.0, 174409.0, 119690.0, 72102.0, 41991.0, 24599.0, 14679.0, 9102.0, 5837.0, 3668.0, 2413.0, 1617.0, 1140.0, 697.0, 463.0, 343.0, 204.0, 156.0, 105.0, 91.0, 45.0, 46.0, 16.0, 18.0, 20.0, 7.0, 15.0, 5.0, 3.0, 3.0, 3.0, 2.0, 1.0], "bins": [-4.58203125, -4.43768310546875, -4.2933349609375, -4.14898681640625, -4.004638671875, -3.86029052734375, -3.7159423828125, -3.57159423828125, -3.42724609375, -3.28289794921875, -3.1385498046875, -2.99420166015625, -2.849853515625, -2.70550537109375, -2.5611572265625, -2.41680908203125, -2.2724609375, -2.12811279296875, -1.9837646484375, -1.83941650390625, -1.695068359375, -1.55072021484375, -1.4063720703125, -1.26202392578125, -1.11767578125, -0.97332763671875, -0.8289794921875, -0.68463134765625, -0.540283203125, -0.39593505859375, -0.2515869140625, -0.10723876953125, 0.037109375, 0.18145751953125, 0.3258056640625, 0.47015380859375, 0.614501953125, 0.75885009765625, 0.9031982421875, 1.04754638671875, 1.19189453125, 1.33624267578125, 1.4805908203125, 1.62493896484375, 1.769287109375, 1.91363525390625, 2.0579833984375, 2.20233154296875, 2.3466796875, 2.49102783203125, 2.6353759765625, 2.77972412109375, 2.924072265625, 3.06842041015625, 3.2127685546875, 3.35711669921875, 3.50146484375, 3.64581298828125, 3.7901611328125, 3.93450927734375, 4.078857421875, 4.22320556640625, 4.3675537109375, 4.51190185546875, 4.65625]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 6.0, 8.0, 11.0, 11.0, 13.0, 18.0, 16.0, 11.0, 15.0, 20.0, 26.0, 39.0, 29.0, 48.0, 48.0, 49.0, 62.0, 64.0, 59.0, 46.0, 52.0, 68.0, 41.0, 37.0, 33.0, 25.0, 17.0, 29.0, 21.0, 14.0, 10.0, 11.0, 11.0, 9.0, 4.0, 5.0, 6.0, 2.0, 3.0, 1.0, 4.0, 0.0, 2.0, 2.0, 2.0, 1.0], "bins": [-1.7060546875, -1.658447265625, -1.61083984375, -1.563232421875, -1.515625, -1.468017578125, -1.42041015625, -1.372802734375, -1.3251953125, -1.277587890625, -1.22998046875, -1.182373046875, -1.134765625, -1.087158203125, -1.03955078125, -0.991943359375, -0.9443359375, -0.896728515625, -0.84912109375, -0.801513671875, -0.75390625, -0.706298828125, -0.65869140625, -0.611083984375, -0.5634765625, -0.515869140625, -0.46826171875, -0.420654296875, -0.373046875, -0.325439453125, -0.27783203125, -0.230224609375, -0.1826171875, -0.135009765625, -0.08740234375, -0.039794921875, 0.0078125, 0.055419921875, 0.10302734375, 0.150634765625, 0.1982421875, 0.245849609375, 0.29345703125, 0.341064453125, 0.388671875, 0.436279296875, 0.48388671875, 0.531494140625, 0.5791015625, 0.626708984375, 0.67431640625, 0.721923828125, 0.76953125, 0.817138671875, 0.86474609375, 0.912353515625, 0.9599609375, 1.007568359375, 1.05517578125, 1.102783203125, 1.150390625, 1.197998046875, 1.24560546875, 1.293212890625, 1.3408203125]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 6.0, 5.0, 6.0, 7.0, 17.0, 25.0, 16.0, 27.0, 35.0, 40.0, 61.0, 81.0, 88.0, 99.0, 90.0, 80.0, 67.0, 58.0, 49.0, 25.0, 30.0, 14.0, 20.0, 6.0, 7.0, 8.0, 9.0, 3.0, 3.0, 7.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.686668395996094, -23.007476806640625, -22.328285217285156, -21.649091720581055, -20.969900131225586, -20.290708541870117, -19.611515045166016, -18.932323455810547, -18.253131866455078, -17.57394027709961, -16.89474868774414, -16.21555519104004, -15.53636360168457, -14.857172012329102, -14.177979469299316, -13.498786926269531, -12.819595336914062, -12.140403747558594, -11.461211204528809, -10.782018661499023, -10.102827072143555, -9.423635482788086, -8.7444429397583, -8.065250396728516, -7.386058807373047, -6.70686674118042, -6.027674674987793, -5.348482608795166, -4.669290542602539, -3.990098476409912, -3.310906410217285, -2.631714344024658, -1.9525203704833984, -1.2733283042907715, -0.5941362380981445, 0.08505582809448242, 0.7642478942871094, 1.4434399604797363, 2.1226320266723633, 2.8018240928649902, 3.481016159057617, 4.160208225250244, 4.839400291442871, 5.518592357635498, 6.197784423828125, 6.876976490020752, 7.556168556213379, 8.235361099243164, 8.914552688598633, 9.593744277954102, 10.272936820983887, 10.952129364013672, 11.63132095336914, 12.31051254272461, 12.989705085754395, 13.66889762878418, 14.348089218139648, 15.027280807495117, 15.706473350524902, 16.385665893554688, 17.064857482910156, 17.744049072265625, 18.423240661621094, 19.102434158325195, 19.781625747680664]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 6.0, 4.0, 0.0, 4.0, 5.0, 14.0, 11.0, 14.0, 20.0, 19.0, 15.0, 22.0, 20.0, 17.0, 22.0, 30.0, 34.0, 36.0, 36.0, 42.0, 36.0, 45.0, 34.0, 52.0, 45.0, 35.0, 36.0, 37.0, 33.0, 38.0, 43.0, 22.0, 23.0, 28.0, 21.0, 24.0, 11.0, 16.0, 7.0, 12.0, 9.0, 5.0, 7.0, 2.0, 3.0, 5.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0], "bins": [-9.297547340393066, -9.032727241516113, -8.76790714263916, -8.50308609008789, -8.238265991210938, -7.973445892333984, -7.708625793457031, -7.44380521774292, -7.178984642028809, -6.9141645431518555, -6.649343967437744, -6.384523868560791, -6.11970329284668, -5.854883193969727, -5.590063095092773, -5.325242519378662, -5.060422420501709, -4.795602321624756, -4.5307817459106445, -4.265961647033691, -4.00114107131958, -3.736320972442627, -3.4715006351470947, -3.2066802978515625, -2.9418599605560303, -2.677039623260498, -2.412219285964966, -2.1473989486694336, -1.882578730583191, -1.6177583932876587, -1.352938175201416, -1.0881178379058838, -0.8232970237731934, -0.5584766864776611, -0.2936564087867737, -0.02883613109588623, 0.235984206199646, 0.5008045434951782, 0.7656247615814209, 1.0304450988769531, 1.2952654361724854, 1.5600857734680176, 1.8249061107635498, 2.089726448059082, 2.354546546936035, 2.6193671226501465, 2.8841872215270996, 3.149007558822632, 3.413827896118164, 3.6786482334136963, 3.9434685707092285, 4.208288669586182, 4.473109245300293, 4.737929344177246, 5.002749443054199, 5.2675700187683105, 5.532390594482422, 5.797210693359375, 6.062031269073486, 6.3268513679504395, 6.591671943664551, 6.856492042541504, 7.121312141418457, 7.386132717132568, 7.6509528160095215]}, "gradients/decoder.bert.encoder.layer.9.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 5.0, 5.0, 6.0, 12.0, 8.0, 17.0, 23.0, 41.0, 70.0, 119.0, 170.0, 288.0, 477.0, 720.0, 1336.0, 2351.0, 4611.0, 8922.0, 18858.0, 43168.0, 110209.0, 327936.0, 1085977.0, 1625663.0, 637327.0, 195985.0, 70854.0, 29499.0, 13714.0, 6708.0, 3741.0, 2057.0, 1240.0, 791.0, 457.0, 288.0, 183.0, 151.0, 94.0, 63.0, 41.0, 38.0, 18.0, 14.0, 15.0, 11.0, 7.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.609375, -17.927001953125, -17.24462890625, -16.562255859375, -15.8798828125, -15.197509765625, -14.51513671875, -13.832763671875, -13.150390625, -12.468017578125, -11.78564453125, -11.103271484375, -10.4208984375, -9.738525390625, -9.05615234375, -8.373779296875, -7.69140625, -7.009033203125, -6.32666015625, -5.644287109375, -4.9619140625, -4.279541015625, -3.59716796875, -2.914794921875, -2.232421875, -1.550048828125, -0.86767578125, -0.185302734375, 0.4970703125, 1.179443359375, 1.86181640625, 2.544189453125, 3.2265625, 3.908935546875, 4.59130859375, 5.273681640625, 5.9560546875, 6.638427734375, 7.32080078125, 8.003173828125, 8.685546875, 9.367919921875, 10.05029296875, 10.732666015625, 11.4150390625, 12.097412109375, 12.77978515625, 13.462158203125, 14.14453125, 14.826904296875, 15.50927734375, 16.191650390625, 16.8740234375, 17.556396484375, 18.23876953125, 18.921142578125, 19.603515625, 20.285888671875, 20.96826171875, 21.650634765625, 22.3330078125, 23.015380859375, 23.69775390625, 24.380126953125, 25.0625]}, "gradients/decoder.bert.encoder.layer.9.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 6.0, 4.0, 4.0, 7.0, 6.0, 13.0, 23.0, 12.0, 16.0, 25.0, 20.0, 23.0, 28.0, 34.0, 35.0, 39.0, 38.0, 43.0, 46.0, 54.0, 47.0, 33.0, 49.0, 47.0, 25.0, 39.0, 43.0, 30.0, 39.0, 27.0, 25.0, 28.0, 18.0, 10.0, 17.0, 12.0, 8.0, 6.0, 7.0, 8.0, 3.0, 5.0, 0.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-7.54296875, -7.31884765625, -7.0947265625, -6.87060546875, -6.646484375, -6.42236328125, -6.1982421875, -5.97412109375, -5.75, -5.52587890625, -5.3017578125, -5.07763671875, -4.853515625, -4.62939453125, -4.4052734375, -4.18115234375, -3.95703125, -3.73291015625, -3.5087890625, -3.28466796875, -3.060546875, -2.83642578125, -2.6123046875, -2.38818359375, -2.1640625, -1.93994140625, -1.7158203125, -1.49169921875, -1.267578125, -1.04345703125, -0.8193359375, -0.59521484375, -0.37109375, -0.14697265625, 0.0771484375, 0.30126953125, 0.525390625, 0.74951171875, 0.9736328125, 1.19775390625, 1.421875, 1.64599609375, 1.8701171875, 2.09423828125, 2.318359375, 2.54248046875, 2.7666015625, 2.99072265625, 3.21484375, 3.43896484375, 3.6630859375, 3.88720703125, 4.111328125, 4.33544921875, 4.5595703125, 4.78369140625, 5.0078125, 5.23193359375, 5.4560546875, 5.68017578125, 5.904296875, 6.12841796875, 6.3525390625, 6.57666015625, 6.80078125]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 7.0, 8.0, 7.0, 18.0, 17.0, 24.0, 46.0, 63.0, 84.0, 171.0, 231.0, 316.0, 472.0, 742.0, 1210.0, 1916.0, 2924.0, 4823.0, 8046.0, 13706.0, 24076.0, 44035.0, 85632.0, 176346.0, 383234.0, 816585.0, 1186880.0, 754978.0, 349520.0, 161950.0, 79347.0, 41379.0, 22513.0, 12708.0, 7594.0, 4516.0, 2915.0, 1762.0, 1204.0, 768.0, 486.0, 343.0, 216.0, 162.0, 103.0, 72.0, 45.0, 33.0, 24.0, 12.0, 14.0, 7.0, 5.0, 2.0, 1.0, 0.0, 2.0], "bins": [-17.734375, -17.2041015625, -16.673828125, -16.1435546875, -15.61328125, -15.0830078125, -14.552734375, -14.0224609375, -13.4921875, -12.9619140625, -12.431640625, -11.9013671875, -11.37109375, -10.8408203125, -10.310546875, -9.7802734375, -9.25, -8.7197265625, -8.189453125, -7.6591796875, -7.12890625, -6.5986328125, -6.068359375, -5.5380859375, -5.0078125, -4.4775390625, -3.947265625, -3.4169921875, -2.88671875, -2.3564453125, -1.826171875, -1.2958984375, -0.765625, -0.2353515625, 0.294921875, 0.8251953125, 1.35546875, 1.8857421875, 2.416015625, 2.9462890625, 3.4765625, 4.0068359375, 4.537109375, 5.0673828125, 5.59765625, 6.1279296875, 6.658203125, 7.1884765625, 7.71875, 8.2490234375, 8.779296875, 9.3095703125, 9.83984375, 10.3701171875, 10.900390625, 11.4306640625, 11.9609375, 12.4912109375, 13.021484375, 13.5517578125, 14.08203125, 14.6123046875, 15.142578125, 15.6728515625, 16.203125]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 5.0, 6.0, 8.0, 7.0, 11.0, 13.0, 19.0, 28.0, 30.0, 38.0, 44.0, 55.0, 68.0, 93.0, 121.0, 154.0, 190.0, 219.0, 288.0, 311.0, 348.0, 334.0, 302.0, 248.0, 241.0, 190.0, 137.0, 121.0, 86.0, 72.0, 60.0, 49.0, 42.0, 36.0, 21.0, 20.0, 10.0, 12.0, 15.0, 10.0, 4.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.86328125, -4.71044921875, -4.5576171875, -4.40478515625, -4.251953125, -4.09912109375, -3.9462890625, -3.79345703125, -3.640625, -3.48779296875, -3.3349609375, -3.18212890625, -3.029296875, -2.87646484375, -2.7236328125, -2.57080078125, -2.41796875, -2.26513671875, -2.1123046875, -1.95947265625, -1.806640625, -1.65380859375, -1.5009765625, -1.34814453125, -1.1953125, -1.04248046875, -0.8896484375, -0.73681640625, -0.583984375, -0.43115234375, -0.2783203125, -0.12548828125, 0.02734375, 0.18017578125, 0.3330078125, 0.48583984375, 0.638671875, 0.79150390625, 0.9443359375, 1.09716796875, 1.25, 1.40283203125, 1.5556640625, 1.70849609375, 1.861328125, 2.01416015625, 2.1669921875, 2.31982421875, 2.47265625, 2.62548828125, 2.7783203125, 2.93115234375, 3.083984375, 3.23681640625, 3.3896484375, 3.54248046875, 3.6953125, 3.84814453125, 4.0009765625, 4.15380859375, 4.306640625, 4.45947265625, 4.6123046875, 4.76513671875, 4.91796875]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 4.0, 2.0, 11.0, 3.0, 13.0, 16.0, 31.0, 27.0, 53.0, 75.0, 91.0, 112.0, 116.0, 112.0, 87.0, 73.0, 35.0, 38.0, 30.0, 17.0, 12.0, 11.0, 10.0, 7.0, 4.0, 1.0, 5.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0], "bins": [-38.19105911254883, -37.31455612182617, -36.438053131103516, -35.561546325683594, -34.68504333496094, -33.80854034423828, -32.932037353515625, -32.05553436279297, -31.17902946472168, -30.302526473999023, -29.426021575927734, -28.549518585205078, -27.673015594482422, -26.796510696411133, -25.920007705688477, -25.043502807617188, -24.16699981689453, -23.290496826171875, -22.413991928100586, -21.53748893737793, -20.66098403930664, -19.784481048583984, -18.907978057861328, -18.031475067138672, -17.154970169067383, -16.278467178344727, -15.401962280273438, -14.525459289550781, -13.648955345153809, -12.772451400756836, -11.89594841003418, -11.019444465637207, -10.142940521240234, -9.266436576843262, -8.389932632446289, -7.513429641723633, -6.63692569732666, -5.7604217529296875, -4.883918285369873, -4.007414817810059, -3.130910873413086, -2.2544071674346924, -1.3779034614562988, -0.5013997554779053, 0.3751039505004883, 1.251607894897461, 2.1281113624572754, 3.00461483001709, 3.8811187744140625, 4.757622718811035, 5.63412618637085, 6.510629653930664, 7.387133598327637, 8.26363754272461, 9.140140533447266, 10.016644477844238, 10.893148422241211, 11.769652366638184, 12.646156311035156, 13.522659301757812, 14.399163246154785, 15.275667190551758, 16.152170181274414, 17.028675079345703, 17.90517807006836]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 5.0, 5.0, 7.0, 4.0, 10.0, 11.0, 8.0, 9.0, 10.0, 18.0, 17.0, 23.0, 19.0, 22.0, 27.0, 29.0, 31.0, 40.0, 48.0, 32.0, 34.0, 40.0, 49.0, 45.0, 36.0, 43.0, 38.0, 46.0, 35.0, 35.0, 26.0, 37.0, 35.0, 19.0, 17.0, 18.0, 17.0, 26.0, 7.0, 8.0, 7.0, 5.0, 3.0, 1.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-9.3289213180542, -9.054272651672363, -8.779623031616211, -8.504974365234375, -8.230324745178223, -7.9556756019592285, -7.681026458740234, -7.406377792358398, -7.131728172302246, -6.857079029083252, -6.582429885864258, -6.307780742645264, -6.0331315994262695, -5.758482456207275, -5.483833312988281, -5.209184646606445, -4.934535503387451, -4.659886360168457, -4.385237216949463, -4.110588073730469, -3.8359389305114746, -3.5612897872924805, -3.2866408824920654, -3.0119917392730713, -2.737342596054077, -2.462693452835083, -2.188044309616089, -1.9133952856063843, -1.6387461423873901, -1.364096999168396, -1.0894479751586914, -0.8147988319396973, -0.5401496887207031, -0.26550057530403137, 0.00914853811264038, 0.28379762172698975, 0.5584467649459839, 0.833095908164978, 1.1077449321746826, 1.3823940753936768, 1.657043218612671, 1.931692361831665, 2.206341505050659, 2.480990409851074, 2.7556395530700684, 3.0302886962890625, 3.3049378395080566, 3.579586982727051, 3.854236125946045, 4.128885269165039, 4.403534412384033, 4.678183555603027, 4.9528326988220215, 5.227481842041016, 5.502130508422852, 5.776780128479004, 6.05142879486084, 6.326077938079834, 6.600727081298828, 6.875376224517822, 7.150025367736816, 7.4246745109558105, 7.699323654174805, 7.973972320556641, 8.248621940612793]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 3.0, 5.0, 10.0, 10.0, 14.0, 37.0, 53.0, 70.0, 120.0, 195.0, 305.0, 555.0, 1064.0, 2255.0, 5258.0, 15145.0, 50234.0, 176845.0, 413819.0, 266978.0, 79216.0, 22817.0, 7574.0, 2955.0, 1436.0, 653.0, 366.0, 214.0, 118.0, 80.0, 56.0, 40.0, 21.0, 12.0, 11.0, 8.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-16.890625, -16.417236328125, -15.94384765625, -15.470458984375, -14.9970703125, -14.523681640625, -14.05029296875, -13.576904296875, -13.103515625, -12.630126953125, -12.15673828125, -11.683349609375, -11.2099609375, -10.736572265625, -10.26318359375, -9.789794921875, -9.31640625, -8.843017578125, -8.36962890625, -7.896240234375, -7.4228515625, -6.949462890625, -6.47607421875, -6.002685546875, -5.529296875, -5.055908203125, -4.58251953125, -4.109130859375, -3.6357421875, -3.162353515625, -2.68896484375, -2.215576171875, -1.7421875, -1.268798828125, -0.79541015625, -0.322021484375, 0.1513671875, 0.624755859375, 1.09814453125, 1.571533203125, 2.044921875, 2.518310546875, 2.99169921875, 3.465087890625, 3.9384765625, 4.411865234375, 4.88525390625, 5.358642578125, 5.83203125, 6.305419921875, 6.77880859375, 7.252197265625, 7.7255859375, 8.198974609375, 8.67236328125, 9.145751953125, 9.619140625, 10.092529296875, 10.56591796875, 11.039306640625, 11.5126953125, 11.986083984375, 12.45947265625, 12.932861328125, 13.40625]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 8.0, 3.0, 8.0, 7.0, 18.0, 12.0, 16.0, 13.0, 19.0, 30.0, 32.0, 42.0, 34.0, 60.0, 46.0, 53.0, 56.0, 52.0, 59.0, 65.0, 55.0, 56.0, 45.0, 37.0, 34.0, 24.0, 32.0, 20.0, 18.0, 14.0, 9.0, 13.0, 6.0, 6.0, 5.0, 4.0, 1.0, 0.0, 0.0, 3.0], "bins": [-17.0625, -16.653076171875, -16.24365234375, -15.834228515625, -15.4248046875, -15.015380859375, -14.60595703125, -14.196533203125, -13.787109375, -13.377685546875, -12.96826171875, -12.558837890625, -12.1494140625, -11.739990234375, -11.33056640625, -10.921142578125, -10.51171875, -10.102294921875, -9.69287109375, -9.283447265625, -8.8740234375, -8.464599609375, -8.05517578125, -7.645751953125, -7.236328125, -6.826904296875, -6.41748046875, -6.008056640625, -5.5986328125, -5.189208984375, -4.77978515625, -4.370361328125, -3.9609375, -3.551513671875, -3.14208984375, -2.732666015625, -2.3232421875, -1.913818359375, -1.50439453125, -1.094970703125, -0.685546875, -0.276123046875, 0.13330078125, 0.542724609375, 0.9521484375, 1.361572265625, 1.77099609375, 2.180419921875, 2.58984375, 2.999267578125, 3.40869140625, 3.818115234375, 4.2275390625, 4.636962890625, 5.04638671875, 5.455810546875, 5.865234375, 6.274658203125, 6.68408203125, 7.093505859375, 7.5029296875, 7.912353515625, 8.32177734375, 8.731201171875, 9.140625]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 6.0, 5.0, 5.0, 6.0, 9.0, 15.0, 12.0, 20.0, 23.0, 49.0, 71.0, 107.0, 159.0, 351.0, 615.0, 1276.0, 2883.0, 7822.0, 24596.0, 98487.0, 404364.0, 381388.0, 90681.0, 22760.0, 7342.0, 2798.0, 1310.0, 629.0, 289.0, 171.0, 111.0, 72.0, 38.0, 27.0, 21.0, 9.0, 10.0, 7.0, 7.0, 5.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.546875, -18.915771484375, -18.28466796875, -17.653564453125, -17.0224609375, -16.391357421875, -15.76025390625, -15.129150390625, -14.498046875, -13.866943359375, -13.23583984375, -12.604736328125, -11.9736328125, -11.342529296875, -10.71142578125, -10.080322265625, -9.44921875, -8.818115234375, -8.18701171875, -7.555908203125, -6.9248046875, -6.293701171875, -5.66259765625, -5.031494140625, -4.400390625, -3.769287109375, -3.13818359375, -2.507080078125, -1.8759765625, -1.244873046875, -0.61376953125, 0.017333984375, 0.6484375, 1.279541015625, 1.91064453125, 2.541748046875, 3.1728515625, 3.803955078125, 4.43505859375, 5.066162109375, 5.697265625, 6.328369140625, 6.95947265625, 7.590576171875, 8.2216796875, 8.852783203125, 9.48388671875, 10.114990234375, 10.74609375, 11.377197265625, 12.00830078125, 12.639404296875, 13.2705078125, 13.901611328125, 14.53271484375, 15.163818359375, 15.794921875, 16.426025390625, 17.05712890625, 17.688232421875, 18.3193359375, 18.950439453125, 19.58154296875, 20.212646484375, 20.84375]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 1.0, 4.0, 6.0, 9.0, 11.0, 15.0, 14.0, 14.0, 18.0, 16.0, 19.0, 26.0, 30.0, 31.0, 49.0, 41.0, 46.0, 32.0, 44.0, 44.0, 43.0, 43.0, 43.0, 36.0, 51.0, 33.0, 40.0, 30.0, 29.0, 28.0, 21.0, 20.0, 24.0, 16.0, 9.0, 18.0, 13.0, 9.0, 5.0, 6.0, 6.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0], "bins": [-6.671875, -6.48162841796875, -6.2913818359375, -6.10113525390625, -5.910888671875, -5.72064208984375, -5.5303955078125, -5.34014892578125, -5.14990234375, -4.95965576171875, -4.7694091796875, -4.57916259765625, -4.388916015625, -4.19866943359375, -4.0084228515625, -3.81817626953125, -3.6279296875, -3.43768310546875, -3.2474365234375, -3.05718994140625, -2.866943359375, -2.67669677734375, -2.4864501953125, -2.29620361328125, -2.10595703125, -1.91571044921875, -1.7254638671875, -1.53521728515625, -1.344970703125, -1.15472412109375, -0.9644775390625, -0.77423095703125, -0.583984375, -0.39373779296875, -0.2034912109375, -0.01324462890625, 0.177001953125, 0.36724853515625, 0.5574951171875, 0.74774169921875, 0.93798828125, 1.12823486328125, 1.3184814453125, 1.50872802734375, 1.698974609375, 1.88922119140625, 2.0794677734375, 2.26971435546875, 2.4599609375, 2.65020751953125, 2.8404541015625, 3.03070068359375, 3.220947265625, 3.41119384765625, 3.6014404296875, 3.79168701171875, 3.98193359375, 4.17218017578125, 4.3624267578125, 4.55267333984375, 4.742919921875, 4.93316650390625, 5.1234130859375, 5.31365966796875, 5.50390625]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 8.0, 17.0, 15.0, 21.0, 27.0, 33.0, 68.0, 93.0, 143.0, 205.0, 307.0, 421.0, 689.0, 1165.0, 1896.0, 3400.0, 6954.0, 16396.0, 47058.0, 171195.0, 480213.0, 222109.0, 59135.0, 19661.0, 7926.0, 3963.0, 2142.0, 1207.0, 683.0, 449.0, 306.0, 220.0, 142.0, 92.0, 54.0, 42.0, 29.0, 22.0, 24.0, 11.0, 6.0, 4.0, 3.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.3671875, -6.1656494140625, -5.964111328125, -5.7625732421875, -5.56103515625, -5.3594970703125, -5.157958984375, -4.9564208984375, -4.7548828125, -4.5533447265625, -4.351806640625, -4.1502685546875, -3.94873046875, -3.7471923828125, -3.545654296875, -3.3441162109375, -3.142578125, -2.9410400390625, -2.739501953125, -2.5379638671875, -2.33642578125, -2.1348876953125, -1.933349609375, -1.7318115234375, -1.5302734375, -1.3287353515625, -1.127197265625, -0.9256591796875, -0.72412109375, -0.5225830078125, -0.321044921875, -0.1195068359375, 0.08203125, 0.2835693359375, 0.485107421875, 0.6866455078125, 0.88818359375, 1.0897216796875, 1.291259765625, 1.4927978515625, 1.6943359375, 1.8958740234375, 2.097412109375, 2.2989501953125, 2.50048828125, 2.7020263671875, 2.903564453125, 3.1051025390625, 3.306640625, 3.5081787109375, 3.709716796875, 3.9112548828125, 4.11279296875, 4.3143310546875, 4.515869140625, 4.7174072265625, 4.9189453125, 5.1204833984375, 5.322021484375, 5.5235595703125, 5.72509765625, 5.9266357421875, 6.128173828125, 6.3297119140625, 6.53125]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 6.0, 4.0, 8.0, 10.0, 17.0, 27.0, 32.0, 55.0, 70.0, 90.0, 113.0, 109.0, 94.0, 77.0, 86.0, 57.0, 39.0, 37.0, 18.0, 9.0, 16.0, 14.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0005025863647460938, -0.0004896000027656555, -0.0004766136407852173, -0.00046362727880477905, -0.0004506409168243408, -0.0004376545548439026, -0.00042466819286346436, -0.0004116818308830261, -0.0003986954689025879, -0.00038570910692214966, -0.0003727227449417114, -0.0003597363829612732, -0.00034675002098083496, -0.00033376365900039673, -0.0003207772970199585, -0.00030779093503952026, -0.00029480457305908203, -0.0002818182110786438, -0.00026883184909820557, -0.00025584548711776733, -0.0002428591251373291, -0.00022987276315689087, -0.00021688640117645264, -0.0002039000391960144, -0.00019091367721557617, -0.00017792731523513794, -0.0001649409532546997, -0.00015195459127426147, -0.00013896822929382324, -0.000125981867313385, -0.00011299550533294678, -0.00010000914335250854, -8.702278137207031e-05, -7.403641939163208e-05, -6.105005741119385e-05, -4.8063695430755615e-05, -3.507733345031738e-05, -2.209097146987915e-05, -9.104609489440918e-06, 3.8817524909973145e-06, 1.6868114471435547e-05, 2.985447645187378e-05, 4.284083843231201e-05, 5.5827200412750244e-05, 6.881356239318848e-05, 8.179992437362671e-05, 9.478628635406494e-05, 0.00010777264833450317, 0.0001207590103149414, 0.00013374537229537964, 0.00014673173427581787, 0.0001597180962562561, 0.00017270445823669434, 0.00018569082021713257, 0.0001986771821975708, 0.00021166354417800903, 0.00022464990615844727, 0.0002376362681388855, 0.00025062263011932373, 0.00026360899209976196, 0.0002765953540802002, 0.00028958171606063843, 0.00030256807804107666, 0.0003155544400215149, 0.0003285408020019531]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 6.0, 3.0, 5.0, 4.0, 10.0, 12.0, 16.0, 20.0, 31.0, 30.0, 64.0, 75.0, 100.0, 150.0, 224.0, 275.0, 419.0, 539.0, 855.0, 1330.0, 2193.0, 3606.0, 6689.0, 15235.0, 40528.0, 129877.0, 357099.0, 318907.0, 107146.0, 34413.0, 13311.0, 6193.0, 3326.0, 1939.0, 1243.0, 818.0, 534.0, 388.0, 250.0, 227.0, 111.0, 87.0, 69.0, 66.0, 30.0, 33.0, 22.0, 21.0, 14.0, 8.0, 8.0, 2.0, 4.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.5390625, -5.35394287109375, -5.1688232421875, -4.98370361328125, -4.798583984375, -4.61346435546875, -4.4283447265625, -4.24322509765625, -4.05810546875, -3.87298583984375, -3.6878662109375, -3.50274658203125, -3.317626953125, -3.13250732421875, -2.9473876953125, -2.76226806640625, -2.5771484375, -2.39202880859375, -2.2069091796875, -2.02178955078125, -1.836669921875, -1.65155029296875, -1.4664306640625, -1.28131103515625, -1.09619140625, -0.91107177734375, -0.7259521484375, -0.54083251953125, -0.355712890625, -0.17059326171875, 0.0145263671875, 0.19964599609375, 0.384765625, 0.56988525390625, 0.7550048828125, 0.94012451171875, 1.125244140625, 1.31036376953125, 1.4954833984375, 1.68060302734375, 1.86572265625, 2.05084228515625, 2.2359619140625, 2.42108154296875, 2.606201171875, 2.79132080078125, 2.9764404296875, 3.16156005859375, 3.3466796875, 3.53179931640625, 3.7169189453125, 3.90203857421875, 4.087158203125, 4.27227783203125, 4.4573974609375, 4.64251708984375, 4.82763671875, 5.01275634765625, 5.1978759765625, 5.38299560546875, 5.568115234375, 5.75323486328125, 5.9383544921875, 6.12347412109375, 6.30859375]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 5.0, 4.0, 9.0, 3.0, 11.0, 16.0, 38.0, 44.0, 95.0, 131.0, 168.0, 177.0, 112.0, 87.0, 51.0, 26.0, 11.0, 5.0, 5.0, 3.0, 2.0, 0.0, 6.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.619140625, -2.54425048828125, -2.4693603515625, -2.39447021484375, -2.319580078125, -2.24468994140625, -2.1697998046875, -2.09490966796875, -2.02001953125, -1.94512939453125, -1.8702392578125, -1.79534912109375, -1.720458984375, -1.64556884765625, -1.5706787109375, -1.49578857421875, -1.4208984375, -1.34600830078125, -1.2711181640625, -1.19622802734375, -1.121337890625, -1.04644775390625, -0.9715576171875, -0.89666748046875, -0.82177734375, -0.74688720703125, -0.6719970703125, -0.59710693359375, -0.522216796875, -0.44732666015625, -0.3724365234375, -0.29754638671875, -0.22265625, -0.14776611328125, -0.0728759765625, 0.00201416015625, 0.076904296875, 0.15179443359375, 0.2266845703125, 0.30157470703125, 0.37646484375, 0.45135498046875, 0.5262451171875, 0.60113525390625, 0.676025390625, 0.75091552734375, 0.8258056640625, 0.90069580078125, 0.9755859375, 1.05047607421875, 1.1253662109375, 1.20025634765625, 1.275146484375, 1.35003662109375, 1.4249267578125, 1.49981689453125, 1.57470703125, 1.64959716796875, 1.7244873046875, 1.79937744140625, 1.874267578125, 1.94915771484375, 2.0240478515625, 2.09893798828125, 2.173828125]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 2.0, 6.0, 5.0, 9.0, 10.0, 22.0, 20.0, 41.0, 46.0, 89.0, 96.0, 115.0, 127.0, 106.0, 82.0, 63.0, 41.0, 37.0, 23.0, 13.0, 11.0, 11.0, 10.0, 3.0, 4.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-39.90776824951172, -39.006874084472656, -38.10598373413086, -37.2050895690918, -36.30419921875, -35.40330505371094, -34.502410888671875, -33.60152053833008, -32.700626373291016, -31.799734115600586, -30.898841857910156, -29.997947692871094, -29.097055435180664, -28.196163177490234, -27.295270919799805, -26.394378662109375, -25.493486404418945, -24.592594146728516, -23.691701889038086, -22.790809631347656, -21.889915466308594, -20.989023208618164, -20.088130950927734, -19.187238693237305, -18.286346435546875, -17.385454177856445, -16.484561920166016, -15.58366870880127, -14.682775497436523, -13.781883239746094, -12.880990982055664, -11.980098724365234, -11.079206466674805, -10.178314208984375, -9.277420997619629, -8.3765287399292, -7.475636005401611, -6.574743270874023, -5.673851013183594, -4.772958278656006, -3.872065544128418, -2.97117280960083, -2.0702803134918213, -1.1693878173828125, -0.2684950828552246, 0.6323976516723633, 1.533289909362793, 2.434182643890381, 3.3350753784179688, 4.235968112945557, 5.1368608474731445, 6.037753105163574, 6.938645839691162, 7.83953857421875, 8.74043083190918, 9.64132308959961, 10.542216300964355, 11.443108558654785, 12.344001770019531, 13.244894027709961, 14.14578628540039, 15.046679496765137, 15.947571754455566, 16.848464965820312, 17.749357223510742]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 7.0, 5.0, 6.0, 7.0, 14.0, 4.0, 14.0, 11.0, 15.0, 23.0, 18.0, 20.0, 23.0, 31.0, 33.0, 31.0, 44.0, 35.0, 39.0, 34.0, 47.0, 51.0, 43.0, 42.0, 37.0, 41.0, 47.0, 35.0, 26.0, 40.0, 30.0, 27.0, 20.0, 20.0, 18.0, 22.0, 14.0, 8.0, 8.0, 5.0, 2.0, 3.0, 6.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0], "bins": [-9.776090621948242, -9.494546890258789, -9.213003158569336, -8.931458473205566, -8.649914741516113, -8.36837100982666, -8.086827278137207, -7.805283546447754, -7.523739337921143, -7.2421956062316895, -6.960651397705078, -6.679107666015625, -6.397563934326172, -6.1160197257995605, -5.834475994110107, -5.552931785583496, -5.271388053894043, -4.98984432220459, -4.7083001136779785, -4.426756381988525, -4.145212173461914, -3.863668441772461, -3.582124710083008, -3.3005807399749756, -3.0190367698669434, -2.737492799758911, -2.455948829650879, -2.174405097961426, -1.8928611278533936, -1.6113171577453613, -1.3297733068466187, -1.048229455947876, -0.7666854858398438, -0.4851415753364563, -0.20359766483306885, 0.0779462456703186, 0.35949015617370605, 0.6410341262817383, 0.922577977180481, 1.2041218280792236, 1.4856657981872559, 1.767209768295288, 2.0487537384033203, 2.3302974700927734, 2.6118414402008057, 2.893385410308838, 3.174929141998291, 3.4564731121063232, 3.7380170822143555, 4.019560813903809, 4.30110502243042, 4.582648754119873, 4.864192962646484, 5.1457366943359375, 5.427280426025391, 5.708824157714844, 5.990368366241455, 6.271912097930908, 6.5534563064575195, 6.835000038146973, 7.116543769836426, 7.398087978363037, 7.67963171005249, 7.961175918579102, 8.242719650268555]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.weight": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 5.0, 2.0, 2.0, 6.0, 13.0, 15.0, 32.0, 45.0, 48.0, 89.0, 154.0, 238.0, 450.0, 797.0, 1456.0, 2866.0, 5613.0, 11546.0, 24004.0, 50536.0, 103317.0, 188922.0, 247354.0, 196393.0, 109881.0, 54203.0, 25473.0, 12509.0, 5952.0, 3065.0, 1583.0, 848.0, 420.0, 291.0, 152.0, 102.0, 53.0, 38.0, 24.0, 24.0, 14.0, 4.0, 9.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.546875, -15.98681640625, -15.4267578125, -14.86669921875, -14.306640625, -13.74658203125, -13.1865234375, -12.62646484375, -12.06640625, -11.50634765625, -10.9462890625, -10.38623046875, -9.826171875, -9.26611328125, -8.7060546875, -8.14599609375, -7.5859375, -7.02587890625, -6.4658203125, -5.90576171875, -5.345703125, -4.78564453125, -4.2255859375, -3.66552734375, -3.10546875, -2.54541015625, -1.9853515625, -1.42529296875, -0.865234375, -0.30517578125, 0.2548828125, 0.81494140625, 1.375, 1.93505859375, 2.4951171875, 3.05517578125, 3.615234375, 4.17529296875, 4.7353515625, 5.29541015625, 5.85546875, 6.41552734375, 6.9755859375, 7.53564453125, 8.095703125, 8.65576171875, 9.2158203125, 9.77587890625, 10.3359375, 10.89599609375, 11.4560546875, 12.01611328125, 12.576171875, 13.13623046875, 13.6962890625, 14.25634765625, 14.81640625, 15.37646484375, 15.9365234375, 16.49658203125, 17.056640625, 17.61669921875, 18.1767578125, 18.73681640625, 19.296875]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 5.0, 7.0, 8.0, 5.0, 11.0, 11.0, 8.0, 10.0, 11.0, 20.0, 20.0, 30.0, 29.0, 38.0, 28.0, 43.0, 40.0, 42.0, 56.0, 37.0, 46.0, 52.0, 43.0, 51.0, 41.0, 47.0, 39.0, 32.0, 25.0, 35.0, 19.0, 19.0, 18.0, 20.0, 11.0, 16.0, 10.0, 1.0, 5.0, 6.0, 2.0, 3.0, 2.0, 0.0, 4.0, 3.0, 0.0, 2.0], "bins": [-11.8515625, -11.52685546875, -11.2021484375, -10.87744140625, -10.552734375, -10.22802734375, -9.9033203125, -9.57861328125, -9.25390625, -8.92919921875, -8.6044921875, -8.27978515625, -7.955078125, -7.63037109375, -7.3056640625, -6.98095703125, -6.65625, -6.33154296875, -6.0068359375, -5.68212890625, -5.357421875, -5.03271484375, -4.7080078125, -4.38330078125, -4.05859375, -3.73388671875, -3.4091796875, -3.08447265625, -2.759765625, -2.43505859375, -2.1103515625, -1.78564453125, -1.4609375, -1.13623046875, -0.8115234375, -0.48681640625, -0.162109375, 0.16259765625, 0.4873046875, 0.81201171875, 1.13671875, 1.46142578125, 1.7861328125, 2.11083984375, 2.435546875, 2.76025390625, 3.0849609375, 3.40966796875, 3.734375, 4.05908203125, 4.3837890625, 4.70849609375, 5.033203125, 5.35791015625, 5.6826171875, 6.00732421875, 6.33203125, 6.65673828125, 6.9814453125, 7.30615234375, 7.630859375, 7.95556640625, 8.2802734375, 8.60498046875, 8.9296875]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 7.0, 11.0, 10.0, 18.0, 19.0, 29.0, 56.0, 55.0, 90.0, 140.0, 189.0, 327.0, 580.0, 1021.0, 1930.0, 3927.0, 8354.0, 18775.0, 44059.0, 104956.0, 219089.0, 288103.0, 197087.0, 91017.0, 37880.0, 16077.0, 7237.0, 3446.0, 1721.0, 924.0, 495.0, 351.0, 173.0, 126.0, 81.0, 54.0, 41.0, 35.0, 13.0, 17.0, 13.0, 3.0, 10.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.40625, -20.702392578125, -19.99853515625, -19.294677734375, -18.5908203125, -17.886962890625, -17.18310546875, -16.479248046875, -15.775390625, -15.071533203125, -14.36767578125, -13.663818359375, -12.9599609375, -12.256103515625, -11.55224609375, -10.848388671875, -10.14453125, -9.440673828125, -8.73681640625, -8.032958984375, -7.3291015625, -6.625244140625, -5.92138671875, -5.217529296875, -4.513671875, -3.809814453125, -3.10595703125, -2.402099609375, -1.6982421875, -0.994384765625, -0.29052734375, 0.413330078125, 1.1171875, 1.821044921875, 2.52490234375, 3.228759765625, 3.9326171875, 4.636474609375, 5.34033203125, 6.044189453125, 6.748046875, 7.451904296875, 8.15576171875, 8.859619140625, 9.5634765625, 10.267333984375, 10.97119140625, 11.675048828125, 12.37890625, 13.082763671875, 13.78662109375, 14.490478515625, 15.1943359375, 15.898193359375, 16.60205078125, 17.305908203125, 18.009765625, 18.713623046875, 19.41748046875, 20.121337890625, 20.8251953125, 21.529052734375, 22.23291015625, 22.936767578125, 23.640625]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 7.0, 8.0, 7.0, 7.0, 6.0, 7.0, 17.0, 9.0, 16.0, 13.0, 17.0, 20.0, 17.0, 25.0, 24.0, 28.0, 36.0, 31.0, 36.0, 36.0, 46.0, 45.0, 38.0, 38.0, 55.0, 40.0, 32.0, 38.0, 38.0, 37.0, 35.0, 31.0, 25.0, 29.0, 14.0, 8.0, 20.0, 11.0, 7.0, 12.0, 10.0, 10.0, 7.0, 8.0, 2.0, 5.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-6.23046875, -6.0467529296875, -5.863037109375, -5.6793212890625, -5.49560546875, -5.3118896484375, -5.128173828125, -4.9444580078125, -4.7607421875, -4.5770263671875, -4.393310546875, -4.2095947265625, -4.02587890625, -3.8421630859375, -3.658447265625, -3.4747314453125, -3.291015625, -3.1072998046875, -2.923583984375, -2.7398681640625, -2.55615234375, -2.3724365234375, -2.188720703125, -2.0050048828125, -1.8212890625, -1.6375732421875, -1.453857421875, -1.2701416015625, -1.08642578125, -0.9027099609375, -0.718994140625, -0.5352783203125, -0.3515625, -0.1678466796875, 0.015869140625, 0.1995849609375, 0.38330078125, 0.5670166015625, 0.750732421875, 0.9344482421875, 1.1181640625, 1.3018798828125, 1.485595703125, 1.6693115234375, 1.85302734375, 2.0367431640625, 2.220458984375, 2.4041748046875, 2.587890625, 2.7716064453125, 2.955322265625, 3.1390380859375, 3.32275390625, 3.5064697265625, 3.690185546875, 3.8739013671875, 4.0576171875, 4.2413330078125, 4.425048828125, 4.6087646484375, 4.79248046875, 4.9761962890625, 5.159912109375, 5.3436279296875, 5.52734375]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 2.0, 1.0, 2.0, 4.0, 7.0, 3.0, 8.0, 15.0, 19.0, 22.0, 38.0, 46.0, 53.0, 74.0, 102.0, 110.0, 168.0, 241.0, 283.0, 426.0, 623.0, 874.0, 1443.0, 2382.0, 4263.0, 8620.0, 20976.0, 64914.0, 225792.0, 429849.0, 194578.0, 55772.0, 18536.0, 7800.0, 3842.0, 2255.0, 1311.0, 946.0, 543.0, 443.0, 288.0, 222.0, 165.0, 127.0, 110.0, 58.0, 43.0, 39.0, 32.0, 28.0, 26.0, 9.0, 8.0, 9.0, 4.0, 6.0, 1.0, 0.0, 7.0, 1.0, 1.0], "bins": [-11.8671875, -11.5013427734375, -11.135498046875, -10.7696533203125, -10.40380859375, -10.0379638671875, -9.672119140625, -9.3062744140625, -8.9404296875, -8.5745849609375, -8.208740234375, -7.8428955078125, -7.47705078125, -7.1112060546875, -6.745361328125, -6.3795166015625, -6.013671875, -5.6478271484375, -5.281982421875, -4.9161376953125, -4.55029296875, -4.1844482421875, -3.818603515625, -3.4527587890625, -3.0869140625, -2.7210693359375, -2.355224609375, -1.9893798828125, -1.62353515625, -1.2576904296875, -0.891845703125, -0.5260009765625, -0.16015625, 0.2056884765625, 0.571533203125, 0.9373779296875, 1.30322265625, 1.6690673828125, 2.034912109375, 2.4007568359375, 2.7666015625, 3.1324462890625, 3.498291015625, 3.8641357421875, 4.22998046875, 4.5958251953125, 4.961669921875, 5.3275146484375, 5.693359375, 6.0592041015625, 6.425048828125, 6.7908935546875, 7.15673828125, 7.5225830078125, 7.888427734375, 8.2542724609375, 8.6201171875, 8.9859619140625, 9.351806640625, 9.7176513671875, 10.08349609375, 10.4493408203125, 10.815185546875, 11.1810302734375, 11.546875]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 14.0, 8.0, 12.0, 22.0, 41.0, 68.0, 91.0, 165.0, 168.0, 149.0, 100.0, 52.0, 55.0, 21.0, 18.0, 7.0, 2.0, 6.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014905929565429688, -0.00144977867603302, -0.0014089643955230713, -0.0013681501150131226, -0.0013273358345031738, -0.001286521553993225, -0.0012457072734832764, -0.0012048929929733276, -0.001164078712463379, -0.0011232644319534302, -0.0010824501514434814, -0.0010416358709335327, -0.001000821590423584, -0.0009600073099136353, -0.0009191930294036865, -0.0008783787488937378, -0.0008375644683837891, -0.0007967501878738403, -0.0007559359073638916, -0.0007151216268539429, -0.0006743073463439941, -0.0006334930658340454, -0.0005926787853240967, -0.000551864504814148, -0.0005110502243041992, -0.0004702359437942505, -0.00042942166328430176, -0.00038860738277435303, -0.0003477931022644043, -0.00030697882175445557, -0.00026616454124450684, -0.0002253502607345581, -0.00018453598022460938, -0.00014372169971466064, -0.00010290741920471191, -6.209313869476318e-05, -2.1278858184814453e-05, 1.9535422325134277e-05, 6.034970283508301e-05, 0.00010116398334503174, 0.00014197826385498047, 0.0001827925443649292, 0.00022360682487487793, 0.00026442110538482666, 0.0003052353858947754, 0.0003460496664047241, 0.00038686394691467285, 0.0004276782274246216, 0.0004684925079345703, 0.000509306788444519, 0.0005501210689544678, 0.0005909353494644165, 0.0006317496299743652, 0.000672563910484314, 0.0007133781909942627, 0.0007541924715042114, 0.0007950067520141602, 0.0008358210325241089, 0.0008766353130340576, 0.0009174495935440063, 0.0009582638740539551, 0.0009990781545639038, 0.0010398924350738525, 0.0010807067155838013, 0.00112152099609375]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 3.0, 4.0, 6.0, 8.0, 16.0, 12.0, 22.0, 37.0, 46.0, 44.0, 89.0, 136.0, 180.0, 231.0, 418.0, 562.0, 821.0, 1368.0, 1978.0, 3287.0, 6058.0, 12177.0, 28387.0, 70832.0, 179841.0, 326344.0, 240420.0, 100873.0, 39283.0, 16283.0, 7705.0, 4146.0, 2325.0, 1562.0, 984.0, 641.0, 452.0, 299.0, 210.0, 122.0, 109.0, 72.0, 46.0, 33.0, 31.0, 18.0, 12.0, 9.0, 8.0, 4.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.83203125, -7.56817626953125, -7.3043212890625, -7.04046630859375, -6.776611328125, -6.51275634765625, -6.2489013671875, -5.98504638671875, -5.72119140625, -5.45733642578125, -5.1934814453125, -4.92962646484375, -4.665771484375, -4.40191650390625, -4.1380615234375, -3.87420654296875, -3.6103515625, -3.34649658203125, -3.0826416015625, -2.81878662109375, -2.554931640625, -2.29107666015625, -2.0272216796875, -1.76336669921875, -1.49951171875, -1.23565673828125, -0.9718017578125, -0.70794677734375, -0.444091796875, -0.18023681640625, 0.0836181640625, 0.34747314453125, 0.611328125, 0.87518310546875, 1.1390380859375, 1.40289306640625, 1.666748046875, 1.93060302734375, 2.1944580078125, 2.45831298828125, 2.72216796875, 2.98602294921875, 3.2498779296875, 3.51373291015625, 3.777587890625, 4.04144287109375, 4.3052978515625, 4.56915283203125, 4.8330078125, 5.09686279296875, 5.3607177734375, 5.62457275390625, 5.888427734375, 6.15228271484375, 6.4161376953125, 6.67999267578125, 6.94384765625, 7.20770263671875, 7.4715576171875, 7.73541259765625, 7.999267578125, 8.26312255859375, 8.5269775390625, 8.79083251953125, 9.0546875]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 2.0, 2.0, 4.0, 2.0, 3.0, 8.0, 14.0, 20.0, 35.0, 46.0, 70.0, 69.0, 87.0, 111.0, 126.0, 104.0, 89.0, 61.0, 44.0, 26.0, 25.0, 20.0, 13.0, 3.0, 4.0, 1.0, 5.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.08984375, -2.9906005859375, -2.891357421875, -2.7921142578125, -2.69287109375, -2.5936279296875, -2.494384765625, -2.3951416015625, -2.2958984375, -2.1966552734375, -2.097412109375, -1.9981689453125, -1.89892578125, -1.7996826171875, -1.700439453125, -1.6011962890625, -1.501953125, -1.4027099609375, -1.303466796875, -1.2042236328125, -1.10498046875, -1.0057373046875, -0.906494140625, -0.8072509765625, -0.7080078125, -0.6087646484375, -0.509521484375, -0.4102783203125, -0.31103515625, -0.2117919921875, -0.112548828125, -0.0133056640625, 0.0859375, 0.1851806640625, 0.284423828125, 0.3836669921875, 0.48291015625, 0.5821533203125, 0.681396484375, 0.7806396484375, 0.8798828125, 0.9791259765625, 1.078369140625, 1.1776123046875, 1.27685546875, 1.3760986328125, 1.475341796875, 1.5745849609375, 1.673828125, 1.7730712890625, 1.872314453125, 1.9715576171875, 2.07080078125, 2.1700439453125, 2.269287109375, 2.3685302734375, 2.4677734375, 2.5670166015625, 2.666259765625, 2.7655029296875, 2.86474609375, 2.9639892578125, 3.063232421875, 3.1624755859375, 3.26171875]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 5.0, 6.0, 7.0, 9.0, 11.0, 12.0, 24.0, 48.0, 50.0, 68.0, 77.0, 133.0, 125.0, 111.0, 71.0, 85.0, 41.0, 33.0, 21.0, 20.0, 16.0, 10.0, 5.0, 5.0, 5.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-36.806739807128906, -35.895565032958984, -34.98439025878906, -34.07321548461914, -33.16204071044922, -32.2508659362793, -31.339691162109375, -30.428516387939453, -29.51734161376953, -28.60616683959961, -27.694992065429688, -26.783817291259766, -25.872642517089844, -24.961467742919922, -24.05029296875, -23.139118194580078, -22.227943420410156, -21.316768646240234, -20.405593872070312, -19.49441909790039, -18.58324432373047, -17.672069549560547, -16.760894775390625, -15.849720001220703, -14.938545227050781, -14.02737045288086, -13.116195678710938, -12.205020904541016, -11.293846130371094, -10.382671356201172, -9.47149658203125, -8.560321807861328, -7.649145126342773, -6.737970352172852, -5.82679557800293, -4.915620803833008, -4.004446029663086, -3.093271255493164, -2.182096481323242, -1.2709217071533203, -0.35974693298339844, 0.5514278411865234, 1.4626026153564453, 2.373777389526367, 3.284952163696289, 4.196126937866211, 5.107301712036133, 6.018476486206055, 6.929651260375977, 7.840826034545898, 8.75200080871582, 9.663175582885742, 10.574350357055664, 11.485525131225586, 12.396699905395508, 13.30787467956543, 14.219049453735352, 15.130224227905273, 16.041399002075195, 16.952573776245117, 17.86374855041504, 18.77492332458496, 19.686098098754883, 20.597272872924805, 21.508447647094727]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 5.0, 4.0, 6.0, 3.0, 11.0, 11.0, 6.0, 8.0, 9.0, 11.0, 11.0, 17.0, 10.0, 23.0, 21.0, 25.0, 25.0, 34.0, 20.0, 31.0, 36.0, 34.0, 29.0, 27.0, 37.0, 39.0, 33.0, 31.0, 35.0, 42.0, 28.0, 30.0, 39.0, 32.0, 22.0, 26.0, 23.0, 20.0, 18.0, 16.0, 12.0, 13.0, 15.0, 13.0, 16.0, 15.0, 4.0, 8.0, 5.0, 4.0, 0.0, 4.0, 1.0, 2.0, 3.0, 3.0], "bins": [-8.060611724853516, -7.823540687561035, -7.586470127105713, -7.349399566650391, -7.11232852935791, -6.87525749206543, -6.638186931610107, -6.401116371154785, -6.164045333862305, -5.926974296569824, -5.689903736114502, -5.45283317565918, -5.215762138366699, -4.978691101074219, -4.7416205406188965, -4.504549980163574, -4.267478942871094, -4.030407905578613, -3.793337345123291, -3.5562665462493896, -3.3191957473754883, -3.082124948501587, -2.8450541496276855, -2.607983350753784, -2.370912551879883, -2.1338417530059814, -1.89677095413208, -1.6597001552581787, -1.4226293563842773, -1.185558557510376, -0.9484877586364746, -0.7114169597625732, -0.47434568405151367, -0.2372748851776123, -0.0002040863037109375, 0.23686671257019043, 0.4739375114440918, 0.7110083103179932, 0.9480791091918945, 1.185149908065796, 1.4222207069396973, 1.6592915058135986, 1.8963623046875, 2.1334331035614014, 2.3705039024353027, 2.607574701309204, 2.8446455001831055, 3.081716299057007, 3.318787097930908, 3.5558578968048096, 3.792928695678711, 4.029999732971191, 4.267070293426514, 4.504140853881836, 4.741211891174316, 4.978282928466797, 5.215353488922119, 5.452424049377441, 5.689495086669922, 5.926566123962402, 6.163636684417725, 6.400707244873047, 6.637778282165527, 6.874849319458008, 7.11191987991333]}, "gradients/decoder.bert.encoder.layer.8.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 5.0, 3.0, 5.0, 5.0, 17.0, 8.0, 17.0, 22.0, 38.0, 49.0, 64.0, 83.0, 144.0, 235.0, 316.0, 461.0, 719.0, 1163.0, 1839.0, 3074.0, 5340.0, 10034.0, 19943.0, 41666.0, 94644.0, 243933.0, 736718.0, 1590568.0, 924550.0, 305799.0, 114956.0, 48979.0, 22951.0, 11226.0, 5993.0, 3274.0, 1979.0, 1204.0, 790.0, 505.0, 304.0, 186.0, 137.0, 101.0, 82.0, 48.0, 36.0, 30.0, 10.0, 10.0, 8.0, 10.0, 2.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-19.96875, -19.316162109375, -18.66357421875, -18.010986328125, -17.3583984375, -16.705810546875, -16.05322265625, -15.400634765625, -14.748046875, -14.095458984375, -13.44287109375, -12.790283203125, -12.1376953125, -11.485107421875, -10.83251953125, -10.179931640625, -9.52734375, -8.874755859375, -8.22216796875, -7.569580078125, -6.9169921875, -6.264404296875, -5.61181640625, -4.959228515625, -4.306640625, -3.654052734375, -3.00146484375, -2.348876953125, -1.6962890625, -1.043701171875, -0.39111328125, 0.261474609375, 0.9140625, 1.566650390625, 2.21923828125, 2.871826171875, 3.5244140625, 4.177001953125, 4.82958984375, 5.482177734375, 6.134765625, 6.787353515625, 7.43994140625, 8.092529296875, 8.7451171875, 9.397705078125, 10.05029296875, 10.702880859375, 11.35546875, 12.008056640625, 12.66064453125, 13.313232421875, 13.9658203125, 14.618408203125, 15.27099609375, 15.923583984375, 16.576171875, 17.228759765625, 17.88134765625, 18.533935546875, 19.1865234375, 19.839111328125, 20.49169921875, 21.144287109375, 21.796875]}, "gradients/decoder.bert.encoder.layer.8.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 5.0, 4.0, 4.0, 5.0, 7.0, 7.0, 11.0, 10.0, 7.0, 13.0, 18.0, 19.0, 18.0, 35.0, 33.0, 32.0, 27.0, 28.0, 31.0, 40.0, 44.0, 35.0, 44.0, 31.0, 32.0, 46.0, 42.0, 40.0, 38.0, 46.0, 34.0, 31.0, 18.0, 17.0, 20.0, 26.0, 19.0, 20.0, 14.0, 10.0, 16.0, 7.0, 6.0, 2.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-7.09765625, -6.884521484375, -6.67138671875, -6.458251953125, -6.2451171875, -6.031982421875, -5.81884765625, -5.605712890625, -5.392578125, -5.179443359375, -4.96630859375, -4.753173828125, -4.5400390625, -4.326904296875, -4.11376953125, -3.900634765625, -3.6875, -3.474365234375, -3.26123046875, -3.048095703125, -2.8349609375, -2.621826171875, -2.40869140625, -2.195556640625, -1.982421875, -1.769287109375, -1.55615234375, -1.343017578125, -1.1298828125, -0.916748046875, -0.70361328125, -0.490478515625, -0.27734375, -0.064208984375, 0.14892578125, 0.362060546875, 0.5751953125, 0.788330078125, 1.00146484375, 1.214599609375, 1.427734375, 1.640869140625, 1.85400390625, 2.067138671875, 2.2802734375, 2.493408203125, 2.70654296875, 2.919677734375, 3.1328125, 3.345947265625, 3.55908203125, 3.772216796875, 3.9853515625, 4.198486328125, 4.41162109375, 4.624755859375, 4.837890625, 5.051025390625, 5.26416015625, 5.477294921875, 5.6904296875, 5.903564453125, 6.11669921875, 6.329833984375, 6.54296875]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 5.0, 3.0, 8.0, 15.0, 16.0, 25.0, 47.0, 63.0, 95.0, 156.0, 249.0, 363.0, 620.0, 890.0, 1445.0, 2373.0, 4037.0, 7026.0, 12494.0, 22767.0, 44260.0, 89876.0, 191893.0, 433692.0, 958447.0, 1227135.0, 649955.0, 283775.0, 128875.0, 62010.0, 31724.0, 16803.0, 9575.0, 5356.0, 3155.0, 1914.0, 1174.0, 736.0, 428.0, 278.0, 179.0, 118.0, 81.0, 64.0, 36.0, 31.0, 6.0, 8.0, 8.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.515625, -15.930908203125, -15.34619140625, -14.761474609375, -14.1767578125, -13.592041015625, -13.00732421875, -12.422607421875, -11.837890625, -11.253173828125, -10.66845703125, -10.083740234375, -9.4990234375, -8.914306640625, -8.32958984375, -7.744873046875, -7.16015625, -6.575439453125, -5.99072265625, -5.406005859375, -4.8212890625, -4.236572265625, -3.65185546875, -3.067138671875, -2.482421875, -1.897705078125, -1.31298828125, -0.728271484375, -0.1435546875, 0.441162109375, 1.02587890625, 1.610595703125, 2.1953125, 2.780029296875, 3.36474609375, 3.949462890625, 4.5341796875, 5.118896484375, 5.70361328125, 6.288330078125, 6.873046875, 7.457763671875, 8.04248046875, 8.627197265625, 9.2119140625, 9.796630859375, 10.38134765625, 10.966064453125, 11.55078125, 12.135498046875, 12.72021484375, 13.304931640625, 13.8896484375, 14.474365234375, 15.05908203125, 15.643798828125, 16.228515625, 16.813232421875, 17.39794921875, 17.982666015625, 18.5673828125, 19.152099609375, 19.73681640625, 20.321533203125, 20.90625]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 7.0, 4.0, 4.0, 7.0, 7.0, 24.0, 27.0, 34.0, 54.0, 50.0, 72.0, 82.0, 117.0, 145.0, 172.0, 261.0, 267.0, 313.0, 303.0, 349.0, 321.0, 280.0, 272.0, 212.0, 164.0, 116.0, 93.0, 87.0, 55.0, 46.0, 28.0, 30.0, 28.0, 11.0, 9.0, 11.0, 6.0, 8.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.88671875, -5.7188720703125, -5.551025390625, -5.3831787109375, -5.21533203125, -5.0474853515625, -4.879638671875, -4.7117919921875, -4.5439453125, -4.3760986328125, -4.208251953125, -4.0404052734375, -3.87255859375, -3.7047119140625, -3.536865234375, -3.3690185546875, -3.201171875, -3.0333251953125, -2.865478515625, -2.6976318359375, -2.52978515625, -2.3619384765625, -2.194091796875, -2.0262451171875, -1.8583984375, -1.6905517578125, -1.522705078125, -1.3548583984375, -1.18701171875, -1.0191650390625, -0.851318359375, -0.6834716796875, -0.515625, -0.3477783203125, -0.179931640625, -0.0120849609375, 0.15576171875, 0.3236083984375, 0.491455078125, 0.6593017578125, 0.8271484375, 0.9949951171875, 1.162841796875, 1.3306884765625, 1.49853515625, 1.6663818359375, 1.834228515625, 2.0020751953125, 2.169921875, 2.3377685546875, 2.505615234375, 2.6734619140625, 2.84130859375, 3.0091552734375, 3.177001953125, 3.3448486328125, 3.5126953125, 3.6805419921875, 3.848388671875, 4.0162353515625, 4.18408203125, 4.3519287109375, 4.519775390625, 4.6876220703125, 4.85546875]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 1.0, 2.0, 1.0, 7.0, 4.0, 6.0, 8.0, 18.0, 16.0, 25.0, 36.0, 60.0, 80.0, 83.0, 97.0, 98.0, 96.0, 101.0, 72.0, 49.0, 34.0, 29.0, 16.0, 19.0, 5.0, 12.0, 9.0, 4.0, 6.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-31.563068389892578, -30.723012924194336, -29.882959365844727, -29.042903900146484, -28.202850341796875, -27.362794876098633, -26.52273941040039, -25.68268585205078, -24.842632293701172, -24.00257682800293, -23.16252326965332, -22.322467803955078, -21.48241424560547, -20.642358779907227, -19.802303314208984, -18.962249755859375, -18.122194290161133, -17.28213882446289, -16.44208526611328, -15.602029800415039, -14.76197624206543, -13.921920776367188, -13.081866264343262, -12.241811752319336, -11.40175724029541, -10.561702728271484, -9.721648216247559, -8.881593704223633, -8.04153823852539, -7.201484203338623, -6.361429214477539, -5.521374702453613, -4.6813201904296875, -3.8412656784057617, -3.001210927963257, -2.161156177520752, -1.3211016654968262, -0.4810471534729004, 0.3590078353881836, 1.1990623474121094, 2.039116859436035, 2.879171371459961, 3.719226121902466, 4.559280872344971, 5.3993353843688965, 6.239389896392822, 7.079444885253906, 7.919499397277832, 8.759553909301758, 9.599608421325684, 10.43966293334961, 11.279718399047852, 12.119771957397461, 12.959827423095703, 13.799881935119629, 14.639936447143555, 15.47999095916748, 16.320045471191406, 17.16010093688965, 18.000154495239258, 18.8402099609375, 19.68026351928711, 20.52031898498535, 21.360374450683594, 22.200428009033203]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 1.0, 3.0, 8.0, 3.0, 4.0, 16.0, 6.0, 10.0, 12.0, 17.0, 16.0, 17.0, 25.0, 19.0, 24.0, 33.0, 37.0, 38.0, 25.0, 34.0, 48.0, 37.0, 36.0, 39.0, 22.0, 25.0, 30.0, 40.0, 33.0, 33.0, 32.0, 33.0, 28.0, 34.0, 30.0, 14.0, 22.0, 23.0, 19.0, 26.0, 8.0, 12.0, 5.0, 9.0, 3.0, 5.0, 2.0, 7.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.10766315460205, -7.854564189910889, -7.601465225219727, -7.348365783691406, -7.095266819000244, -6.842167854309082, -6.589068412780762, -6.3359694480896, -6.0828704833984375, -5.829771518707275, -5.576672554016113, -5.323573112487793, -5.070474147796631, -4.817375183105469, -4.564275741577148, -4.311176776885986, -4.058077812194824, -3.804978847503662, -3.551879644393921, -3.2987804412841797, -3.0456814765930176, -2.7925825119018555, -2.5394833087921143, -2.286384105682373, -2.033285140991211, -1.7801860570907593, -1.5270869731903076, -1.273987889289856, -1.0208888053894043, -0.7677897214889526, -0.514690637588501, -0.2615915536880493, -0.008492469787597656, 0.244606614112854, 0.49770569801330566, 0.7508047819137573, 1.003903865814209, 1.2570029497146606, 1.5101020336151123, 1.763201117515564, 2.0163002014160156, 2.2693991661071777, 2.522498369216919, 2.77559757232666, 3.0286965370178223, 3.2817955017089844, 3.5348947048187256, 3.787993907928467, 4.041092872619629, 4.294191837310791, 4.547290802001953, 4.800390243530273, 5.0534892082214355, 5.306588172912598, 5.559687614440918, 5.81278657913208, 6.065885543823242, 6.318984508514404, 6.572083473205566, 6.825182914733887, 7.078281879425049, 7.331380844116211, 7.584480285644531, 7.837579250335693, 8.090678215026855]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 12.0, 21.0, 26.0, 51.0, 62.0, 103.0, 141.0, 182.0, 295.0, 486.0, 781.0, 1134.0, 1729.0, 2781.0, 4426.0, 7093.0, 11553.0, 19474.0, 32856.0, 55720.0, 92138.0, 141781.0, 180612.0, 171667.0, 126202.0, 79115.0, 47143.0, 27895.0, 16493.0, 9803.0, 6201.0, 3749.0, 2390.0, 1577.0, 979.0, 645.0, 425.0, 238.0, 174.0, 151.0, 83.0, 46.0, 46.0, 25.0, 18.0, 10.0, 5.0, 10.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-5.91015625, -5.72454833984375, -5.5389404296875, -5.35333251953125, -5.167724609375, -4.98211669921875, -4.7965087890625, -4.61090087890625, -4.42529296875, -4.23968505859375, -4.0540771484375, -3.86846923828125, -3.682861328125, -3.49725341796875, -3.3116455078125, -3.12603759765625, -2.9404296875, -2.75482177734375, -2.5692138671875, -2.38360595703125, -2.197998046875, -2.01239013671875, -1.8267822265625, -1.64117431640625, -1.45556640625, -1.26995849609375, -1.0843505859375, -0.89874267578125, -0.713134765625, -0.52752685546875, -0.3419189453125, -0.15631103515625, 0.029296875, 0.21490478515625, 0.4005126953125, 0.58612060546875, 0.771728515625, 0.95733642578125, 1.1429443359375, 1.32855224609375, 1.51416015625, 1.69976806640625, 1.8853759765625, 2.07098388671875, 2.256591796875, 2.44219970703125, 2.6278076171875, 2.81341552734375, 2.9990234375, 3.18463134765625, 3.3702392578125, 3.55584716796875, 3.741455078125, 3.92706298828125, 4.1126708984375, 4.29827880859375, 4.48388671875, 4.66949462890625, 4.8551025390625, 5.04071044921875, 5.226318359375, 5.41192626953125, 5.5975341796875, 5.78314208984375, 5.96875]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 5.0, 6.0, 3.0, 8.0, 9.0, 6.0, 10.0, 11.0, 8.0, 28.0, 14.0, 24.0, 26.0, 22.0, 40.0, 38.0, 38.0, 44.0, 45.0, 43.0, 31.0, 26.0, 36.0, 41.0, 37.0, 38.0, 42.0, 34.0, 36.0, 34.0, 21.0, 27.0, 25.0, 23.0, 29.0, 17.0, 20.0, 16.0, 8.0, 7.0, 8.0, 4.0, 6.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-10.046875, -9.7335205078125, -9.420166015625, -9.1068115234375, -8.79345703125, -8.4801025390625, -8.166748046875, -7.8533935546875, -7.5400390625, -7.2266845703125, -6.913330078125, -6.5999755859375, -6.28662109375, -5.9732666015625, -5.659912109375, -5.3465576171875, -5.033203125, -4.7198486328125, -4.406494140625, -4.0931396484375, -3.77978515625, -3.4664306640625, -3.153076171875, -2.8397216796875, -2.5263671875, -2.2130126953125, -1.899658203125, -1.5863037109375, -1.27294921875, -0.9595947265625, -0.646240234375, -0.3328857421875, -0.01953125, 0.2938232421875, 0.607177734375, 0.9205322265625, 1.23388671875, 1.5472412109375, 1.860595703125, 2.1739501953125, 2.4873046875, 2.8006591796875, 3.114013671875, 3.4273681640625, 3.74072265625, 4.0540771484375, 4.367431640625, 4.6807861328125, 4.994140625, 5.3074951171875, 5.620849609375, 5.9342041015625, 6.24755859375, 6.5609130859375, 6.874267578125, 7.1876220703125, 7.5009765625, 7.8143310546875, 8.127685546875, 8.4410400390625, 8.75439453125, 9.0677490234375, 9.381103515625, 9.6944580078125, 10.0078125]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 3.0, 11.0, 20.0, 27.0, 36.0, 47.0, 85.0, 107.0, 194.0, 266.0, 464.0, 722.0, 1240.0, 2097.0, 3438.0, 6419.0, 12125.0, 23300.0, 47875.0, 101407.0, 203506.0, 278494.0, 186119.0, 91192.0, 43290.0, 21175.0, 10827.0, 5720.0, 3352.0, 1948.0, 1162.0, 702.0, 403.0, 283.0, 181.0, 123.0, 52.0, 40.0, 23.0, 22.0, 18.0, 11.0, 5.0, 7.0, 4.0, 6.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-9.875, -9.560791015625, -9.24658203125, -8.932373046875, -8.6181640625, -8.303955078125, -7.98974609375, -7.675537109375, -7.361328125, -7.047119140625, -6.73291015625, -6.418701171875, -6.1044921875, -5.790283203125, -5.47607421875, -5.161865234375, -4.84765625, -4.533447265625, -4.21923828125, -3.905029296875, -3.5908203125, -3.276611328125, -2.96240234375, -2.648193359375, -2.333984375, -2.019775390625, -1.70556640625, -1.391357421875, -1.0771484375, -0.762939453125, -0.44873046875, -0.134521484375, 0.1796875, 0.493896484375, 0.80810546875, 1.122314453125, 1.4365234375, 1.750732421875, 2.06494140625, 2.379150390625, 2.693359375, 3.007568359375, 3.32177734375, 3.635986328125, 3.9501953125, 4.264404296875, 4.57861328125, 4.892822265625, 5.20703125, 5.521240234375, 5.83544921875, 6.149658203125, 6.4638671875, 6.778076171875, 7.09228515625, 7.406494140625, 7.720703125, 8.034912109375, 8.34912109375, 8.663330078125, 8.9775390625, 9.291748046875, 9.60595703125, 9.920166015625, 10.234375]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 9.0, 7.0, 12.0, 9.0, 14.0, 13.0, 14.0, 16.0, 14.0, 23.0, 29.0, 29.0, 41.0, 38.0, 31.0, 37.0, 56.0, 39.0, 49.0, 41.0, 33.0, 46.0, 43.0, 36.0, 46.0, 28.0, 27.0, 39.0, 27.0, 20.0, 13.0, 18.0, 11.0, 17.0, 11.0, 15.0, 8.0, 8.0, 10.0, 5.0, 1.0, 5.0, 3.0, 6.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.16015625, -5.974853515625, -5.78955078125, -5.604248046875, -5.4189453125, -5.233642578125, -5.04833984375, -4.863037109375, -4.677734375, -4.492431640625, -4.30712890625, -4.121826171875, -3.9365234375, -3.751220703125, -3.56591796875, -3.380615234375, -3.1953125, -3.010009765625, -2.82470703125, -2.639404296875, -2.4541015625, -2.268798828125, -2.08349609375, -1.898193359375, -1.712890625, -1.527587890625, -1.34228515625, -1.156982421875, -0.9716796875, -0.786376953125, -0.60107421875, -0.415771484375, -0.23046875, -0.045166015625, 0.14013671875, 0.325439453125, 0.5107421875, 0.696044921875, 0.88134765625, 1.066650390625, 1.251953125, 1.437255859375, 1.62255859375, 1.807861328125, 1.9931640625, 2.178466796875, 2.36376953125, 2.549072265625, 2.734375, 2.919677734375, 3.10498046875, 3.290283203125, 3.4755859375, 3.660888671875, 3.84619140625, 4.031494140625, 4.216796875, 4.402099609375, 4.58740234375, 4.772705078125, 4.9580078125, 5.143310546875, 5.32861328125, 5.513916015625, 5.69921875]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 5.0, 9.0, 9.0, 19.0, 23.0, 29.0, 42.0, 74.0, 92.0, 133.0, 213.0, 321.0, 412.0, 631.0, 961.0, 1430.0, 2341.0, 3672.0, 6003.0, 10150.0, 17903.0, 32789.0, 61919.0, 119947.0, 220980.0, 249909.0, 148595.0, 77352.0, 39928.0, 21342.0, 12052.0, 7231.0, 4227.0, 2669.0, 1773.0, 1096.0, 716.0, 468.0, 330.0, 235.0, 156.0, 107.0, 75.0, 59.0, 45.0, 30.0, 18.0, 18.0, 6.0, 9.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.109375, -3.0126953125, -2.916015625, -2.8193359375, -2.72265625, -2.6259765625, -2.529296875, -2.4326171875, -2.3359375, -2.2392578125, -2.142578125, -2.0458984375, -1.94921875, -1.8525390625, -1.755859375, -1.6591796875, -1.5625, -1.4658203125, -1.369140625, -1.2724609375, -1.17578125, -1.0791015625, -0.982421875, -0.8857421875, -0.7890625, -0.6923828125, -0.595703125, -0.4990234375, -0.40234375, -0.3056640625, -0.208984375, -0.1123046875, -0.015625, 0.0810546875, 0.177734375, 0.2744140625, 0.37109375, 0.4677734375, 0.564453125, 0.6611328125, 0.7578125, 0.8544921875, 0.951171875, 1.0478515625, 1.14453125, 1.2412109375, 1.337890625, 1.4345703125, 1.53125, 1.6279296875, 1.724609375, 1.8212890625, 1.91796875, 2.0146484375, 2.111328125, 2.2080078125, 2.3046875, 2.4013671875, 2.498046875, 2.5947265625, 2.69140625, 2.7880859375, 2.884765625, 2.9814453125, 3.078125]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 1.0, 6.0, 3.0, 2.0, 2.0, 8.0, 9.0, 10.0, 18.0, 22.0, 33.0, 32.0, 50.0, 69.0, 60.0, 69.0, 73.0, 75.0, 64.0, 77.0, 65.0, 61.0, 38.0, 45.0, 29.0, 23.0, 18.0, 10.0, 11.0, 5.0, 7.0, 3.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000278472900390625, -0.0002697482705116272, -0.0002610236406326294, -0.0002522990107536316, -0.0002435743808746338, -0.00023484975099563599, -0.00022612512111663818, -0.00021740049123764038, -0.00020867586135864258, -0.00019995123147964478, -0.00019122660160064697, -0.00018250197172164917, -0.00017377734184265137, -0.00016505271196365356, -0.00015632808208465576, -0.00014760345220565796, -0.00013887882232666016, -0.00013015419244766235, -0.00012142956256866455, -0.00011270493268966675, -0.00010398030281066895, -9.525567293167114e-05, -8.653104305267334e-05, -7.780641317367554e-05, -6.908178329467773e-05, -6.035715341567993e-05, -5.163252353668213e-05, -4.2907893657684326e-05, -3.4183263778686523e-05, -2.545863389968872e-05, -1.6734004020690918e-05, -8.009374141693115e-06, 7.152557373046875e-07, 9.43988561630249e-06, 1.8164515495300293e-05, 2.6889145374298096e-05, 3.56137752532959e-05, 4.43384051322937e-05, 5.3063035011291504e-05, 6.17876648902893e-05, 7.051229476928711e-05, 7.923692464828491e-05, 8.796155452728271e-05, 9.668618440628052e-05, 0.00010541081428527832, 0.00011413544416427612, 0.00012286007404327393, 0.00013158470392227173, 0.00014030933380126953, 0.00014903396368026733, 0.00015775859355926514, 0.00016648322343826294, 0.00017520785331726074, 0.00018393248319625854, 0.00019265711307525635, 0.00020138174295425415, 0.00021010637283325195, 0.00021883100271224976, 0.00022755563259124756, 0.00023628026247024536, 0.00024500489234924316, 0.00025372952222824097, 0.00026245415210723877, 0.00027117878198623657, 0.0002799034118652344]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 8.0, 5.0, 14.0, 21.0, 23.0, 30.0, 47.0, 57.0, 104.0, 126.0, 216.0, 307.0, 492.0, 785.0, 1245.0, 2107.0, 3465.0, 5825.0, 10613.0, 19238.0, 36080.0, 71083.0, 134953.0, 216855.0, 226758.0, 148628.0, 79693.0, 40688.0, 21390.0, 11546.0, 6403.0, 3732.0, 2300.0, 1314.0, 806.0, 542.0, 338.0, 268.0, 150.0, 90.0, 56.0, 48.0, 42.0, 23.0, 15.0, 15.0, 8.0, 7.0, 3.0, 1.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.73828125, -2.63330078125, -2.5283203125, -2.42333984375, -2.318359375, -2.21337890625, -2.1083984375, -2.00341796875, -1.8984375, -1.79345703125, -1.6884765625, -1.58349609375, -1.478515625, -1.37353515625, -1.2685546875, -1.16357421875, -1.05859375, -0.95361328125, -0.8486328125, -0.74365234375, -0.638671875, -0.53369140625, -0.4287109375, -0.32373046875, -0.21875, -0.11376953125, -0.0087890625, 0.09619140625, 0.201171875, 0.30615234375, 0.4111328125, 0.51611328125, 0.62109375, 0.72607421875, 0.8310546875, 0.93603515625, 1.041015625, 1.14599609375, 1.2509765625, 1.35595703125, 1.4609375, 1.56591796875, 1.6708984375, 1.77587890625, 1.880859375, 1.98583984375, 2.0908203125, 2.19580078125, 2.30078125, 2.40576171875, 2.5107421875, 2.61572265625, 2.720703125, 2.82568359375, 2.9306640625, 3.03564453125, 3.140625, 3.24560546875, 3.3505859375, 3.45556640625, 3.560546875, 3.66552734375, 3.7705078125, 3.87548828125, 3.98046875]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 2.0, 5.0, 6.0, 6.0, 9.0, 11.0, 18.0, 14.0, 27.0, 30.0, 27.0, 31.0, 38.0, 49.0, 49.0, 68.0, 69.0, 53.0, 50.0, 67.0, 60.0, 38.0, 48.0, 39.0, 35.0, 28.0, 30.0, 25.0, 15.0, 10.0, 13.0, 14.0, 8.0, 4.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.86572265625, -0.8377761840820312, -0.8098297119140625, -0.7818832397460938, -0.753936767578125, -0.7259902954101562, -0.6980438232421875, -0.6700973510742188, -0.64215087890625, -0.6142044067382812, -0.5862579345703125, -0.5583114624023438, -0.530364990234375, -0.5024185180664062, -0.4744720458984375, -0.44652557373046875, -0.4185791015625, -0.39063262939453125, -0.3626861572265625, -0.33473968505859375, -0.306793212890625, -0.27884674072265625, -0.2509002685546875, -0.22295379638671875, -0.19500732421875, -0.16706085205078125, -0.1391143798828125, -0.11116790771484375, -0.083221435546875, -0.05527496337890625, -0.0273284912109375, 0.00061798095703125, 0.028564453125, 0.05651092529296875, 0.0844573974609375, 0.11240386962890625, 0.140350341796875, 0.16829681396484375, 0.1962432861328125, 0.22418975830078125, 0.25213623046875, 0.28008270263671875, 0.3080291748046875, 0.33597564697265625, 0.363922119140625, 0.39186859130859375, 0.4198150634765625, 0.44776153564453125, 0.4757080078125, 0.5036544799804688, 0.5316009521484375, 0.5595474243164062, 0.587493896484375, 0.6154403686523438, 0.6433868408203125, 0.6713333129882812, 0.69927978515625, 0.7272262573242188, 0.7551727294921875, 0.7831192016601562, 0.811065673828125, 0.8390121459960938, 0.8669586181640625, 0.8949050903320312, 0.9228515625]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 3.0, 3.0, 2.0, 4.0, 4.0, 5.0, 8.0, 17.0, 15.0, 27.0, 28.0, 60.0, 88.0, 67.0, 104.0, 84.0, 109.0, 94.0, 89.0, 45.0, 32.0, 26.0, 24.0, 15.0, 11.0, 11.0, 12.0, 1.0, 7.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-31.42422866821289, -30.589895248413086, -29.75556182861328, -28.92123031616211, -28.086896896362305, -27.2525634765625, -26.418231964111328, -25.583898544311523, -24.74956512451172, -23.915231704711914, -23.08089828491211, -22.246566772460938, -21.412233352661133, -20.577899932861328, -19.743568420410156, -18.90923500061035, -18.074901580810547, -17.240568161010742, -16.406234741210938, -15.571903228759766, -14.737569808959961, -13.903236389160156, -13.068903923034668, -12.23457145690918, -11.400238037109375, -10.56590461730957, -9.731572151184082, -8.897239685058594, -8.062906265258789, -7.228573322296143, -6.394240379333496, -5.55990743637085, -4.72557258605957, -3.891239643096924, -3.0569067001342773, -2.222573757171631, -1.3882408142089844, -0.5539078712463379, 0.2804250717163086, 1.114758014678955, 1.9490909576416016, 2.783423900604248, 3.6177568435668945, 4.452089786529541, 5.2864227294921875, 6.120755672454834, 6.9550886154174805, 7.789421558380127, 8.623754501342773, 9.458087921142578, 10.292420387268066, 11.126752853393555, 11.96108627319336, 12.795419692993164, 13.629752159118652, 14.46408462524414, 15.298418045043945, 16.13275146484375, 16.967082977294922, 17.801416397094727, 18.63574981689453, 19.470083236694336, 20.30441665649414, 21.138748168945312, 21.973081588745117]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 5.0, 5.0, 3.0, 10.0, 13.0, 4.0, 12.0, 7.0, 19.0, 14.0, 22.0, 23.0, 19.0, 23.0, 28.0, 36.0, 37.0, 29.0, 34.0, 44.0, 34.0, 38.0, 38.0, 24.0, 32.0, 27.0, 35.0, 28.0, 35.0, 35.0, 39.0, 25.0, 21.0, 36.0, 26.0, 17.0, 23.0, 20.0, 20.0, 15.0, 9.0, 9.0, 10.0, 1.0, 5.0, 3.0, 4.0, 6.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.997335910797119, -7.750179767608643, -7.503023147583008, -7.255867004394531, -7.008710861206055, -6.761554718017578, -6.514398097991943, -6.267241954803467, -6.020085334777832, -5.7729291915893555, -5.525772571563721, -5.278616428375244, -5.031460285186768, -4.784303665161133, -4.537147521972656, -4.28999137878418, -4.042835235595703, -3.7956788539886475, -3.548522710800171, -3.3013663291931152, -3.0542101860046387, -2.807053804397583, -2.5598974227905273, -2.312741279602051, -2.065584897994995, -1.818428635597229, -1.571272373199463, -1.3241159915924072, -1.0769597291946411, -0.829803466796875, -0.5826470851898193, -0.3354908227920532, -0.08833456039428711, 0.1588217318058014, 0.4059780240058899, 0.6531343460083008, 0.9002906084060669, 1.147446870803833, 1.3946032524108887, 1.6417595148086548, 1.888915777206421, 2.1360721588134766, 2.383228302001953, 2.630384683609009, 2.8775410652160645, 3.124697208404541, 3.3718535900115967, 3.6190099716186523, 3.866166114807129, 4.1133222579956055, 4.36047887802124, 4.607635021209717, 4.854791164398193, 5.101947784423828, 5.349103927612305, 5.596260070800781, 5.843416213989258, 6.090572357177734, 6.337728977203369, 6.584885120391846, 6.832041263580322, 7.079197883605957, 7.326354026794434, 7.57351016998291, 7.820666790008545]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 1.0, 2.0, 5.0, 17.0, 19.0, 26.0, 33.0, 55.0, 76.0, 111.0, 206.0, 324.0, 469.0, 701.0, 1165.0, 1713.0, 2808.0, 4503.0, 7167.0, 11349.0, 17982.0, 28399.0, 44252.0, 68793.0, 100597.0, 133880.0, 152438.0, 142701.0, 110873.0, 77604.0, 51172.0, 32874.0, 20778.0, 12954.0, 8541.0, 5189.0, 3104.0, 2076.0, 1320.0, 778.0, 524.0, 349.0, 225.0, 137.0, 102.0, 45.0, 42.0, 19.0, 19.0, 18.0, 15.0, 6.0, 0.0, 5.0, 1.0, 1.0, 0.0, 2.0], "bins": [-11.625, -11.26904296875, -10.9130859375, -10.55712890625, -10.201171875, -9.84521484375, -9.4892578125, -9.13330078125, -8.77734375, -8.42138671875, -8.0654296875, -7.70947265625, -7.353515625, -6.99755859375, -6.6416015625, -6.28564453125, -5.9296875, -5.57373046875, -5.2177734375, -4.86181640625, -4.505859375, -4.14990234375, -3.7939453125, -3.43798828125, -3.08203125, -2.72607421875, -2.3701171875, -2.01416015625, -1.658203125, -1.30224609375, -0.9462890625, -0.59033203125, -0.234375, 0.12158203125, 0.4775390625, 0.83349609375, 1.189453125, 1.54541015625, 1.9013671875, 2.25732421875, 2.61328125, 2.96923828125, 3.3251953125, 3.68115234375, 4.037109375, 4.39306640625, 4.7490234375, 5.10498046875, 5.4609375, 5.81689453125, 6.1728515625, 6.52880859375, 6.884765625, 7.24072265625, 7.5966796875, 7.95263671875, 8.30859375, 8.66455078125, 9.0205078125, 9.37646484375, 9.732421875, 10.08837890625, 10.4443359375, 10.80029296875, 11.15625]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 2.0, 4.0, 5.0, 4.0, 9.0, 11.0, 23.0, 13.0, 12.0, 20.0, 14.0, 31.0, 15.0, 26.0, 26.0, 38.0, 38.0, 44.0, 42.0, 41.0, 31.0, 36.0, 46.0, 32.0, 25.0, 36.0, 34.0, 35.0, 38.0, 29.0, 28.0, 30.0, 30.0, 25.0, 21.0, 22.0, 15.0, 19.0, 9.0, 12.0, 9.0, 4.0, 4.0, 4.0, 2.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.2109375, -9.916015625, -9.62109375, -9.326171875, -9.03125, -8.736328125, -8.44140625, -8.146484375, -7.8515625, -7.556640625, -7.26171875, -6.966796875, -6.671875, -6.376953125, -6.08203125, -5.787109375, -5.4921875, -5.197265625, -4.90234375, -4.607421875, -4.3125, -4.017578125, -3.72265625, -3.427734375, -3.1328125, -2.837890625, -2.54296875, -2.248046875, -1.953125, -1.658203125, -1.36328125, -1.068359375, -0.7734375, -0.478515625, -0.18359375, 0.111328125, 0.40625, 0.701171875, 0.99609375, 1.291015625, 1.5859375, 1.880859375, 2.17578125, 2.470703125, 2.765625, 3.060546875, 3.35546875, 3.650390625, 3.9453125, 4.240234375, 4.53515625, 4.830078125, 5.125, 5.419921875, 5.71484375, 6.009765625, 6.3046875, 6.599609375, 6.89453125, 7.189453125, 7.484375, 7.779296875, 8.07421875, 8.369140625, 8.6640625]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 8.0, 11.0, 14.0, 22.0, 28.0, 45.0, 63.0, 116.0, 157.0, 270.0, 403.0, 620.0, 993.0, 1535.0, 2505.0, 4017.0, 6493.0, 10540.0, 17329.0, 28287.0, 46008.0, 72705.0, 108436.0, 144506.0, 159874.0, 144256.0, 108111.0, 72303.0, 45800.0, 28284.0, 17109.0, 10625.0, 6595.0, 3843.0, 2488.0, 1487.0, 940.0, 655.0, 367.0, 243.0, 164.0, 113.0, 63.0, 33.0, 36.0, 23.0, 10.0, 11.0, 6.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-13.140625, -12.748291015625, -12.35595703125, -11.963623046875, -11.5712890625, -11.178955078125, -10.78662109375, -10.394287109375, -10.001953125, -9.609619140625, -9.21728515625, -8.824951171875, -8.4326171875, -8.040283203125, -7.64794921875, -7.255615234375, -6.86328125, -6.470947265625, -6.07861328125, -5.686279296875, -5.2939453125, -4.901611328125, -4.50927734375, -4.116943359375, -3.724609375, -3.332275390625, -2.93994140625, -2.547607421875, -2.1552734375, -1.762939453125, -1.37060546875, -0.978271484375, -0.5859375, -0.193603515625, 0.19873046875, 0.591064453125, 0.9833984375, 1.375732421875, 1.76806640625, 2.160400390625, 2.552734375, 2.945068359375, 3.33740234375, 3.729736328125, 4.1220703125, 4.514404296875, 4.90673828125, 5.299072265625, 5.69140625, 6.083740234375, 6.47607421875, 6.868408203125, 7.2607421875, 7.653076171875, 8.04541015625, 8.437744140625, 8.830078125, 9.222412109375, 9.61474609375, 10.007080078125, 10.3994140625, 10.791748046875, 11.18408203125, 11.576416015625, 11.96875]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 3.0, 5.0, 1.0, 9.0, 4.0, 9.0, 8.0, 10.0, 9.0, 10.0, 14.0, 18.0, 19.0, 23.0, 25.0, 25.0, 25.0, 35.0, 44.0, 35.0, 29.0, 23.0, 42.0, 27.0, 24.0, 37.0, 49.0, 40.0, 44.0, 30.0, 37.0, 35.0, 33.0, 42.0, 24.0, 18.0, 23.0, 17.0, 22.0, 13.0, 13.0, 9.0, 13.0, 9.0, 4.0, 8.0, 3.0, 7.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.48828125, -5.31610107421875, -5.1439208984375, -4.97174072265625, -4.799560546875, -4.62738037109375, -4.4552001953125, -4.28302001953125, -4.11083984375, -3.93865966796875, -3.7664794921875, -3.59429931640625, -3.422119140625, -3.24993896484375, -3.0777587890625, -2.90557861328125, -2.7333984375, -2.56121826171875, -2.3890380859375, -2.21685791015625, -2.044677734375, -1.87249755859375, -1.7003173828125, -1.52813720703125, -1.35595703125, -1.18377685546875, -1.0115966796875, -0.83941650390625, -0.667236328125, -0.49505615234375, -0.3228759765625, -0.15069580078125, 0.021484375, 0.19366455078125, 0.3658447265625, 0.53802490234375, 0.710205078125, 0.88238525390625, 1.0545654296875, 1.22674560546875, 1.39892578125, 1.57110595703125, 1.7432861328125, 1.91546630859375, 2.087646484375, 2.25982666015625, 2.4320068359375, 2.60418701171875, 2.7763671875, 2.94854736328125, 3.1207275390625, 3.29290771484375, 3.465087890625, 3.63726806640625, 3.8094482421875, 3.98162841796875, 4.15380859375, 4.32598876953125, 4.4981689453125, 4.67034912109375, 4.842529296875, 5.01470947265625, 5.1868896484375, 5.35906982421875, 5.53125]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 6.0, 5.0, 7.0, 11.0, 15.0, 32.0, 34.0, 53.0, 73.0, 101.0, 168.0, 223.0, 321.0, 495.0, 752.0, 1168.0, 1743.0, 2909.0, 4825.0, 8403.0, 14833.0, 29136.0, 60990.0, 132857.0, 253592.0, 261777.0, 140906.0, 64245.0, 30869.0, 15810.0, 8692.0, 4863.0, 3030.0, 1919.0, 1231.0, 839.0, 515.0, 332.0, 250.0, 155.0, 101.0, 77.0, 64.0, 46.0, 34.0, 11.0, 17.0, 6.0, 5.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 3.0], "bins": [-8.1953125, -7.947265625, -7.69921875, -7.451171875, -7.203125, -6.955078125, -6.70703125, -6.458984375, -6.2109375, -5.962890625, -5.71484375, -5.466796875, -5.21875, -4.970703125, -4.72265625, -4.474609375, -4.2265625, -3.978515625, -3.73046875, -3.482421875, -3.234375, -2.986328125, -2.73828125, -2.490234375, -2.2421875, -1.994140625, -1.74609375, -1.498046875, -1.25, -1.001953125, -0.75390625, -0.505859375, -0.2578125, -0.009765625, 0.23828125, 0.486328125, 0.734375, 0.982421875, 1.23046875, 1.478515625, 1.7265625, 1.974609375, 2.22265625, 2.470703125, 2.71875, 2.966796875, 3.21484375, 3.462890625, 3.7109375, 3.958984375, 4.20703125, 4.455078125, 4.703125, 4.951171875, 5.19921875, 5.447265625, 5.6953125, 5.943359375, 6.19140625, 6.439453125, 6.6875, 6.935546875, 7.18359375, 7.431640625, 7.6796875]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 5.0, 7.0, 5.0, 6.0, 11.0, 17.0, 15.0, 19.0, 29.0, 41.0, 41.0, 55.0, 52.0, 71.0, 77.0, 92.0, 72.0, 63.0, 75.0, 55.0, 42.0, 21.0, 23.0, 22.0, 11.0, 11.0, 13.0, 8.0, 5.0, 4.0, 3.0, 7.0, 5.0, 2.0, 3.0, 0.0, 1.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0008358955383300781, -0.0008091703057289124, -0.0007824450731277466, -0.0007557198405265808, -0.000728994607925415, -0.0007022693753242493, -0.0006755441427230835, -0.0006488189101219177, -0.000622093677520752, -0.0005953684449195862, -0.0005686432123184204, -0.0005419179797172546, -0.0005151927471160889, -0.0004884675145149231, -0.0004617422819137573, -0.00043501704931259155, -0.0004082918167114258, -0.00038156658411026, -0.00035484135150909424, -0.00032811611890792847, -0.0003013908863067627, -0.0002746656537055969, -0.00024794042110443115, -0.00022121518850326538, -0.0001944899559020996, -0.00016776472330093384, -0.00014103949069976807, -0.0001143142580986023, -8.758902549743652e-05, -6.086379289627075e-05, -3.413856029510498e-05, -7.413327693939209e-06, 1.9311904907226562e-05, 4.6037137508392334e-05, 7.27623701095581e-05, 9.948760271072388e-05, 0.00012621283531188965, 0.00015293806791305542, 0.0001796633005142212, 0.00020638853311538696, 0.00023311376571655273, 0.0002598389983177185, 0.0002865642309188843, 0.00031328946352005005, 0.0003400146961212158, 0.0003667399287223816, 0.00039346516132354736, 0.00042019039392471313, 0.0004469156265258789, 0.0004736408591270447, 0.0005003660917282104, 0.0005270913243293762, 0.000553816556930542, 0.0005805417895317078, 0.0006072670221328735, 0.0006339922547340393, 0.0006607174873352051, 0.0006874427199363708, 0.0007141679525375366, 0.0007408931851387024, 0.0007676184177398682, 0.0007943436503410339, 0.0008210688829421997, 0.0008477941155433655, 0.0008745193481445312]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 10.0, 1.0, 3.0, 5.0, 10.0, 13.0, 19.0, 27.0, 46.0, 74.0, 105.0, 152.0, 242.0, 344.0, 589.0, 962.0, 1662.0, 2916.0, 5205.0, 10340.0, 20061.0, 42869.0, 91711.0, 194056.0, 286068.0, 203508.0, 97601.0, 44991.0, 21436.0, 10477.0, 5523.0, 3042.0, 1690.0, 1030.0, 688.0, 373.0, 247.0, 140.0, 80.0, 80.0, 55.0, 36.0, 24.0, 19.0, 14.0, 5.0, 7.0, 5.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-7.54296875, -7.29595947265625, -7.0489501953125, -6.80194091796875, -6.554931640625, -6.30792236328125, -6.0609130859375, -5.81390380859375, -5.56689453125, -5.31988525390625, -5.0728759765625, -4.82586669921875, -4.578857421875, -4.33184814453125, -4.0848388671875, -3.83782958984375, -3.5908203125, -3.34381103515625, -3.0968017578125, -2.84979248046875, -2.602783203125, -2.35577392578125, -2.1087646484375, -1.86175537109375, -1.61474609375, -1.36773681640625, -1.1207275390625, -0.87371826171875, -0.626708984375, -0.37969970703125, -0.1326904296875, 0.11431884765625, 0.361328125, 0.60833740234375, 0.8553466796875, 1.10235595703125, 1.349365234375, 1.59637451171875, 1.8433837890625, 2.09039306640625, 2.33740234375, 2.58441162109375, 2.8314208984375, 3.07843017578125, 3.325439453125, 3.57244873046875, 3.8194580078125, 4.06646728515625, 4.3134765625, 4.56048583984375, 4.8074951171875, 5.05450439453125, 5.301513671875, 5.54852294921875, 5.7955322265625, 6.04254150390625, 6.28955078125, 6.53656005859375, 6.7835693359375, 7.03057861328125, 7.277587890625, 7.52459716796875, 7.7716064453125, 8.01861572265625, 8.265625]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 1.0, 6.0, 6.0, 5.0, 6.0, 11.0, 13.0, 15.0, 15.0, 18.0, 11.0, 23.0, 26.0, 31.0, 44.0, 36.0, 45.0, 35.0, 47.0, 52.0, 56.0, 49.0, 43.0, 46.0, 50.0, 40.0, 37.0, 39.0, 25.0, 18.0, 26.0, 18.0, 8.0, 21.0, 20.0, 12.0, 6.0, 10.0, 7.0, 9.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.3056640625, -1.2625885009765625, -1.219512939453125, -1.1764373779296875, -1.13336181640625, -1.0902862548828125, -1.047210693359375, -1.0041351318359375, -0.9610595703125, -0.9179840087890625, -0.874908447265625, -0.8318328857421875, -0.78875732421875, -0.7456817626953125, -0.702606201171875, -0.6595306396484375, -0.616455078125, -0.5733795166015625, -0.530303955078125, -0.4872283935546875, -0.44415283203125, -0.4010772705078125, -0.358001708984375, -0.3149261474609375, -0.2718505859375, -0.2287750244140625, -0.185699462890625, -0.1426239013671875, -0.09954833984375, -0.0564727783203125, -0.013397216796875, 0.0296783447265625, 0.07275390625, 0.1158294677734375, 0.158905029296875, 0.2019805908203125, 0.24505615234375, 0.2881317138671875, 0.331207275390625, 0.3742828369140625, 0.4173583984375, 0.4604339599609375, 0.503509521484375, 0.5465850830078125, 0.58966064453125, 0.6327362060546875, 0.675811767578125, 0.7188873291015625, 0.761962890625, 0.8050384521484375, 0.848114013671875, 0.8911895751953125, 0.93426513671875, 0.9773406982421875, 1.020416259765625, 1.0634918212890625, 1.1065673828125, 1.1496429443359375, 1.192718505859375, 1.2357940673828125, 1.27886962890625, 1.3219451904296875, 1.365020751953125, 1.4080963134765625, 1.451171875]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 4.0, 5.0, 2.0, 6.0, 8.0, 10.0, 18.0, 33.0, 45.0, 83.0, 89.0, 125.0, 118.0, 125.0, 105.0, 70.0, 44.0, 31.0, 20.0, 18.0, 12.0, 11.0, 8.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-41.80689239501953, -40.80168533325195, -39.796478271484375, -38.7912712097168, -37.78606414794922, -36.78085708618164, -35.77565002441406, -34.77044677734375, -33.765235900878906, -32.76002883911133, -31.75482177734375, -30.749614715576172, -29.744407653808594, -28.739200592041016, -27.73399543762207, -26.728788375854492, -25.723583221435547, -24.71837615966797, -23.71316909790039, -22.707962036132812, -21.702754974365234, -20.697547912597656, -19.69234275817871, -18.687135696411133, -17.681928634643555, -16.676721572875977, -15.671514511108398, -14.666308403015137, -13.661101341247559, -12.65589427947998, -11.650688171386719, -10.64548110961914, -9.640270233154297, -8.635063171386719, -7.629856586456299, -6.624650001525879, -5.619442939758301, -4.614235877990723, -3.6090292930603027, -2.603822708129883, -1.5986156463623047, -0.5934088230133057, 0.41179800033569336, 1.4170048236846924, 2.4222116470336914, 3.4274187088012695, 4.4326252937316895, 5.437831878662109, 6.4430389404296875, 7.448246002197266, 8.453453063964844, 9.458659172058105, 10.463866233825684, 11.469073295593262, 12.474279403686523, 13.479486465454102, 14.48469352722168, 15.489900588989258, 16.495107650756836, 17.500314712524414, 18.50551986694336, 19.510726928710938, 20.515933990478516, 21.521141052246094, 22.526348114013672]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 2.0, 2.0, 6.0, 13.0, 8.0, 14.0, 13.0, 20.0, 18.0, 20.0, 18.0, 27.0, 31.0, 30.0, 32.0, 32.0, 45.0, 36.0, 48.0, 49.0, 44.0, 33.0, 43.0, 36.0, 35.0, 38.0, 36.0, 29.0, 33.0, 24.0, 30.0, 25.0, 19.0, 17.0, 17.0, 19.0, 18.0, 11.0, 14.0, 7.0, 4.0, 5.0, 6.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.87194538116455, -9.583544731140137, -9.295143127441406, -9.006742477416992, -8.718341827392578, -8.429941177368164, -8.141539573669434, -7.8531389236450195, -7.5647382736206055, -7.276337146759033, -6.987936496734619, -6.699535369873047, -6.411134719848633, -6.1227335929870605, -5.834332466125488, -5.545931816101074, -5.257530689239502, -4.96912956237793, -4.680728912353516, -4.392327785491943, -4.103927135467529, -3.815526008605957, -3.527125120162964, -3.2387242317199707, -2.9503233432769775, -2.6619224548339844, -2.373521566390991, -2.085120677947998, -1.7967196702957153, -1.5083187818527222, -1.2199177742004395, -0.9315168857574463, -0.6431159973144531, -0.3547150790691376, -0.06631416082382202, 0.22208678722381592, 0.5104876756668091, 0.7988885641098022, 1.087289571762085, 1.3756904602050781, 1.6640913486480713, 1.9524922370910645, 2.2408931255340576, 2.529294013977051, 2.817695140838623, 3.106095790863037, 3.3944969177246094, 3.6828978061676025, 3.9712986946105957, 4.259699821472168, 4.548100471496582, 4.836501598358154, 5.124902248382568, 5.413303375244141, 5.701704025268555, 5.990105152130127, 6.278506278991699, 6.5669074058532715, 6.8553080558776855, 7.143709182739258, 7.432109832763672, 7.720510959625244, 8.008912086486816, 8.29731273651123, 8.585713386535645]}, "gradients/decoder.bert.encoder.layer.7.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 7.0, 9.0, 8.0, 12.0, 20.0, 33.0, 38.0, 65.0, 100.0, 155.0, 257.0, 371.0, 628.0, 1013.0, 1666.0, 2971.0, 5443.0, 10076.0, 19378.0, 39645.0, 85456.0, 206799.0, 583575.0, 1424364.0, 1137368.0, 399460.0, 148983.0, 63446.0, 29864.0, 14972.0, 7753.0, 4247.0, 2438.0, 1439.0, 821.0, 527.0, 317.0, 214.0, 116.0, 86.0, 44.0, 30.0, 25.0, 18.0, 13.0, 5.0, 7.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.515625, -20.860107421875, -20.20458984375, -19.549072265625, -18.8935546875, -18.238037109375, -17.58251953125, -16.927001953125, -16.271484375, -15.615966796875, -14.96044921875, -14.304931640625, -13.6494140625, -12.993896484375, -12.33837890625, -11.682861328125, -11.02734375, -10.371826171875, -9.71630859375, -9.060791015625, -8.4052734375, -7.749755859375, -7.09423828125, -6.438720703125, -5.783203125, -5.127685546875, -4.47216796875, -3.816650390625, -3.1611328125, -2.505615234375, -1.85009765625, -1.194580078125, -0.5390625, 0.116455078125, 0.77197265625, 1.427490234375, 2.0830078125, 2.738525390625, 3.39404296875, 4.049560546875, 4.705078125, 5.360595703125, 6.01611328125, 6.671630859375, 7.3271484375, 7.982666015625, 8.63818359375, 9.293701171875, 9.94921875, 10.604736328125, 11.26025390625, 11.915771484375, 12.5712890625, 13.226806640625, 13.88232421875, 14.537841796875, 15.193359375, 15.848876953125, 16.50439453125, 17.159912109375, 17.8154296875, 18.470947265625, 19.12646484375, 19.781982421875, 20.4375]}, "gradients/decoder.bert.encoder.layer.7.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 2.0, 5.0, 8.0, 9.0, 11.0, 12.0, 10.0, 21.0, 20.0, 24.0, 30.0, 16.0, 29.0, 25.0, 28.0, 41.0, 42.0, 42.0, 37.0, 38.0, 39.0, 36.0, 50.0, 42.0, 38.0, 29.0, 29.0, 30.0, 31.0, 24.0, 23.0, 26.0, 22.0, 23.0, 14.0, 19.0, 14.0, 19.0, 11.0, 8.0, 9.0, 5.0, 4.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-7.52734375, -7.30157470703125, -7.0758056640625, -6.85003662109375, -6.624267578125, -6.39849853515625, -6.1727294921875, -5.94696044921875, -5.72119140625, -5.49542236328125, -5.2696533203125, -5.04388427734375, -4.818115234375, -4.59234619140625, -4.3665771484375, -4.14080810546875, -3.9150390625, -3.68927001953125, -3.4635009765625, -3.23773193359375, -3.011962890625, -2.78619384765625, -2.5604248046875, -2.33465576171875, -2.10888671875, -1.88311767578125, -1.6573486328125, -1.43157958984375, -1.205810546875, -0.98004150390625, -0.7542724609375, -0.52850341796875, -0.302734375, -0.07696533203125, 0.1488037109375, 0.37457275390625, 0.600341796875, 0.82611083984375, 1.0518798828125, 1.27764892578125, 1.50341796875, 1.72918701171875, 1.9549560546875, 2.18072509765625, 2.406494140625, 2.63226318359375, 2.8580322265625, 3.08380126953125, 3.3095703125, 3.53533935546875, 3.7611083984375, 3.98687744140625, 4.212646484375, 4.43841552734375, 4.6641845703125, 4.88995361328125, 5.11572265625, 5.34149169921875, 5.5672607421875, 5.79302978515625, 6.018798828125, 6.24456787109375, 6.4703369140625, 6.69610595703125, 6.921875]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 5.0, 10.0, 10.0, 12.0, 17.0, 21.0, 32.0, 43.0, 68.0, 89.0, 136.0, 199.0, 272.0, 428.0, 654.0, 955.0, 1425.0, 2128.0, 3377.0, 5258.0, 8381.0, 14030.0, 24099.0, 42622.0, 79368.0, 154592.0, 316321.0, 658469.0, 1134154.0, 874204.0, 430051.0, 206840.0, 103619.0, 55543.0, 30258.0, 17527.0, 10656.0, 6453.0, 4048.0, 2611.0, 1755.0, 1117.0, 756.0, 558.0, 406.0, 250.0, 152.0, 112.0, 72.0, 53.0, 35.0, 13.0, 10.0, 7.0, 8.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0], "bins": [-17.90625, -17.341552734375, -16.77685546875, -16.212158203125, -15.6474609375, -15.082763671875, -14.51806640625, -13.953369140625, -13.388671875, -12.823974609375, -12.25927734375, -11.694580078125, -11.1298828125, -10.565185546875, -10.00048828125, -9.435791015625, -8.87109375, -8.306396484375, -7.74169921875, -7.177001953125, -6.6123046875, -6.047607421875, -5.48291015625, -4.918212890625, -4.353515625, -3.788818359375, -3.22412109375, -2.659423828125, -2.0947265625, -1.530029296875, -0.96533203125, -0.400634765625, 0.1640625, 0.728759765625, 1.29345703125, 1.858154296875, 2.4228515625, 2.987548828125, 3.55224609375, 4.116943359375, 4.681640625, 5.246337890625, 5.81103515625, 6.375732421875, 6.9404296875, 7.505126953125, 8.06982421875, 8.634521484375, 9.19921875, 9.763916015625, 10.32861328125, 10.893310546875, 11.4580078125, 12.022705078125, 12.58740234375, 13.152099609375, 13.716796875, 14.281494140625, 14.84619140625, 15.410888671875, 15.9755859375, 16.540283203125, 17.10498046875, 17.669677734375, 18.234375]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 4.0, 3.0, 7.0, 8.0, 11.0, 13.0, 16.0, 27.0, 42.0, 40.0, 59.0, 77.0, 93.0, 123.0, 158.0, 170.0, 238.0, 276.0, 320.0, 351.0, 382.0, 321.0, 279.0, 211.0, 179.0, 148.0, 114.0, 93.0, 100.0, 50.0, 47.0, 31.0, 14.0, 15.0, 12.0, 8.0, 9.0, 10.0, 3.0, 6.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.984375, -4.7998046875, -4.615234375, -4.4306640625, -4.24609375, -4.0615234375, -3.876953125, -3.6923828125, -3.5078125, -3.3232421875, -3.138671875, -2.9541015625, -2.76953125, -2.5849609375, -2.400390625, -2.2158203125, -2.03125, -1.8466796875, -1.662109375, -1.4775390625, -1.29296875, -1.1083984375, -0.923828125, -0.7392578125, -0.5546875, -0.3701171875, -0.185546875, -0.0009765625, 0.18359375, 0.3681640625, 0.552734375, 0.7373046875, 0.921875, 1.1064453125, 1.291015625, 1.4755859375, 1.66015625, 1.8447265625, 2.029296875, 2.2138671875, 2.3984375, 2.5830078125, 2.767578125, 2.9521484375, 3.13671875, 3.3212890625, 3.505859375, 3.6904296875, 3.875, 4.0595703125, 4.244140625, 4.4287109375, 4.61328125, 4.7978515625, 4.982421875, 5.1669921875, 5.3515625, 5.5361328125, 5.720703125, 5.9052734375, 6.08984375, 6.2744140625, 6.458984375, 6.6435546875, 6.828125]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 6.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 3.0, 8.0, 11.0, 10.0, 25.0, 22.0, 32.0, 55.0, 66.0, 81.0, 104.0, 109.0, 105.0, 86.0, 64.0, 48.0, 39.0, 36.0, 27.0, 17.0, 17.0, 4.0, 5.0, 3.0, 2.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-30.340173721313477, -29.491859436035156, -28.64354705810547, -27.79523277282715, -26.946918487548828, -26.09860610961914, -25.25029182434082, -24.4019775390625, -23.553665161132812, -22.705350875854492, -21.857038497924805, -21.008724212646484, -20.160409927368164, -19.312097549438477, -18.463783264160156, -17.61547088623047, -16.767154693603516, -15.918841361999512, -15.070527076721191, -14.222213745117188, -13.373900413513184, -12.52558708190918, -11.67727279663086, -10.828959465026855, -9.980646133422852, -9.132332801818848, -8.284018516540527, -7.435705184936523, -6.5873918533325195, -5.739078044891357, -4.890764236450195, -4.042450904846191, -3.1941375732421875, -2.3458240032196045, -1.497510313987732, -0.6491966247558594, 0.19911694526672363, 1.0474305152893066, 1.8957443237304688, 2.7440576553344727, 3.5923714637756348, 4.440685272216797, 5.288998603820801, 6.137312412261963, 6.985626220703125, 7.833939552307129, 8.682252883911133, 9.530567169189453, 10.378880500793457, 11.227193832397461, 12.075508117675781, 12.923821449279785, 13.772134780883789, 14.62044906616211, 15.468762397766113, 16.317075729370117, 17.165390014648438, 18.013704299926758, 18.862016677856445, 19.710330963134766, 20.558645248413086, 21.406957626342773, 22.255271911621094, 23.10358428955078, 23.9518985748291]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 7.0, 4.0, 9.0, 7.0, 7.0, 7.0, 9.0, 14.0, 13.0, 28.0, 18.0, 17.0, 21.0, 28.0, 28.0, 38.0, 33.0, 31.0, 34.0, 42.0, 42.0, 34.0, 38.0, 33.0, 52.0, 23.0, 29.0, 35.0, 35.0, 38.0, 17.0, 30.0, 38.0, 23.0, 24.0, 13.0, 20.0, 20.0, 18.0, 11.0, 11.0, 9.0, 6.0, 5.0, 6.0, 7.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-10.113921165466309, -9.834427833557129, -9.55493450164795, -9.27544116973877, -8.99594783782959, -8.71645450592041, -8.43696117401123, -8.157466888427734, -7.877974033355713, -7.598480701446533, -7.3189873695373535, -7.039494037628174, -6.760000228881836, -6.480506896972656, -6.201013565063477, -5.921520233154297, -5.642026901245117, -5.3625335693359375, -5.083040237426758, -4.803546905517578, -4.524053573608398, -4.244560241699219, -3.965066432952881, -3.685573101043701, -3.4060797691345215, -3.126586437225342, -2.847093105316162, -2.5675995349884033, -2.2881062030792236, -2.008612871170044, -1.7291194200515747, -1.4496259689331055, -1.1701335906982422, -0.8906401991844177, -0.6111468076705933, -0.3316534161567688, -0.052160024642944336, 0.22733330726623535, 0.5068267583847046, 0.7863202095031738, 1.0658135414123535, 1.3453068733215332, 1.6248003244400024, 1.9042937755584717, 2.1837871074676514, 2.463280439376831, 2.74277400970459, 3.0222673416137695, 3.301760673522949, 3.581254005432129, 3.8607473373413086, 4.140240669250488, 4.419734001159668, 4.699227333068848, 4.9787211418151855, 5.258214473724365, 5.537707805633545, 5.817201137542725, 6.096694469451904, 6.376187801361084, 6.655681610107422, 6.935174942016602, 7.214668273925781, 7.494161605834961, 7.773654937744141]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 4.0, 6.0, 7.0, 16.0, 24.0, 19.0, 33.0, 35.0, 57.0, 80.0, 121.0, 217.0, 307.0, 459.0, 718.0, 1131.0, 2037.0, 3921.0, 8432.0, 20570.0, 55689.0, 161836.0, 354161.0, 274708.0, 101690.0, 35527.0, 13694.0, 5890.0, 2883.0, 1568.0, 935.0, 630.0, 371.0, 214.0, 182.0, 129.0, 66.0, 59.0, 44.0, 25.0, 21.0, 11.0, 12.0, 13.0, 4.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.96875, -15.46630859375, -14.9638671875, -14.46142578125, -13.958984375, -13.45654296875, -12.9541015625, -12.45166015625, -11.94921875, -11.44677734375, -10.9443359375, -10.44189453125, -9.939453125, -9.43701171875, -8.9345703125, -8.43212890625, -7.9296875, -7.42724609375, -6.9248046875, -6.42236328125, -5.919921875, -5.41748046875, -4.9150390625, -4.41259765625, -3.91015625, -3.40771484375, -2.9052734375, -2.40283203125, -1.900390625, -1.39794921875, -0.8955078125, -0.39306640625, 0.109375, 0.61181640625, 1.1142578125, 1.61669921875, 2.119140625, 2.62158203125, 3.1240234375, 3.62646484375, 4.12890625, 4.63134765625, 5.1337890625, 5.63623046875, 6.138671875, 6.64111328125, 7.1435546875, 7.64599609375, 8.1484375, 8.65087890625, 9.1533203125, 9.65576171875, 10.158203125, 10.66064453125, 11.1630859375, 11.66552734375, 12.16796875, 12.67041015625, 13.1728515625, 13.67529296875, 14.177734375, 14.68017578125, 15.1826171875, 15.68505859375, 16.1875]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 5.0, 5.0, 5.0, 4.0, 7.0, 3.0, 8.0, 13.0, 17.0, 18.0, 12.0, 13.0, 21.0, 27.0, 28.0, 27.0, 33.0, 28.0, 38.0, 43.0, 39.0, 39.0, 34.0, 30.0, 32.0, 35.0, 40.0, 31.0, 44.0, 31.0, 32.0, 36.0, 28.0, 37.0, 19.0, 18.0, 24.0, 16.0, 18.0, 18.0, 11.0, 11.0, 7.0, 2.0, 6.0, 4.0, 3.0, 6.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-10.5625, -10.2435302734375, -9.924560546875, -9.6055908203125, -9.28662109375, -8.9676513671875, -8.648681640625, -8.3297119140625, -8.0107421875, -7.6917724609375, -7.372802734375, -7.0538330078125, -6.73486328125, -6.4158935546875, -6.096923828125, -5.7779541015625, -5.458984375, -5.1400146484375, -4.821044921875, -4.5020751953125, -4.18310546875, -3.8641357421875, -3.545166015625, -3.2261962890625, -2.9072265625, -2.5882568359375, -2.269287109375, -1.9503173828125, -1.63134765625, -1.3123779296875, -0.993408203125, -0.6744384765625, -0.35546875, -0.0364990234375, 0.282470703125, 0.6014404296875, 0.92041015625, 1.2393798828125, 1.558349609375, 1.8773193359375, 2.1962890625, 2.5152587890625, 2.834228515625, 3.1531982421875, 3.47216796875, 3.7911376953125, 4.110107421875, 4.4290771484375, 4.748046875, 5.0670166015625, 5.385986328125, 5.7049560546875, 6.02392578125, 6.3428955078125, 6.661865234375, 6.9808349609375, 7.2998046875, 7.6187744140625, 7.937744140625, 8.2567138671875, 8.57568359375, 8.8946533203125, 9.213623046875, 9.5325927734375, 9.8515625]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 2.0, 7.0, 7.0, 11.0, 15.0, 19.0, 29.0, 28.0, 35.0, 41.0, 79.0, 84.0, 129.0, 199.0, 263.0, 428.0, 720.0, 1245.0, 2476.0, 4868.0, 11569.0, 32223.0, 112125.0, 389216.0, 348207.0, 96300.0, 28030.0, 10347.0, 4429.0, 2203.0, 1209.0, 663.0, 418.0, 275.0, 178.0, 135.0, 76.0, 78.0, 49.0, 44.0, 25.0, 13.0, 13.0, 13.0, 11.0, 7.0, 4.0, 4.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-21.796875, -21.114501953125, -20.43212890625, -19.749755859375, -19.0673828125, -18.385009765625, -17.70263671875, -17.020263671875, -16.337890625, -15.655517578125, -14.97314453125, -14.290771484375, -13.6083984375, -12.926025390625, -12.24365234375, -11.561279296875, -10.87890625, -10.196533203125, -9.51416015625, -8.831787109375, -8.1494140625, -7.467041015625, -6.78466796875, -6.102294921875, -5.419921875, -4.737548828125, -4.05517578125, -3.372802734375, -2.6904296875, -2.008056640625, -1.32568359375, -0.643310546875, 0.0390625, 0.721435546875, 1.40380859375, 2.086181640625, 2.7685546875, 3.450927734375, 4.13330078125, 4.815673828125, 5.498046875, 6.180419921875, 6.86279296875, 7.545166015625, 8.2275390625, 8.909912109375, 9.59228515625, 10.274658203125, 10.95703125, 11.639404296875, 12.32177734375, 13.004150390625, 13.6865234375, 14.368896484375, 15.05126953125, 15.733642578125, 16.416015625, 17.098388671875, 17.78076171875, 18.463134765625, 19.1455078125, 19.827880859375, 20.51025390625, 21.192626953125, 21.875]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 7.0, 3.0, 2.0, 8.0, 5.0, 8.0, 12.0, 14.0, 13.0, 18.0, 20.0, 25.0, 29.0, 20.0, 28.0, 35.0, 32.0, 37.0, 31.0, 42.0, 42.0, 41.0, 36.0, 38.0, 36.0, 35.0, 29.0, 42.0, 42.0, 30.0, 33.0, 34.0, 28.0, 23.0, 18.0, 15.0, 17.0, 13.0, 9.0, 10.0, 6.0, 6.0, 7.0, 4.0, 10.0, 1.0, 4.0, 3.0, 4.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.703125, -6.50433349609375, -6.3055419921875, -6.10675048828125, -5.907958984375, -5.70916748046875, -5.5103759765625, -5.31158447265625, -5.11279296875, -4.91400146484375, -4.7152099609375, -4.51641845703125, -4.317626953125, -4.11883544921875, -3.9200439453125, -3.72125244140625, -3.5224609375, -3.32366943359375, -3.1248779296875, -2.92608642578125, -2.727294921875, -2.52850341796875, -2.3297119140625, -2.13092041015625, -1.93212890625, -1.73333740234375, -1.5345458984375, -1.33575439453125, -1.136962890625, -0.93817138671875, -0.7393798828125, -0.54058837890625, -0.341796875, -0.14300537109375, 0.0557861328125, 0.25457763671875, 0.453369140625, 0.65216064453125, 0.8509521484375, 1.04974365234375, 1.24853515625, 1.44732666015625, 1.6461181640625, 1.84490966796875, 2.043701171875, 2.24249267578125, 2.4412841796875, 2.64007568359375, 2.8388671875, 3.03765869140625, 3.2364501953125, 3.43524169921875, 3.634033203125, 3.83282470703125, 4.0316162109375, 4.23040771484375, 4.42919921875, 4.62799072265625, 4.8267822265625, 5.02557373046875, 5.224365234375, 5.42315673828125, 5.6219482421875, 5.82073974609375, 6.01953125]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 5.0, 5.0, 9.0, 11.0, 25.0, 19.0, 28.0, 31.0, 47.0, 72.0, 109.0, 131.0, 196.0, 245.0, 357.0, 489.0, 776.0, 1097.0, 1628.0, 2517.0, 4584.0, 12430.0, 135020.0, 801301.0, 67327.0, 8963.0, 3882.0, 2328.0, 1481.0, 1022.0, 667.0, 482.0, 366.0, 255.0, 158.0, 140.0, 91.0, 75.0, 61.0, 34.0, 27.0, 9.0, 18.0, 4.0, 8.0, 10.0, 4.0, 6.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.296875, -19.670166015625, -19.04345703125, -18.416748046875, -17.7900390625, -17.163330078125, -16.53662109375, -15.909912109375, -15.283203125, -14.656494140625, -14.02978515625, -13.403076171875, -12.7763671875, -12.149658203125, -11.52294921875, -10.896240234375, -10.26953125, -9.642822265625, -9.01611328125, -8.389404296875, -7.7626953125, -7.135986328125, -6.50927734375, -5.882568359375, -5.255859375, -4.629150390625, -4.00244140625, -3.375732421875, -2.7490234375, -2.122314453125, -1.49560546875, -0.868896484375, -0.2421875, 0.384521484375, 1.01123046875, 1.637939453125, 2.2646484375, 2.891357421875, 3.51806640625, 4.144775390625, 4.771484375, 5.398193359375, 6.02490234375, 6.651611328125, 7.2783203125, 7.905029296875, 8.53173828125, 9.158447265625, 9.78515625, 10.411865234375, 11.03857421875, 11.665283203125, 12.2919921875, 12.918701171875, 13.54541015625, 14.172119140625, 14.798828125, 15.425537109375, 16.05224609375, 16.678955078125, 17.3056640625, 17.932373046875, 18.55908203125, 19.185791015625, 19.8125]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 9.0, 8.0, 35.0, 82.0, 229.0, 343.0, 174.0, 75.0, 20.0, 7.0, 3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0016126632690429688, -0.0015612393617630005, -0.0015098154544830322, -0.001458391547203064, -0.0014069676399230957, -0.0013555437326431274, -0.0013041198253631592, -0.001252695918083191, -0.0012012720108032227, -0.0011498481035232544, -0.0010984241962432861, -0.0010470002889633179, -0.0009955763816833496, -0.0009441524744033813, -0.0008927285671234131, -0.0008413046598434448, -0.0007898807525634766, -0.0007384568452835083, -0.00068703293800354, -0.0006356090307235718, -0.0005841851234436035, -0.0005327612161636353, -0.000481337308883667, -0.00042991340160369873, -0.00037848949432373047, -0.0003270655870437622, -0.00027564167976379395, -0.00022421777248382568, -0.00017279386520385742, -0.00012136995792388916, -6.99460506439209e-05, -1.8522143363952637e-05, 3.2901763916015625e-05, 8.432567119598389e-05, 0.00013574957847595215, 0.0001871734857559204, 0.00023859739303588867, 0.00029002130031585693, 0.0003414452075958252, 0.00039286911487579346, 0.0004442930221557617, 0.00049571692943573, 0.0005471408367156982, 0.0005985647439956665, 0.0006499886512756348, 0.000701412558555603, 0.0007528364658355713, 0.0008042603731155396, 0.0008556842803955078, 0.0009071081876754761, 0.0009585320949554443, 0.0010099560022354126, 0.0010613799095153809, 0.0011128038167953491, 0.0011642277240753174, 0.0012156516313552856, 0.001267075538635254, 0.0013184994459152222, 0.0013699233531951904, 0.0014213472604751587, 0.001472771167755127, 0.0015241950750350952, 0.0015756189823150635, 0.0016270428895950317, 0.001678466796875]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 6.0, 4.0, 6.0, 15.0, 24.0, 30.0, 34.0, 48.0, 67.0, 76.0, 147.0, 151.0, 218.0, 289.0, 387.0, 522.0, 686.0, 996.0, 1255.0, 1918.0, 2628.0, 3989.0, 7384.0, 25360.0, 162974.0, 598512.0, 190508.0, 28448.0, 7939.0, 4161.0, 2720.0, 1862.0, 1417.0, 1004.0, 687.0, 567.0, 412.0, 259.0, 234.0, 169.0, 123.0, 75.0, 66.0, 68.0, 30.0, 24.0, 24.0, 16.0, 6.0, 7.0, 9.0, 2.0, 1.0, 2.0, 1.0], "bins": [-13.765625, -13.3670654296875, -12.968505859375, -12.5699462890625, -12.17138671875, -11.7728271484375, -11.374267578125, -10.9757080078125, -10.5771484375, -10.1785888671875, -9.780029296875, -9.3814697265625, -8.98291015625, -8.5843505859375, -8.185791015625, -7.7872314453125, -7.388671875, -6.9901123046875, -6.591552734375, -6.1929931640625, -5.79443359375, -5.3958740234375, -4.997314453125, -4.5987548828125, -4.2001953125, -3.8016357421875, -3.403076171875, -3.0045166015625, -2.60595703125, -2.2073974609375, -1.808837890625, -1.4102783203125, -1.01171875, -0.6131591796875, -0.214599609375, 0.1839599609375, 0.58251953125, 0.9810791015625, 1.379638671875, 1.7781982421875, 2.1767578125, 2.5753173828125, 2.973876953125, 3.3724365234375, 3.77099609375, 4.1695556640625, 4.568115234375, 4.9666748046875, 5.365234375, 5.7637939453125, 6.162353515625, 6.5609130859375, 6.95947265625, 7.3580322265625, 7.756591796875, 8.1551513671875, 8.5537109375, 8.9522705078125, 9.350830078125, 9.7493896484375, 10.14794921875, 10.5465087890625, 10.945068359375, 11.3436279296875, 11.7421875]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 5.0, 10.0, 14.0, 27.0, 39.0, 88.0, 101.0, 159.0, 154.0, 151.0, 90.0, 55.0, 41.0, 24.0, 14.0, 6.0, 2.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.73046875, -2.645843505859375, -2.56121826171875, -2.476593017578125, -2.3919677734375, -2.307342529296875, -2.22271728515625, -2.138092041015625, -2.053466796875, -1.968841552734375, -1.88421630859375, -1.799591064453125, -1.7149658203125, -1.630340576171875, -1.54571533203125, -1.461090087890625, -1.37646484375, -1.291839599609375, -1.20721435546875, -1.122589111328125, -1.0379638671875, -0.953338623046875, -0.86871337890625, -0.784088134765625, -0.699462890625, -0.614837646484375, -0.53021240234375, -0.445587158203125, -0.3609619140625, -0.276336669921875, -0.19171142578125, -0.107086181640625, -0.0224609375, 0.062164306640625, 0.14678955078125, 0.231414794921875, 0.3160400390625, 0.400665283203125, 0.48529052734375, 0.569915771484375, 0.654541015625, 0.739166259765625, 0.82379150390625, 0.908416748046875, 0.9930419921875, 1.077667236328125, 1.16229248046875, 1.246917724609375, 1.33154296875, 1.416168212890625, 1.50079345703125, 1.585418701171875, 1.6700439453125, 1.754669189453125, 1.83929443359375, 1.923919677734375, 2.008544921875, 2.093170166015625, 2.17779541015625, 2.262420654296875, 2.3470458984375, 2.431671142578125, 2.51629638671875, 2.600921630859375, 2.685546875]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 4.0, 9.0, 6.0, 8.0, 8.0, 15.0, 9.0, 33.0, 32.0, 46.0, 77.0, 73.0, 104.0, 115.0, 108.0, 81.0, 62.0, 52.0, 34.0, 33.0, 32.0, 17.0, 11.0, 8.0, 6.0, 5.0, 2.0, 3.0, 3.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-30.375194549560547, -29.5250244140625, -28.674854278564453, -27.824682235717773, -26.974512100219727, -26.12434196472168, -25.274169921875, -24.423999786376953, -23.573829650878906, -22.72365951538086, -21.873489379882812, -21.023317337036133, -20.173147201538086, -19.32297706604004, -18.47280502319336, -17.622634887695312, -16.772464752197266, -15.922294616699219, -15.072123527526855, -14.221952438354492, -13.371782302856445, -12.521612167358398, -11.671441078186035, -10.821269989013672, -9.971099853515625, -9.120929718017578, -8.270758628845215, -7.42058801651001, -6.570417404174805, -5.7202467918396, -4.8700761795043945, -4.0199055671691895, -3.1697330474853516, -2.3195624351501465, -1.4693918228149414, -0.6192212104797363, 0.23094940185546875, 1.0811200141906738, 1.931290626525879, 2.781461238861084, 3.631631851196289, 4.481802463531494, 5.331973075866699, 6.182143688201904, 7.032314300537109, 7.8824849128723145, 8.73265552520752, 9.582826614379883, 10.43299674987793, 11.283166885375977, 12.13333797454834, 12.983509063720703, 13.83367919921875, 14.683849334716797, 15.53402042388916, 16.384191513061523, 17.23436164855957, 18.084531784057617, 18.934703826904297, 19.784873962402344, 20.63504409790039, 21.485214233398438, 22.335384368896484, 23.185556411743164, 24.03572654724121]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 6.0, 3.0, 10.0, 9.0, 7.0, 7.0, 8.0, 11.0, 19.0, 18.0, 23.0, 24.0, 17.0, 19.0, 25.0, 39.0, 39.0, 36.0, 39.0, 37.0, 35.0, 38.0, 33.0, 48.0, 32.0, 39.0, 24.0, 29.0, 34.0, 36.0, 27.0, 33.0, 23.0, 28.0, 30.0, 14.0, 18.0, 16.0, 19.0, 15.0, 10.0, 7.0, 9.0, 8.0, 4.0, 6.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.759055137634277, -9.482192039489746, -9.205327987670898, -8.928464889526367, -8.651601791381836, -8.374738693237305, -8.097875595092773, -7.821011543273926, -7.5441484451293945, -7.267285346984863, -6.990421772003174, -6.713558197021484, -6.436695098876953, -6.159832000732422, -5.882968425750732, -5.606104850769043, -5.329241752624512, -5.0523786544799805, -4.775515079498291, -4.498651504516602, -4.22178840637207, -3.94492506980896, -3.6680617332458496, -3.3911983966827393, -3.114335060119629, -2.8374717235565186, -2.560608386993408, -2.283745050430298, -2.0068817138671875, -1.7300183773040771, -1.4531550407409668, -1.1762917041778564, -0.8994288444519043, -0.622565507888794, -0.3457021713256836, -0.06883883476257324, 0.2080245018005371, 0.48488783836364746, 0.7617511749267578, 1.0386145114898682, 1.3154778480529785, 1.5923411846160889, 1.8692045211791992, 2.1460678577423096, 2.42293119430542, 2.6997945308685303, 2.9766578674316406, 3.253521203994751, 3.5303845405578613, 3.8072478771209717, 4.084111213684082, 4.360974311828613, 4.637837886810303, 4.914701461791992, 5.191564559936523, 5.468427658081055, 5.745291233062744, 6.022154808044434, 6.299017906188965, 6.575881004333496, 6.8527445793151855, 7.129608154296875, 7.406471252441406, 7.6833343505859375, 7.960197925567627]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 4.0, 6.0, 4.0, 4.0, 13.0, 16.0, 23.0, 46.0, 47.0, 77.0, 122.0, 192.0, 324.0, 530.0, 827.0, 1321.0, 2094.0, 3631.0, 5817.0, 9615.0, 16236.0, 26571.0, 42992.0, 68960.0, 104640.0, 143871.0, 164709.0, 149578.0, 111097.0, 74558.0, 46901.0, 29212.0, 17540.0, 10652.0, 6355.0, 3863.0, 2361.0, 1460.0, 864.0, 520.0, 340.0, 223.0, 130.0, 75.0, 37.0, 38.0, 27.0, 21.0, 9.0, 7.0, 4.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.8671875, -11.43701171875, -11.0068359375, -10.57666015625, -10.146484375, -9.71630859375, -9.2861328125, -8.85595703125, -8.42578125, -7.99560546875, -7.5654296875, -7.13525390625, -6.705078125, -6.27490234375, -5.8447265625, -5.41455078125, -4.984375, -4.55419921875, -4.1240234375, -3.69384765625, -3.263671875, -2.83349609375, -2.4033203125, -1.97314453125, -1.54296875, -1.11279296875, -0.6826171875, -0.25244140625, 0.177734375, 0.60791015625, 1.0380859375, 1.46826171875, 1.8984375, 2.32861328125, 2.7587890625, 3.18896484375, 3.619140625, 4.04931640625, 4.4794921875, 4.90966796875, 5.33984375, 5.77001953125, 6.2001953125, 6.63037109375, 7.060546875, 7.49072265625, 7.9208984375, 8.35107421875, 8.78125, 9.21142578125, 9.6416015625, 10.07177734375, 10.501953125, 10.93212890625, 11.3623046875, 11.79248046875, 12.22265625, 12.65283203125, 13.0830078125, 13.51318359375, 13.943359375, 14.37353515625, 14.8037109375, 15.23388671875, 15.6640625]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 5.0, 10.0, 9.0, 4.0, 9.0, 14.0, 15.0, 18.0, 23.0, 20.0, 25.0, 41.0, 31.0, 35.0, 44.0, 34.0, 32.0, 40.0, 61.0, 54.0, 38.0, 38.0, 49.0, 32.0, 42.0, 36.0, 33.0, 26.0, 27.0, 34.0, 20.0, 18.0, 18.0, 13.0, 15.0, 14.0, 9.0, 7.0, 7.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.2109375, -12.8529052734375, -12.494873046875, -12.1368408203125, -11.77880859375, -11.4207763671875, -11.062744140625, -10.7047119140625, -10.3466796875, -9.9886474609375, -9.630615234375, -9.2725830078125, -8.91455078125, -8.5565185546875, -8.198486328125, -7.8404541015625, -7.482421875, -7.1243896484375, -6.766357421875, -6.4083251953125, -6.05029296875, -5.6922607421875, -5.334228515625, -4.9761962890625, -4.6181640625, -4.2601318359375, -3.902099609375, -3.5440673828125, -3.18603515625, -2.8280029296875, -2.469970703125, -2.1119384765625, -1.75390625, -1.3958740234375, -1.037841796875, -0.6798095703125, -0.32177734375, 0.0362548828125, 0.394287109375, 0.7523193359375, 1.1103515625, 1.4683837890625, 1.826416015625, 2.1844482421875, 2.54248046875, 2.9005126953125, 3.258544921875, 3.6165771484375, 3.974609375, 4.3326416015625, 4.690673828125, 5.0487060546875, 5.40673828125, 5.7647705078125, 6.122802734375, 6.4808349609375, 6.8388671875, 7.1968994140625, 7.554931640625, 7.9129638671875, 8.27099609375, 8.6290283203125, 8.987060546875, 9.3450927734375, 9.703125]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 9.0, 12.0, 29.0, 38.0, 51.0, 88.0, 119.0, 161.0, 266.0, 425.0, 674.0, 1095.0, 1707.0, 2715.0, 4535.0, 7550.0, 12685.0, 21700.0, 37079.0, 63363.0, 103041.0, 150483.0, 179358.0, 162906.0, 116654.0, 73974.0, 43786.0, 26189.0, 15249.0, 8697.0, 5255.0, 3184.0, 1981.0, 1297.0, 756.0, 536.0, 319.0, 224.0, 134.0, 75.0, 62.0, 34.0, 19.0, 15.0, 14.0, 7.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.625, -14.1318359375, -13.638671875, -13.1455078125, -12.65234375, -12.1591796875, -11.666015625, -11.1728515625, -10.6796875, -10.1865234375, -9.693359375, -9.2001953125, -8.70703125, -8.2138671875, -7.720703125, -7.2275390625, -6.734375, -6.2412109375, -5.748046875, -5.2548828125, -4.76171875, -4.2685546875, -3.775390625, -3.2822265625, -2.7890625, -2.2958984375, -1.802734375, -1.3095703125, -0.81640625, -0.3232421875, 0.169921875, 0.6630859375, 1.15625, 1.6494140625, 2.142578125, 2.6357421875, 3.12890625, 3.6220703125, 4.115234375, 4.6083984375, 5.1015625, 5.5947265625, 6.087890625, 6.5810546875, 7.07421875, 7.5673828125, 8.060546875, 8.5537109375, 9.046875, 9.5400390625, 10.033203125, 10.5263671875, 11.01953125, 11.5126953125, 12.005859375, 12.4990234375, 12.9921875, 13.4853515625, 13.978515625, 14.4716796875, 14.96484375, 15.4580078125, 15.951171875, 16.4443359375, 16.9375]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 5.0, 4.0, 3.0, 8.0, 8.0, 7.0, 9.0, 12.0, 17.0, 13.0, 22.0, 17.0, 29.0, 43.0, 35.0, 24.0, 32.0, 39.0, 37.0, 52.0, 50.0, 34.0, 34.0, 46.0, 35.0, 44.0, 31.0, 45.0, 42.0, 28.0, 18.0, 26.0, 29.0, 24.0, 14.0, 23.0, 13.0, 10.0, 8.0, 6.0, 7.0, 7.0, 5.0, 3.0, 1.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-7.4296875, -7.21636962890625, -7.0030517578125, -6.78973388671875, -6.576416015625, -6.36309814453125, -6.1497802734375, -5.93646240234375, -5.72314453125, -5.50982666015625, -5.2965087890625, -5.08319091796875, -4.869873046875, -4.65655517578125, -4.4432373046875, -4.22991943359375, -4.0166015625, -3.80328369140625, -3.5899658203125, -3.37664794921875, -3.163330078125, -2.95001220703125, -2.7366943359375, -2.52337646484375, -2.31005859375, -2.09674072265625, -1.8834228515625, -1.67010498046875, -1.456787109375, -1.24346923828125, -1.0301513671875, -0.81683349609375, -0.603515625, -0.39019775390625, -0.1768798828125, 0.03643798828125, 0.249755859375, 0.46307373046875, 0.6763916015625, 0.88970947265625, 1.10302734375, 1.31634521484375, 1.5296630859375, 1.74298095703125, 1.956298828125, 2.16961669921875, 2.3829345703125, 2.59625244140625, 2.8095703125, 3.02288818359375, 3.2362060546875, 3.44952392578125, 3.662841796875, 3.87615966796875, 4.0894775390625, 4.30279541015625, 4.51611328125, 4.72943115234375, 4.9427490234375, 5.15606689453125, 5.369384765625, 5.58270263671875, 5.7960205078125, 6.00933837890625, 6.22265625]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 9.0, 11.0, 12.0, 23.0, 27.0, 37.0, 81.0, 88.0, 112.0, 152.0, 241.0, 401.0, 594.0, 812.0, 1250.0, 1949.0, 3089.0, 5005.0, 8278.0, 13986.0, 24963.0, 45288.0, 86016.0, 158884.0, 236117.0, 203224.0, 116700.0, 61830.0, 33101.0, 18418.0, 10615.0, 6238.0, 3775.0, 2400.0, 1580.0, 1029.0, 708.0, 475.0, 311.0, 227.0, 139.0, 102.0, 61.0, 58.0, 43.0, 35.0, 23.0, 14.0, 6.0, 7.0, 9.0, 5.0, 0.0, 5.0], "bins": [-8.4140625, -8.171875, -7.9296875, -7.6875, -7.4453125, -7.203125, -6.9609375, -6.71875, -6.4765625, -6.234375, -5.9921875, -5.75, -5.5078125, -5.265625, -5.0234375, -4.78125, -4.5390625, -4.296875, -4.0546875, -3.8125, -3.5703125, -3.328125, -3.0859375, -2.84375, -2.6015625, -2.359375, -2.1171875, -1.875, -1.6328125, -1.390625, -1.1484375, -0.90625, -0.6640625, -0.421875, -0.1796875, 0.0625, 0.3046875, 0.546875, 0.7890625, 1.03125, 1.2734375, 1.515625, 1.7578125, 2.0, 2.2421875, 2.484375, 2.7265625, 2.96875, 3.2109375, 3.453125, 3.6953125, 3.9375, 4.1796875, 4.421875, 4.6640625, 4.90625, 5.1484375, 5.390625, 5.6328125, 5.875, 6.1171875, 6.359375, 6.6015625, 6.84375, 7.0859375]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 5.0, 8.0, 6.0, 6.0, 9.0, 10.0, 9.0, 12.0, 15.0, 30.0, 26.0, 43.0, 39.0, 61.0, 108.0, 98.0, 82.0, 87.0, 95.0, 56.0, 49.0, 28.0, 34.0, 16.0, 13.0, 15.0, 12.0, 8.0, 10.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011739730834960938, -0.0011376142501831055, -0.0011012554168701172, -0.001064896583557129, -0.0010285377502441406, -0.0009921789169311523, -0.0009558200836181641, -0.0009194612503051758, -0.0008831024169921875, -0.0008467435836791992, -0.0008103847503662109, -0.0007740259170532227, -0.0007376670837402344, -0.0007013082504272461, -0.0006649494171142578, -0.0006285905838012695, -0.0005922317504882812, -0.000555872917175293, -0.0005195140838623047, -0.0004831552505493164, -0.0004467964172363281, -0.00041043758392333984, -0.00037407875061035156, -0.0003377199172973633, -0.000301361083984375, -0.0002650022506713867, -0.00022864341735839844, -0.00019228458404541016, -0.00015592575073242188, -0.0001195669174194336, -8.320808410644531e-05, -4.684925079345703e-05, -1.049041748046875e-05, 2.586841583251953e-05, 6.222724914550781e-05, 9.85860824584961e-05, 0.00013494491577148438, 0.00017130374908447266, 0.00020766258239746094, 0.00024402141571044922, 0.0002803802490234375, 0.0003167390823364258, 0.00035309791564941406, 0.00038945674896240234, 0.0004258155822753906, 0.0004621744155883789, 0.0004985332489013672, 0.0005348920822143555, 0.0005712509155273438, 0.000607609748840332, 0.0006439685821533203, 0.0006803274154663086, 0.0007166862487792969, 0.0007530450820922852, 0.0007894039154052734, 0.0008257627487182617, 0.00086212158203125, 0.0008984804153442383, 0.0009348392486572266, 0.0009711980819702148, 0.0010075569152832031, 0.0010439157485961914, 0.0010802745819091797, 0.001116633415222168, 0.0011529922485351562]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 1.0, 8.0, 14.0, 12.0, 19.0, 34.0, 49.0, 44.0, 89.0, 131.0, 185.0, 284.0, 390.0, 599.0, 916.0, 1365.0, 2172.0, 3535.0, 5761.0, 9520.0, 16469.0, 28703.0, 52877.0, 96932.0, 168115.0, 223623.0, 185713.0, 110796.0, 60528.0, 32963.0, 18608.0, 10828.0, 6411.0, 3904.0, 2446.0, 1571.0, 974.0, 647.0, 422.0, 286.0, 195.0, 137.0, 105.0, 51.0, 48.0, 25.0, 18.0, 19.0, 10.0, 4.0, 5.0, 1.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.39453125, -6.1785888671875, -5.962646484375, -5.7467041015625, -5.53076171875, -5.3148193359375, -5.098876953125, -4.8829345703125, -4.6669921875, -4.4510498046875, -4.235107421875, -4.0191650390625, -3.80322265625, -3.5872802734375, -3.371337890625, -3.1553955078125, -2.939453125, -2.7235107421875, -2.507568359375, -2.2916259765625, -2.07568359375, -1.8597412109375, -1.643798828125, -1.4278564453125, -1.2119140625, -0.9959716796875, -0.780029296875, -0.5640869140625, -0.34814453125, -0.1322021484375, 0.083740234375, 0.2996826171875, 0.515625, 0.7315673828125, 0.947509765625, 1.1634521484375, 1.37939453125, 1.5953369140625, 1.811279296875, 2.0272216796875, 2.2431640625, 2.4591064453125, 2.675048828125, 2.8909912109375, 3.10693359375, 3.3228759765625, 3.538818359375, 3.7547607421875, 3.970703125, 4.1866455078125, 4.402587890625, 4.6185302734375, 4.83447265625, 5.0504150390625, 5.266357421875, 5.4822998046875, 5.6982421875, 5.9141845703125, 6.130126953125, 6.3460693359375, 6.56201171875, 6.7779541015625, 6.993896484375, 7.2098388671875, 7.42578125]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 9.0, 3.0, 5.0, 8.0, 7.0, 12.0, 7.0, 15.0, 15.0, 26.0, 35.0, 35.0, 29.0, 55.0, 47.0, 57.0, 85.0, 68.0, 73.0, 73.0, 63.0, 49.0, 34.0, 36.0, 36.0, 26.0, 20.0, 10.0, 13.0, 12.0, 14.0, 6.0, 6.0, 5.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6025390625, -1.5393218994140625, -1.476104736328125, -1.4128875732421875, -1.34967041015625, -1.2864532470703125, -1.223236083984375, -1.1600189208984375, -1.0968017578125, -1.0335845947265625, -0.970367431640625, -0.9071502685546875, -0.84393310546875, -0.7807159423828125, -0.717498779296875, -0.6542816162109375, -0.591064453125, -0.5278472900390625, -0.464630126953125, -0.4014129638671875, -0.33819580078125, -0.2749786376953125, -0.211761474609375, -0.1485443115234375, -0.0853271484375, -0.0221099853515625, 0.041107177734375, 0.1043243408203125, 0.16754150390625, 0.2307586669921875, 0.293975830078125, 0.3571929931640625, 0.42041015625, 0.4836273193359375, 0.546844482421875, 0.6100616455078125, 0.67327880859375, 0.7364959716796875, 0.799713134765625, 0.8629302978515625, 0.9261474609375, 0.9893646240234375, 1.052581787109375, 1.1157989501953125, 1.17901611328125, 1.2422332763671875, 1.305450439453125, 1.3686676025390625, 1.431884765625, 1.4951019287109375, 1.558319091796875, 1.6215362548828125, 1.68475341796875, 1.7479705810546875, 1.811187744140625, 1.8744049072265625, 1.9376220703125, 2.0008392333984375, 2.064056396484375, 2.1272735595703125, 2.19049072265625, 2.2537078857421875, 2.316925048828125, 2.3801422119140625, 2.443359375]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 6.0, 11.0, 12.0, 10.0, 13.0, 16.0, 32.0, 43.0, 50.0, 62.0, 76.0, 79.0, 76.0, 91.0, 76.0, 58.0, 60.0, 47.0, 45.0, 23.0, 30.0, 19.0, 13.0, 7.0, 9.0, 7.0, 7.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-25.13949203491211, -24.40159797668457, -23.66370391845703, -22.925809860229492, -22.187915802001953, -21.45001983642578, -20.712125778198242, -19.974231719970703, -19.236337661743164, -18.498443603515625, -17.760549545288086, -17.022655487060547, -16.284759521484375, -15.546866416931152, -14.808971405029297, -14.071077346801758, -13.333183288574219, -12.59528923034668, -11.85739517211914, -11.119500160217285, -10.381606101989746, -9.643712043762207, -8.905817031860352, -8.167922973632812, -7.430028915405273, -6.692134857177734, -5.954240322113037, -5.21634578704834, -4.478451728820801, -3.7405574321746826, -3.0026631355285645, -2.264768600463867, -1.526876449584961, -0.7889821529388428, -0.05108785629272461, 0.6868064403533936, 1.4247007369995117, 2.16259503364563, 2.900489330291748, 3.6383838653564453, 4.376277923583984, 5.114171981811523, 5.852066516876221, 6.589961051940918, 7.327855110168457, 8.065749168395996, 8.803644180297852, 9.54153823852539, 10.27943229675293, 11.017326354980469, 11.755220413208008, 12.493115425109863, 13.231009483337402, 13.968903541564941, 14.706798553466797, 15.444692611694336, 16.182586669921875, 16.920480728149414, 17.658374786376953, 18.396268844604492, 19.13416290283203, 19.872058868408203, 20.609952926635742, 21.34784698486328, 22.08574104309082]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 5.0, 1.0, 1.0, 2.0, 3.0, 9.0, 5.0, 14.0, 9.0, 10.0, 15.0, 17.0, 14.0, 21.0, 23.0, 23.0, 26.0, 39.0, 20.0, 37.0, 38.0, 28.0, 38.0, 46.0, 36.0, 37.0, 36.0, 31.0, 24.0, 44.0, 33.0, 34.0, 38.0, 26.0, 26.0, 30.0, 28.0, 22.0, 23.0, 20.0, 16.0, 12.0, 14.0, 10.0, 5.0, 11.0, 3.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.364797592163086, -8.079201698303223, -7.793605804443359, -7.508009910583496, -7.222414016723633, -6.9368181228637695, -6.651222229003906, -6.365626335144043, -6.08003044128418, -5.794434547424316, -5.508838653564453, -5.22324275970459, -4.937646865844727, -4.652050971984863, -4.366455078125, -4.080859184265137, -3.7952632904052734, -3.50966739654541, -3.224071502685547, -2.9384756088256836, -2.6528797149658203, -2.367283821105957, -2.0816879272460938, -1.7960920333862305, -1.5104961395263672, -1.224900245666504, -0.9393043518066406, -0.6537084579467773, -0.36811256408691406, -0.08251667022705078, 0.2030792236328125, 0.4886751174926758, 0.7742719650268555, 1.0598678588867188, 1.345463752746582, 1.6310596466064453, 1.9166555404663086, 2.202251434326172, 2.487847328186035, 2.7734432220458984, 3.0590391159057617, 3.344635009765625, 3.6302309036254883, 3.9158267974853516, 4.201422691345215, 4.487018585205078, 4.772614479064941, 5.058210372924805, 5.343806266784668, 5.629402160644531, 5.9149980545043945, 6.200593948364258, 6.486189842224121, 6.771785736083984, 7.057381629943848, 7.342977523803711, 7.628573417663574, 7.9141693115234375, 8.1997652053833, 8.485361099243164, 8.770956993103027, 9.05655288696289, 9.342148780822754, 9.627744674682617, 9.91334056854248]}, "gradients/decoder.bert.encoder.layer.6.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 2.0, 10.0, 12.0, 21.0, 28.0, 46.0, 59.0, 81.0, 140.0, 235.0, 319.0, 467.0, 846.0, 1245.0, 2060.0, 3485.0, 5831.0, 10521.0, 19676.0, 38580.0, 82272.0, 194879.0, 524960.0, 1326373.0, 1221086.0, 448406.0, 167891.0, 71534.0, 33666.0, 17124.0, 9360.0, 5170.0, 2984.0, 1772.0, 1121.0, 676.0, 434.0, 300.0, 165.0, 127.0, 93.0, 56.0, 46.0, 36.0, 25.0, 7.0, 21.0, 13.0, 9.0, 10.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-20.65625, -19.966064453125, -19.27587890625, -18.585693359375, -17.8955078125, -17.205322265625, -16.51513671875, -15.824951171875, -15.134765625, -14.444580078125, -13.75439453125, -13.064208984375, -12.3740234375, -11.683837890625, -10.99365234375, -10.303466796875, -9.61328125, -8.923095703125, -8.23291015625, -7.542724609375, -6.8525390625, -6.162353515625, -5.47216796875, -4.781982421875, -4.091796875, -3.401611328125, -2.71142578125, -2.021240234375, -1.3310546875, -0.640869140625, 0.04931640625, 0.739501953125, 1.4296875, 2.119873046875, 2.81005859375, 3.500244140625, 4.1904296875, 4.880615234375, 5.57080078125, 6.260986328125, 6.951171875, 7.641357421875, 8.33154296875, 9.021728515625, 9.7119140625, 10.402099609375, 11.09228515625, 11.782470703125, 12.47265625, 13.162841796875, 13.85302734375, 14.543212890625, 15.2333984375, 15.923583984375, 16.61376953125, 17.303955078125, 17.994140625, 18.684326171875, 19.37451171875, 20.064697265625, 20.7548828125, 21.445068359375, 22.13525390625, 22.825439453125, 23.515625]}, "gradients/decoder.bert.encoder.layer.6.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 6.0, 13.0, 4.0, 7.0, 13.0, 19.0, 15.0, 18.0, 25.0, 23.0, 25.0, 29.0, 37.0, 42.0, 36.0, 36.0, 35.0, 53.0, 44.0, 38.0, 37.0, 36.0, 40.0, 27.0, 31.0, 36.0, 38.0, 39.0, 25.0, 20.0, 26.0, 16.0, 17.0, 21.0, 14.0, 14.0, 10.0, 8.0, 3.0, 4.0, 6.0, 8.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.6953125, -7.4495849609375, -7.203857421875, -6.9581298828125, -6.71240234375, -6.4666748046875, -6.220947265625, -5.9752197265625, -5.7294921875, -5.4837646484375, -5.238037109375, -4.9923095703125, -4.74658203125, -4.5008544921875, -4.255126953125, -4.0093994140625, -3.763671875, -3.5179443359375, -3.272216796875, -3.0264892578125, -2.78076171875, -2.5350341796875, -2.289306640625, -2.0435791015625, -1.7978515625, -1.5521240234375, -1.306396484375, -1.0606689453125, -0.81494140625, -0.5692138671875, -0.323486328125, -0.0777587890625, 0.16796875, 0.4136962890625, 0.659423828125, 0.9051513671875, 1.15087890625, 1.3966064453125, 1.642333984375, 1.8880615234375, 2.1337890625, 2.3795166015625, 2.625244140625, 2.8709716796875, 3.11669921875, 3.3624267578125, 3.608154296875, 3.8538818359375, 4.099609375, 4.3453369140625, 4.591064453125, 4.8367919921875, 5.08251953125, 5.3282470703125, 5.573974609375, 5.8197021484375, 6.0654296875, 6.3111572265625, 6.556884765625, 6.8026123046875, 7.04833984375, 7.2940673828125, 7.539794921875, 7.7855224609375, 8.03125]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 8.0, 10.0, 15.0, 22.0, 23.0, 63.0, 74.0, 109.0, 156.0, 218.0, 349.0, 537.0, 817.0, 1272.0, 1946.0, 3092.0, 5046.0, 8097.0, 13708.0, 24096.0, 43745.0, 84309.0, 172522.0, 372771.0, 821839.0, 1243017.0, 736677.0, 331985.0, 154697.0, 76242.0, 40362.0, 22616.0, 12940.0, 7781.0, 4844.0, 2927.0, 1906.0, 1231.0, 762.0, 527.0, 327.0, 215.0, 125.0, 87.0, 58.0, 45.0, 24.0, 15.0, 7.0, 8.0, 4.0, 7.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.65625, -19.9990234375, -19.341796875, -18.6845703125, -18.02734375, -17.3701171875, -16.712890625, -16.0556640625, -15.3984375, -14.7412109375, -14.083984375, -13.4267578125, -12.76953125, -12.1123046875, -11.455078125, -10.7978515625, -10.140625, -9.4833984375, -8.826171875, -8.1689453125, -7.51171875, -6.8544921875, -6.197265625, -5.5400390625, -4.8828125, -4.2255859375, -3.568359375, -2.9111328125, -2.25390625, -1.5966796875, -0.939453125, -0.2822265625, 0.375, 1.0322265625, 1.689453125, 2.3466796875, 3.00390625, 3.6611328125, 4.318359375, 4.9755859375, 5.6328125, 6.2900390625, 6.947265625, 7.6044921875, 8.26171875, 8.9189453125, 9.576171875, 10.2333984375, 10.890625, 11.5478515625, 12.205078125, 12.8623046875, 13.51953125, 14.1767578125, 14.833984375, 15.4912109375, 16.1484375, 16.8056640625, 17.462890625, 18.1201171875, 18.77734375, 19.4345703125, 20.091796875, 20.7490234375, 21.40625]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 7.0, 6.0, 3.0, 11.0, 15.0, 25.0, 37.0, 46.0, 53.0, 67.0, 103.0, 126.0, 159.0, 196.0, 247.0, 321.0, 337.0, 385.0, 347.0, 337.0, 257.0, 222.0, 151.0, 149.0, 100.0, 83.0, 62.0, 47.0, 43.0, 37.0, 23.0, 8.0, 13.0, 13.0, 5.0, 9.0, 6.0, 6.0, 6.0, 1.0, 4.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.203125, -5.0020751953125, -4.801025390625, -4.5999755859375, -4.39892578125, -4.1978759765625, -3.996826171875, -3.7957763671875, -3.5947265625, -3.3936767578125, -3.192626953125, -2.9915771484375, -2.79052734375, -2.5894775390625, -2.388427734375, -2.1873779296875, -1.986328125, -1.7852783203125, -1.584228515625, -1.3831787109375, -1.18212890625, -0.9810791015625, -0.780029296875, -0.5789794921875, -0.3779296875, -0.1768798828125, 0.024169921875, 0.2252197265625, 0.42626953125, 0.6273193359375, 0.828369140625, 1.0294189453125, 1.23046875, 1.4315185546875, 1.632568359375, 1.8336181640625, 2.03466796875, 2.2357177734375, 2.436767578125, 2.6378173828125, 2.8388671875, 3.0399169921875, 3.240966796875, 3.4420166015625, 3.64306640625, 3.8441162109375, 4.045166015625, 4.2462158203125, 4.447265625, 4.6483154296875, 4.849365234375, 5.0504150390625, 5.25146484375, 5.4525146484375, 5.653564453125, 5.8546142578125, 6.0556640625, 6.2567138671875, 6.457763671875, 6.6588134765625, 6.85986328125, 7.0609130859375, 7.261962890625, 7.4630126953125, 7.6640625]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 5.0, 5.0, 5.0, 5.0, 13.0, 11.0, 14.0, 28.0, 36.0, 40.0, 52.0, 79.0, 95.0, 96.0, 81.0, 93.0, 74.0, 67.0, 43.0, 43.0, 28.0, 22.0, 11.0, 16.0, 9.0, 9.0, 2.0, 3.0, 5.0, 4.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-28.252614974975586, -27.404245376586914, -26.555875778198242, -25.707504272460938, -24.859134674072266, -24.010765075683594, -23.162395477294922, -22.31402587890625, -21.465654373168945, -20.617284774780273, -19.7689151763916, -18.920543670654297, -18.072174072265625, -17.223804473876953, -16.37543487548828, -15.527064323425293, -14.678694725036621, -13.83032512664795, -12.981954574584961, -12.133584976196289, -11.2852144241333, -10.436844825744629, -9.58847427368164, -8.740104675292969, -7.891734600067139, -7.043364524841309, -6.1949944496154785, -5.346624374389648, -4.498254776000977, -3.6498847007751465, -2.8015146255493164, -1.9531445503234863, -1.1047744750976562, -0.25640445947647095, 0.5919655561447144, 1.4403355121612549, 2.288705587387085, 3.137075424194336, 3.985445499420166, 4.833815574645996, 5.682185649871826, 6.530555725097656, 7.378925800323486, 8.227295875549316, 9.075665473937988, 9.924036026000977, 10.772405624389648, 11.62077522277832, 12.469145774841309, 13.31751537322998, 14.165885925292969, 15.01425552368164, 15.862626075744629, 16.710994720458984, 17.55936622619629, 18.40773582458496, 19.256105422973633, 20.104475021362305, 20.952844619750977, 21.80121612548828, 22.649585723876953, 23.497955322265625, 24.346324920654297, 25.19469451904297, 26.043066024780273]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 5.0, 5.0, 9.0, 7.0, 5.0, 11.0, 10.0, 9.0, 20.0, 23.0, 13.0, 21.0, 21.0, 23.0, 38.0, 18.0, 39.0, 28.0, 33.0, 40.0, 46.0, 36.0, 25.0, 33.0, 35.0, 38.0, 36.0, 43.0, 25.0, 34.0, 30.0, 23.0, 23.0, 29.0, 25.0, 31.0, 14.0, 25.0, 12.0, 15.0, 5.0, 15.0, 8.0, 6.0, 5.0, 2.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-8.791970252990723, -8.51536750793457, -8.238763809204102, -7.962160587310791, -7.6855573654174805, -7.408954620361328, -7.132351398468018, -6.855748176574707, -6.5791449546813965, -6.302541732788086, -6.025938510894775, -5.749335289001465, -5.4727325439453125, -5.196128845214844, -4.919526100158691, -4.642922878265381, -4.36631965637207, -4.08971643447876, -3.813113212585449, -3.5365102291107178, -3.2599070072174072, -2.9833037853240967, -2.7067008018493652, -2.4300975799560547, -2.153494358062744, -1.8768911361694336, -1.6002880334854126, -1.3236849308013916, -1.047081708908081, -0.7704784870147705, -0.4938753843307495, -0.21727228164672852, 0.059329986572265625, 0.3359331488609314, 0.6125363111495972, 0.8891394734382629, 1.1657426357269287, 1.4423458576202393, 1.7189489603042603, 1.9955520629882812, 2.272155284881592, 2.5487585067749023, 2.825361728668213, 3.1019647121429443, 3.378567934036255, 3.6551711559295654, 3.931774139404297, 4.208377361297607, 4.484980583190918, 4.7615838050842285, 5.038187026977539, 5.31479024887085, 5.59139347076416, 5.8679962158203125, 6.144599437713623, 6.421202659606934, 6.697805881500244, 6.974409103393555, 7.251012325286865, 7.527615547180176, 7.804218292236328, 8.080821990966797, 8.35742473602295, 8.634027481079102, 8.91063117980957]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 8.0, 12.0, 13.0, 32.0, 44.0, 63.0, 83.0, 117.0, 238.0, 375.0, 668.0, 1017.0, 1761.0, 3090.0, 5106.0, 8611.0, 14774.0, 24693.0, 41915.0, 68403.0, 106949.0, 153944.0, 179201.0, 155385.0, 108779.0, 69215.0, 42275.0, 25237.0, 14744.0, 8855.0, 5311.0, 3102.0, 1787.0, 1074.0, 631.0, 445.0, 222.0, 130.0, 84.0, 57.0, 33.0, 28.0, 16.0, 9.0, 15.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.98046875, -6.75897216796875, -6.5374755859375, -6.31597900390625, -6.094482421875, -5.87298583984375, -5.6514892578125, -5.42999267578125, -5.20849609375, -4.98699951171875, -4.7655029296875, -4.54400634765625, -4.322509765625, -4.10101318359375, -3.8795166015625, -3.65802001953125, -3.4365234375, -3.21502685546875, -2.9935302734375, -2.77203369140625, -2.550537109375, -2.32904052734375, -2.1075439453125, -1.88604736328125, -1.66455078125, -1.44305419921875, -1.2215576171875, -1.00006103515625, -0.778564453125, -0.55706787109375, -0.3355712890625, -0.11407470703125, 0.107421875, 0.32891845703125, 0.5504150390625, 0.77191162109375, 0.993408203125, 1.21490478515625, 1.4364013671875, 1.65789794921875, 1.87939453125, 2.10089111328125, 2.3223876953125, 2.54388427734375, 2.765380859375, 2.98687744140625, 3.2083740234375, 3.42987060546875, 3.6513671875, 3.87286376953125, 4.0943603515625, 4.31585693359375, 4.537353515625, 4.75885009765625, 4.9803466796875, 5.20184326171875, 5.42333984375, 5.64483642578125, 5.8663330078125, 6.08782958984375, 6.309326171875, 6.53082275390625, 6.7523193359375, 6.97381591796875, 7.1953125]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 6.0, 6.0, 15.0, 16.0, 8.0, 12.0, 20.0, 24.0, 23.0, 20.0, 23.0, 38.0, 44.0, 38.0, 39.0, 34.0, 39.0, 39.0, 45.0, 50.0, 45.0, 47.0, 35.0, 34.0, 33.0, 33.0, 40.0, 28.0, 21.0, 21.0, 21.0, 22.0, 16.0, 16.0, 12.0, 10.0, 12.0, 3.0, 5.0, 2.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.6796875, -11.3138427734375, -10.947998046875, -10.5821533203125, -10.21630859375, -9.8504638671875, -9.484619140625, -9.1187744140625, -8.7529296875, -8.3870849609375, -8.021240234375, -7.6553955078125, -7.28955078125, -6.9237060546875, -6.557861328125, -6.1920166015625, -5.826171875, -5.4603271484375, -5.094482421875, -4.7286376953125, -4.36279296875, -3.9969482421875, -3.631103515625, -3.2652587890625, -2.8994140625, -2.5335693359375, -2.167724609375, -1.8018798828125, -1.43603515625, -1.0701904296875, -0.704345703125, -0.3385009765625, 0.02734375, 0.3931884765625, 0.759033203125, 1.1248779296875, 1.49072265625, 1.8565673828125, 2.222412109375, 2.5882568359375, 2.9541015625, 3.3199462890625, 3.685791015625, 4.0516357421875, 4.41748046875, 4.7833251953125, 5.149169921875, 5.5150146484375, 5.880859375, 6.2467041015625, 6.612548828125, 6.9783935546875, 7.34423828125, 7.7100830078125, 8.075927734375, 8.4417724609375, 8.8076171875, 9.1734619140625, 9.539306640625, 9.9051513671875, 10.27099609375, 10.6368408203125, 11.002685546875, 11.3685302734375, 11.734375]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 6.0, 8.0, 17.0, 15.0, 29.0, 26.0, 45.0, 61.0, 115.0, 154.0, 200.0, 301.0, 446.0, 665.0, 993.0, 1484.0, 2397.0, 3864.0, 6316.0, 10354.0, 17940.0, 31295.0, 57085.0, 103949.0, 178029.0, 229826.0, 172972.0, 100428.0, 55448.0, 30256.0, 17329.0, 9937.0, 6095.0, 3660.0, 2371.0, 1445.0, 937.0, 648.0, 455.0, 277.0, 217.0, 138.0, 102.0, 74.0, 51.0, 42.0, 14.0, 16.0, 10.0, 6.0, 8.0, 2.0, 3.0, 2.0, 0.0, 1.0], "bins": [-9.8828125, -9.5875244140625, -9.292236328125, -8.9969482421875, -8.70166015625, -8.4063720703125, -8.111083984375, -7.8157958984375, -7.5205078125, -7.2252197265625, -6.929931640625, -6.6346435546875, -6.33935546875, -6.0440673828125, -5.748779296875, -5.4534912109375, -5.158203125, -4.8629150390625, -4.567626953125, -4.2723388671875, -3.97705078125, -3.6817626953125, -3.386474609375, -3.0911865234375, -2.7958984375, -2.5006103515625, -2.205322265625, -1.9100341796875, -1.61474609375, -1.3194580078125, -1.024169921875, -0.7288818359375, -0.43359375, -0.1383056640625, 0.156982421875, 0.4522705078125, 0.74755859375, 1.0428466796875, 1.338134765625, 1.6334228515625, 1.9287109375, 2.2239990234375, 2.519287109375, 2.8145751953125, 3.10986328125, 3.4051513671875, 3.700439453125, 3.9957275390625, 4.291015625, 4.5863037109375, 4.881591796875, 5.1768798828125, 5.47216796875, 5.7674560546875, 6.062744140625, 6.3580322265625, 6.6533203125, 6.9486083984375, 7.243896484375, 7.5391845703125, 7.83447265625, 8.1297607421875, 8.425048828125, 8.7203369140625, 9.015625]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 4.0, 3.0, 2.0, 3.0, 1.0, 8.0, 6.0, 6.0, 11.0, 12.0, 16.0, 10.0, 9.0, 23.0, 19.0, 36.0, 31.0, 27.0, 35.0, 44.0, 40.0, 36.0, 39.0, 38.0, 35.0, 47.0, 39.0, 37.0, 37.0, 29.0, 32.0, 44.0, 27.0, 28.0, 34.0, 29.0, 22.0, 13.0, 14.0, 15.0, 16.0, 5.0, 10.0, 6.0, 6.0, 7.0, 5.0, 4.0, 4.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.921875, -5.7191162109375, -5.516357421875, -5.3135986328125, -5.11083984375, -4.9080810546875, -4.705322265625, -4.5025634765625, -4.2998046875, -4.0970458984375, -3.894287109375, -3.6915283203125, -3.48876953125, -3.2860107421875, -3.083251953125, -2.8804931640625, -2.677734375, -2.4749755859375, -2.272216796875, -2.0694580078125, -1.86669921875, -1.6639404296875, -1.461181640625, -1.2584228515625, -1.0556640625, -0.8529052734375, -0.650146484375, -0.4473876953125, -0.24462890625, -0.0418701171875, 0.160888671875, 0.3636474609375, 0.56640625, 0.7691650390625, 0.971923828125, 1.1746826171875, 1.37744140625, 1.5802001953125, 1.782958984375, 1.9857177734375, 2.1884765625, 2.3912353515625, 2.593994140625, 2.7967529296875, 2.99951171875, 3.2022705078125, 3.405029296875, 3.6077880859375, 3.810546875, 4.0133056640625, 4.216064453125, 4.4188232421875, 4.62158203125, 4.8243408203125, 5.027099609375, 5.2298583984375, 5.4326171875, 5.6353759765625, 5.838134765625, 6.0408935546875, 6.24365234375, 6.4464111328125, 6.649169921875, 6.8519287109375, 7.0546875]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 5.0, 0.0, 3.0, 6.0, 2.0, 5.0, 4.0, 6.0, 3.0, 27.0, 28.0, 37.0, 62.0, 59.0, 89.0, 169.0, 266.0, 405.0, 662.0, 1122.0, 2003.0, 3427.0, 6216.0, 11959.0, 23636.0, 49967.0, 107142.0, 223667.0, 292169.0, 171176.0, 78856.0, 36782.0, 17859.0, 8974.0, 4806.0, 2733.0, 1644.0, 947.0, 599.0, 382.0, 220.0, 136.0, 89.0, 72.0, 48.0, 26.0, 22.0, 13.0, 11.0, 13.0, 6.0, 3.0, 5.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-4.30078125, -4.16339111328125, -4.0260009765625, -3.88861083984375, -3.751220703125, -3.61383056640625, -3.4764404296875, -3.33905029296875, -3.20166015625, -3.06427001953125, -2.9268798828125, -2.78948974609375, -2.652099609375, -2.51470947265625, -2.3773193359375, -2.23992919921875, -2.1025390625, -1.96514892578125, -1.8277587890625, -1.69036865234375, -1.552978515625, -1.41558837890625, -1.2781982421875, -1.14080810546875, -1.00341796875, -0.86602783203125, -0.7286376953125, -0.59124755859375, -0.453857421875, -0.31646728515625, -0.1790771484375, -0.04168701171875, 0.095703125, 0.23309326171875, 0.3704833984375, 0.50787353515625, 0.645263671875, 0.78265380859375, 0.9200439453125, 1.05743408203125, 1.19482421875, 1.33221435546875, 1.4696044921875, 1.60699462890625, 1.744384765625, 1.88177490234375, 2.0191650390625, 2.15655517578125, 2.2939453125, 2.43133544921875, 2.5687255859375, 2.70611572265625, 2.843505859375, 2.98089599609375, 3.1182861328125, 3.25567626953125, 3.39306640625, 3.53045654296875, 3.6678466796875, 3.80523681640625, 3.942626953125, 4.08001708984375, 4.2174072265625, 4.35479736328125, 4.4921875]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 3.0, 7.0, 4.0, 9.0, 10.0, 13.0, 21.0, 21.0, 31.0, 48.0, 45.0, 58.0, 68.0, 86.0, 80.0, 93.0, 74.0, 68.0, 54.0, 50.0, 39.0, 39.0, 23.0, 10.0, 17.0, 6.0, 7.0, 6.0, 4.0, 3.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002608299255371094, -0.00025025755167007446, -0.00023968517780303955, -0.00022911280393600464, -0.00021854043006896973, -0.00020796805620193481, -0.0001973956823348999, -0.000186823308467865, -0.00017625093460083008, -0.00016567856073379517, -0.00015510618686676025, -0.00014453381299972534, -0.00013396143913269043, -0.00012338906526565552, -0.0001128166913986206, -0.0001022443175315857, -9.167194366455078e-05, -8.109956979751587e-05, -7.052719593048096e-05, -5.9954822063446045e-05, -4.938244819641113e-05, -3.881007432937622e-05, -2.823770046234131e-05, -1.7665326595306396e-05, -7.092952728271484e-06, 3.4794211387634277e-06, 1.405179500579834e-05, 2.4624168872833252e-05, 3.5196542739868164e-05, 4.5768916606903076e-05, 5.634129047393799e-05, 6.69136643409729e-05, 7.748603820800781e-05, 8.805841207504272e-05, 9.863078594207764e-05, 0.00010920315980911255, 0.00011977553367614746, 0.00013034790754318237, 0.00014092028141021729, 0.0001514926552772522, 0.0001620650291442871, 0.00017263740301132202, 0.00018320977687835693, 0.00019378215074539185, 0.00020435452461242676, 0.00021492689847946167, 0.00022549927234649658, 0.0002360716462135315, 0.0002466440200805664, 0.0002572163939476013, 0.00026778876781463623, 0.00027836114168167114, 0.00028893351554870605, 0.00029950588941574097, 0.0003100782632827759, 0.0003206506371498108, 0.0003312230110168457, 0.0003417953848838806, 0.00035236775875091553, 0.00036294013261795044, 0.00037351250648498535, 0.00038408488035202026, 0.0003946572542190552, 0.0004052296280860901, 0.000415802001953125]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 3.0, 6.0, 3.0, 3.0, 11.0, 9.0, 9.0, 19.0, 34.0, 45.0, 67.0, 93.0, 150.0, 218.0, 296.0, 469.0, 738.0, 1142.0, 1804.0, 2941.0, 4760.0, 7826.0, 13271.0, 23021.0, 39977.0, 68289.0, 111571.0, 162614.0, 187564.0, 157966.0, 106632.0, 64817.0, 38351.0, 21838.0, 12479.0, 7270.0, 4467.0, 2783.0, 1786.0, 1122.0, 695.0, 496.0, 296.0, 200.0, 144.0, 83.0, 60.0, 46.0, 29.0, 13.0, 14.0, 13.0, 6.0, 4.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-3.373046875, -3.26910400390625, -3.1651611328125, -3.06121826171875, -2.957275390625, -2.85333251953125, -2.7493896484375, -2.64544677734375, -2.54150390625, -2.43756103515625, -2.3336181640625, -2.22967529296875, -2.125732421875, -2.02178955078125, -1.9178466796875, -1.81390380859375, -1.7099609375, -1.60601806640625, -1.5020751953125, -1.39813232421875, -1.294189453125, -1.19024658203125, -1.0863037109375, -0.98236083984375, -0.87841796875, -0.77447509765625, -0.6705322265625, -0.56658935546875, -0.462646484375, -0.35870361328125, -0.2547607421875, -0.15081787109375, -0.046875, 0.05706787109375, 0.1610107421875, 0.26495361328125, 0.368896484375, 0.47283935546875, 0.5767822265625, 0.68072509765625, 0.78466796875, 0.88861083984375, 0.9925537109375, 1.09649658203125, 1.200439453125, 1.30438232421875, 1.4083251953125, 1.51226806640625, 1.6162109375, 1.72015380859375, 1.8240966796875, 1.92803955078125, 2.031982421875, 2.13592529296875, 2.2398681640625, 2.34381103515625, 2.44775390625, 2.55169677734375, 2.6556396484375, 2.75958251953125, 2.863525390625, 2.96746826171875, 3.0714111328125, 3.17535400390625, 3.279296875]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 4.0, 4.0, 2.0, 2.0, 3.0, 4.0, 3.0, 5.0, 6.0, 9.0, 10.0, 13.0, 21.0, 22.0, 29.0, 22.0, 38.0, 40.0, 34.0, 53.0, 61.0, 45.0, 38.0, 54.0, 54.0, 49.0, 43.0, 33.0, 43.0, 37.0, 43.0, 28.0, 34.0, 25.0, 18.0, 22.0, 13.0, 10.0, 6.0, 7.0, 9.0, 6.0, 4.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0126953125, -0.985137939453125, -0.95758056640625, -0.930023193359375, -0.9024658203125, -0.874908447265625, -0.84735107421875, -0.819793701171875, -0.792236328125, -0.764678955078125, -0.73712158203125, -0.709564208984375, -0.6820068359375, -0.654449462890625, -0.62689208984375, -0.599334716796875, -0.57177734375, -0.544219970703125, -0.51666259765625, -0.489105224609375, -0.4615478515625, -0.433990478515625, -0.40643310546875, -0.378875732421875, -0.351318359375, -0.323760986328125, -0.29620361328125, -0.268646240234375, -0.2410888671875, -0.213531494140625, -0.18597412109375, -0.158416748046875, -0.130859375, -0.103302001953125, -0.07574462890625, -0.048187255859375, -0.0206298828125, 0.006927490234375, 0.03448486328125, 0.062042236328125, 0.089599609375, 0.117156982421875, 0.14471435546875, 0.172271728515625, 0.1998291015625, 0.227386474609375, 0.25494384765625, 0.282501220703125, 0.31005859375, 0.337615966796875, 0.36517333984375, 0.392730712890625, 0.4202880859375, 0.447845458984375, 0.47540283203125, 0.502960205078125, 0.530517578125, 0.558074951171875, 0.58563232421875, 0.613189697265625, 0.6407470703125, 0.668304443359375, 0.69586181640625, 0.723419189453125, 0.7509765625]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 7.0, 2.0, 5.0, 8.0, 7.0, 10.0, 15.0, 26.0, 25.0, 39.0, 47.0, 55.0, 92.0, 89.0, 85.0, 90.0, 85.0, 67.0, 59.0, 46.0, 27.0, 39.0, 18.0, 12.0, 12.0, 9.0, 7.0, 1.0, 3.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-26.385204315185547, -25.559053421020508, -24.73290252685547, -23.90675163269043, -23.08060073852539, -22.25444984436035, -21.428298950195312, -20.602148056030273, -19.775997161865234, -18.949846267700195, -18.123695373535156, -17.297544479370117, -16.471393585205078, -15.645242691040039, -14.819091796875, -13.992940902709961, -13.166790008544922, -12.340639114379883, -11.514488220214844, -10.688337326049805, -9.862186431884766, -9.036035537719727, -8.209884643554688, -7.383733749389648, -6.557582855224609, -5.73143196105957, -4.905281066894531, -4.079130172729492, -3.252979278564453, -2.426828384399414, -1.600677490234375, -0.7745265960693359, 0.051624298095703125, 0.8777751922607422, 1.7039260864257812, 2.5300769805908203, 3.3562278747558594, 4.182378768920898, 5.0085296630859375, 5.834680557250977, 6.660831451416016, 7.486982345581055, 8.313133239746094, 9.139284133911133, 9.965435028076172, 10.791585922241211, 11.61773681640625, 12.443887710571289, 13.270038604736328, 14.096189498901367, 14.922340393066406, 15.748491287231445, 16.574642181396484, 17.400793075561523, 18.226943969726562, 19.0530948638916, 19.87924575805664, 20.70539665222168, 21.53154754638672, 22.357698440551758, 23.183849334716797, 24.010000228881836, 24.836151123046875, 25.662302017211914, 26.488452911376953]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 4.0, 7.0, 8.0, 7.0, 3.0, 9.0, 14.0, 12.0, 16.0, 18.0, 18.0, 21.0, 22.0, 24.0, 30.0, 31.0, 34.0, 25.0, 31.0, 46.0, 42.0, 36.0, 26.0, 38.0, 35.0, 36.0, 45.0, 32.0, 27.0, 26.0, 39.0, 22.0, 27.0, 26.0, 28.0, 25.0, 28.0, 9.0, 20.0, 4.0, 15.0, 12.0, 7.0, 7.0, 4.0, 2.0, 1.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0], "bins": [-8.70146369934082, -8.426247596740723, -8.151031494140625, -7.8758158683776855, -7.600600242614746, -7.325384140014648, -7.050168037414551, -6.774951934814453, -6.499736309051514, -6.224520206451416, -5.949304580688477, -5.674088478088379, -5.398872375488281, -5.123656749725342, -4.848440647125244, -4.573225021362305, -4.298008918762207, -4.022792816162109, -3.74757719039917, -3.4723610877990723, -3.1971452236175537, -2.921929359436035, -2.6467132568359375, -2.371497392654419, -2.0962815284729004, -1.8210656642913818, -1.5458496809005737, -1.2706336975097656, -0.9954178333282471, -0.7202019691467285, -0.4449859857559204, -0.1697700023651123, 0.10544586181640625, 0.3806617856025696, 0.6558777093887329, 0.9310936331748962, 1.2063095569610596, 1.4815254211425781, 1.7567414045333862, 2.0319573879241943, 2.307173252105713, 2.5823891162872314, 2.85760498046875, 3.1328210830688477, 3.408036947250366, 3.6832528114318848, 3.9584689140319824, 4.233684539794922, 4.5089006423950195, 4.784116744995117, 5.059332370758057, 5.334548473358154, 5.609764099121094, 5.884980201721191, 6.160196304321289, 6.435412406921387, 6.710628032684326, 6.985844135284424, 7.261059761047363, 7.536275863647461, 7.811491966247559, 8.086708068847656, 8.361923217773438, 8.637139320373535, 8.912355422973633]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 7.0, 9.0, 16.0, 18.0, 29.0, 36.0, 51.0, 88.0, 135.0, 167.0, 253.0, 354.0, 560.0, 862.0, 1266.0, 2102.0, 3155.0, 5121.0, 8057.0, 13579.0, 22610.0, 37230.0, 59979.0, 92642.0, 132912.0, 161046.0, 157300.0, 124376.0, 84649.0, 54029.0, 33386.0, 19985.0, 12263.0, 7556.0, 4495.0, 2895.0, 1808.0, 1164.0, 782.0, 494.0, 303.0, 243.0, 197.0, 116.0, 63.0, 47.0, 29.0, 26.0, 24.0, 14.0, 14.0, 10.0, 5.0, 4.0, 0.0, 1.0, 2.0, 1.0], "bins": [-16.03125, -15.528564453125, -15.02587890625, -14.523193359375, -14.0205078125, -13.517822265625, -13.01513671875, -12.512451171875, -12.009765625, -11.507080078125, -11.00439453125, -10.501708984375, -9.9990234375, -9.496337890625, -8.99365234375, -8.490966796875, -7.98828125, -7.485595703125, -6.98291015625, -6.480224609375, -5.9775390625, -5.474853515625, -4.97216796875, -4.469482421875, -3.966796875, -3.464111328125, -2.96142578125, -2.458740234375, -1.9560546875, -1.453369140625, -0.95068359375, -0.447998046875, 0.0546875, 0.557373046875, 1.06005859375, 1.562744140625, 2.0654296875, 2.568115234375, 3.07080078125, 3.573486328125, 4.076171875, 4.578857421875, 5.08154296875, 5.584228515625, 6.0869140625, 6.589599609375, 7.09228515625, 7.594970703125, 8.09765625, 8.600341796875, 9.10302734375, 9.605712890625, 10.1083984375, 10.611083984375, 11.11376953125, 11.616455078125, 12.119140625, 12.621826171875, 13.12451171875, 13.627197265625, 14.1298828125, 14.632568359375, 15.13525390625, 15.637939453125, 16.140625]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 9.0, 2.0, 3.0, 7.0, 7.0, 8.0, 15.0, 14.0, 26.0, 40.0, 21.0, 23.0, 22.0, 43.0, 39.0, 46.0, 44.0, 35.0, 41.0, 40.0, 45.0, 33.0, 49.0, 39.0, 34.0, 36.0, 44.0, 31.0, 20.0, 27.0, 33.0, 19.0, 23.0, 17.0, 21.0, 5.0, 11.0, 7.0, 6.0, 6.0, 7.0, 5.0, 1.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.25, -10.8936767578125, -10.537353515625, -10.1810302734375, -9.82470703125, -9.4683837890625, -9.112060546875, -8.7557373046875, -8.3994140625, -8.0430908203125, -7.686767578125, -7.3304443359375, -6.97412109375, -6.6177978515625, -6.261474609375, -5.9051513671875, -5.548828125, -5.1925048828125, -4.836181640625, -4.4798583984375, -4.12353515625, -3.7672119140625, -3.410888671875, -3.0545654296875, -2.6982421875, -2.3419189453125, -1.985595703125, -1.6292724609375, -1.27294921875, -0.9166259765625, -0.560302734375, -0.2039794921875, 0.15234375, 0.5086669921875, 0.864990234375, 1.2213134765625, 1.57763671875, 1.9339599609375, 2.290283203125, 2.6466064453125, 3.0029296875, 3.3592529296875, 3.715576171875, 4.0718994140625, 4.42822265625, 4.7845458984375, 5.140869140625, 5.4971923828125, 5.853515625, 6.2098388671875, 6.566162109375, 6.9224853515625, 7.27880859375, 7.6351318359375, 7.991455078125, 8.3477783203125, 8.7041015625, 9.0604248046875, 9.416748046875, 9.7730712890625, 10.12939453125, 10.4857177734375, 10.842041015625, 11.1983642578125, 11.5546875]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 4.0, 6.0, 9.0, 19.0, 19.0, 43.0, 65.0, 91.0, 162.0, 258.0, 376.0, 590.0, 950.0, 1481.0, 2292.0, 3628.0, 5818.0, 9440.0, 15508.0, 24817.0, 39823.0, 62589.0, 93942.0, 129140.0, 153775.0, 148700.0, 120342.0, 84889.0, 56430.0, 35428.0, 22085.0, 13467.0, 8423.0, 5079.0, 3224.0, 2068.0, 1243.0, 843.0, 536.0, 346.0, 217.0, 156.0, 86.0, 61.0, 40.0, 24.0, 14.0, 10.0, 5.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.6640625, -13.1907958984375, -12.717529296875, -12.2442626953125, -11.77099609375, -11.2977294921875, -10.824462890625, -10.3511962890625, -9.8779296875, -9.4046630859375, -8.931396484375, -8.4581298828125, -7.98486328125, -7.5115966796875, -7.038330078125, -6.5650634765625, -6.091796875, -5.6185302734375, -5.145263671875, -4.6719970703125, -4.19873046875, -3.7254638671875, -3.252197265625, -2.7789306640625, -2.3056640625, -1.8323974609375, -1.359130859375, -0.8858642578125, -0.41259765625, 0.0606689453125, 0.533935546875, 1.0072021484375, 1.48046875, 1.9537353515625, 2.427001953125, 2.9002685546875, 3.37353515625, 3.8468017578125, 4.320068359375, 4.7933349609375, 5.2666015625, 5.7398681640625, 6.213134765625, 6.6864013671875, 7.15966796875, 7.6329345703125, 8.106201171875, 8.5794677734375, 9.052734375, 9.5260009765625, 9.999267578125, 10.4725341796875, 10.94580078125, 11.4190673828125, 11.892333984375, 12.3656005859375, 12.8388671875, 13.3121337890625, 13.785400390625, 14.2586669921875, 14.73193359375, 15.2052001953125, 15.678466796875, 16.1517333984375, 16.625]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 4.0, 5.0, 7.0, 5.0, 13.0, 14.0, 11.0, 14.0, 15.0, 21.0, 24.0, 31.0, 26.0, 35.0, 29.0, 37.0, 43.0, 39.0, 49.0, 39.0, 52.0, 37.0, 37.0, 34.0, 53.0, 44.0, 44.0, 29.0, 37.0, 26.0, 18.0, 25.0, 11.0, 19.0, 11.0, 15.0, 7.0, 5.0, 8.0, 4.0, 9.0, 3.0, 7.0, 0.0, 1.0, 4.0, 0.0, 1.0, 5.0, 0.0, 1.0, 2.0], "bins": [-7.00390625, -6.78948974609375, -6.5750732421875, -6.36065673828125, -6.146240234375, -5.93182373046875, -5.7174072265625, -5.50299072265625, -5.28857421875, -5.07415771484375, -4.8597412109375, -4.64532470703125, -4.430908203125, -4.21649169921875, -4.0020751953125, -3.78765869140625, -3.5732421875, -3.35882568359375, -3.1444091796875, -2.92999267578125, -2.715576171875, -2.50115966796875, -2.2867431640625, -2.07232666015625, -1.85791015625, -1.64349365234375, -1.4290771484375, -1.21466064453125, -1.000244140625, -0.78582763671875, -0.5714111328125, -0.35699462890625, -0.142578125, 0.07183837890625, 0.2862548828125, 0.50067138671875, 0.715087890625, 0.92950439453125, 1.1439208984375, 1.35833740234375, 1.57275390625, 1.78717041015625, 2.0015869140625, 2.21600341796875, 2.430419921875, 2.64483642578125, 2.8592529296875, 3.07366943359375, 3.2880859375, 3.50250244140625, 3.7169189453125, 3.93133544921875, 4.145751953125, 4.36016845703125, 4.5745849609375, 4.78900146484375, 5.00341796875, 5.21783447265625, 5.4322509765625, 5.64666748046875, 5.861083984375, 6.07550048828125, 6.2899169921875, 6.50433349609375, 6.71875]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 2.0, 3.0, 8.0, 7.0, 12.0, 17.0, 24.0, 31.0, 34.0, 56.0, 74.0, 92.0, 132.0, 199.0, 287.0, 382.0, 618.0, 876.0, 1355.0, 2068.0, 3110.0, 5130.0, 8509.0, 15021.0, 28799.0, 58497.0, 124026.0, 234504.0, 260313.0, 152877.0, 72181.0, 35021.0, 17925.0, 10075.0, 5653.0, 3709.0, 2291.0, 1507.0, 945.0, 657.0, 486.0, 282.0, 219.0, 152.0, 122.0, 62.0, 65.0, 38.0, 28.0, 23.0, 20.0, 13.0, 11.0, 5.0, 2.0, 6.0, 2.0, 3.0, 1.0, 1.0, 2.0], "bins": [-9.78125, -9.4671630859375, -9.153076171875, -8.8389892578125, -8.52490234375, -8.2108154296875, -7.896728515625, -7.5826416015625, -7.2685546875, -6.9544677734375, -6.640380859375, -6.3262939453125, -6.01220703125, -5.6981201171875, -5.384033203125, -5.0699462890625, -4.755859375, -4.4417724609375, -4.127685546875, -3.8135986328125, -3.49951171875, -3.1854248046875, -2.871337890625, -2.5572509765625, -2.2431640625, -1.9290771484375, -1.614990234375, -1.3009033203125, -0.98681640625, -0.6727294921875, -0.358642578125, -0.0445556640625, 0.26953125, 0.5836181640625, 0.897705078125, 1.2117919921875, 1.52587890625, 1.8399658203125, 2.154052734375, 2.4681396484375, 2.7822265625, 3.0963134765625, 3.410400390625, 3.7244873046875, 4.03857421875, 4.3526611328125, 4.666748046875, 4.9808349609375, 5.294921875, 5.6090087890625, 5.923095703125, 6.2371826171875, 6.55126953125, 6.8653564453125, 7.179443359375, 7.4935302734375, 7.8076171875, 8.1217041015625, 8.435791015625, 8.7498779296875, 9.06396484375, 9.3780517578125, 9.692138671875, 10.0062255859375, 10.3203125]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0, 4.0, 7.0, 5.0, 3.0, 11.0, 12.0, 18.0, 19.0, 31.0, 31.0, 36.0, 53.0, 62.0, 106.0, 88.0, 101.0, 86.0, 61.0, 63.0, 35.0, 42.0, 22.0, 18.0, 16.0, 7.0, 16.0, 16.0, 4.0, 6.0, 3.0, 6.0, 2.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.001407623291015625, -0.001367717981338501, -0.001327812671661377, -0.001287907361984253, -0.001248002052307129, -0.0012080967426300049, -0.0011681914329528809, -0.0011282861232757568, -0.0010883808135986328, -0.0010484755039215088, -0.0010085701942443848, -0.0009686648845672607, -0.0009287595748901367, -0.0008888542652130127, -0.0008489489555358887, -0.0008090436458587646, -0.0007691383361816406, -0.0007292330265045166, -0.0006893277168273926, -0.0006494224071502686, -0.0006095170974731445, -0.0005696117877960205, -0.0005297064781188965, -0.0004898011684417725, -0.00044989585876464844, -0.0004099905490875244, -0.0003700852394104004, -0.00033017992973327637, -0.00029027462005615234, -0.0002503693103790283, -0.0002104640007019043, -0.00017055869102478027, -0.00013065338134765625, -9.074807167053223e-05, -5.08427619934082e-05, -1.093745231628418e-05, 2.8967857360839844e-05, 6.887316703796387e-05, 0.00010877847671508789, 0.00014868378639221191, 0.00018858909606933594, 0.00022849440574645996, 0.000268399715423584, 0.000308305025100708, 0.00034821033477783203, 0.00038811564445495605, 0.0004280209541320801, 0.0004679262638092041, 0.0005078315734863281, 0.0005477368831634521, 0.0005876421928405762, 0.0006275475025177002, 0.0006674528121948242, 0.0007073581218719482, 0.0007472634315490723, 0.0007871687412261963, 0.0008270740509033203, 0.0008669793605804443, 0.0009068846702575684, 0.0009467899799346924, 0.0009866952896118164, 0.0010266005992889404, 0.0010665059089660645, 0.0011064112186431885, 0.0011463165283203125]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.weight": {"_type": "histogram", "values": [7.0, 3.0, 4.0, 6.0, 13.0, 16.0, 17.0, 26.0, 32.0, 65.0, 63.0, 106.0, 133.0, 169.0, 236.0, 285.0, 400.0, 537.0, 762.0, 1105.0, 1519.0, 2216.0, 3246.0, 5296.0, 8239.0, 13630.0, 23263.0, 41848.0, 77628.0, 142420.0, 217717.0, 209067.0, 132262.0, 71007.0, 38428.0, 21280.0, 12490.0, 7674.0, 4861.0, 3190.0, 2161.0, 1425.0, 1000.0, 725.0, 556.0, 389.0, 261.0, 187.0, 147.0, 117.0, 87.0, 55.0, 63.0, 39.0, 29.0, 27.0, 14.0, 13.0, 4.0, 1.0, 6.0, 2.0, 1.0, 1.0], "bins": [-7.7734375, -7.5220947265625, -7.270751953125, -7.0194091796875, -6.76806640625, -6.5167236328125, -6.265380859375, -6.0140380859375, -5.7626953125, -5.5113525390625, -5.260009765625, -5.0086669921875, -4.75732421875, -4.5059814453125, -4.254638671875, -4.0032958984375, -3.751953125, -3.5006103515625, -3.249267578125, -2.9979248046875, -2.74658203125, -2.4952392578125, -2.243896484375, -1.9925537109375, -1.7412109375, -1.4898681640625, -1.238525390625, -0.9871826171875, -0.73583984375, -0.4844970703125, -0.233154296875, 0.0181884765625, 0.26953125, 0.5208740234375, 0.772216796875, 1.0235595703125, 1.27490234375, 1.5262451171875, 1.777587890625, 2.0289306640625, 2.2802734375, 2.5316162109375, 2.782958984375, 3.0343017578125, 3.28564453125, 3.5369873046875, 3.788330078125, 4.0396728515625, 4.291015625, 4.5423583984375, 4.793701171875, 5.0450439453125, 5.29638671875, 5.5477294921875, 5.799072265625, 6.0504150390625, 6.3017578125, 6.5531005859375, 6.804443359375, 7.0557861328125, 7.30712890625, 7.5584716796875, 7.809814453125, 8.0611572265625, 8.3125]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 4.0, 5.0, 2.0, 12.0, 14.0, 17.0, 16.0, 25.0, 29.0, 42.0, 42.0, 55.0, 60.0, 72.0, 78.0, 73.0, 74.0, 75.0, 64.0, 46.0, 40.0, 25.0, 22.0, 19.0, 24.0, 7.0, 13.0, 9.0, 8.0, 4.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.91015625, -2.823394775390625, -2.73663330078125, -2.649871826171875, -2.5631103515625, -2.476348876953125, -2.38958740234375, -2.302825927734375, -2.216064453125, -2.129302978515625, -2.04254150390625, -1.955780029296875, -1.8690185546875, -1.782257080078125, -1.69549560546875, -1.608734130859375, -1.52197265625, -1.435211181640625, -1.34844970703125, -1.261688232421875, -1.1749267578125, -1.088165283203125, -1.00140380859375, -0.914642333984375, -0.827880859375, -0.741119384765625, -0.65435791015625, -0.567596435546875, -0.4808349609375, -0.394073486328125, -0.30731201171875, -0.220550537109375, -0.1337890625, -0.047027587890625, 0.03973388671875, 0.126495361328125, 0.2132568359375, 0.300018310546875, 0.38677978515625, 0.473541259765625, 0.560302734375, 0.647064208984375, 0.73382568359375, 0.820587158203125, 0.9073486328125, 0.994110107421875, 1.08087158203125, 1.167633056640625, 1.25439453125, 1.341156005859375, 1.42791748046875, 1.514678955078125, 1.6014404296875, 1.688201904296875, 1.77496337890625, 1.861724853515625, 1.948486328125, 2.035247802734375, 2.12200927734375, 2.208770751953125, 2.2955322265625, 2.382293701171875, 2.46905517578125, 2.555816650390625, 2.642578125]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 7.0, 2.0, 5.0, 8.0, 12.0, 18.0, 14.0, 23.0, 26.0, 42.0, 50.0, 57.0, 88.0, 71.0, 91.0, 87.0, 79.0, 62.0, 53.0, 50.0, 38.0, 24.0, 25.0, 14.0, 14.0, 9.0, 8.0, 7.0, 5.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.215232849121094, -21.419559478759766, -20.623886108398438, -19.82821273803711, -19.032541275024414, -18.236867904663086, -17.441194534301758, -16.64552116394043, -15.849847793579102, -15.054174423217773, -14.258502006530762, -13.462828636169434, -12.667155265808105, -11.871482849121094, -11.075809478759766, -10.280136108398438, -9.484463691711426, -8.688790321350098, -7.893117427825928, -7.097444534301758, -6.30177116394043, -5.50609827041626, -4.71042537689209, -3.9147520065307617, -3.119079113006592, -2.3234059810638428, -1.5277329683303833, -0.7320599555969238, 0.0636131763458252, 0.8592863082885742, 1.6549592018127441, 2.4506325721740723, 3.246305465698242, 4.041978359222412, 4.83765172958374, 5.63332462310791, 6.428997993469238, 7.224670886993408, 8.020343780517578, 8.816017150878906, 9.611690521240234, 10.407363891601562, 11.203036308288574, 11.998709678649902, 12.79438304901123, 13.590055465698242, 14.38572883605957, 15.181402206420898, 15.97707462310791, 16.772747039794922, 17.56842041015625, 18.364093780517578, 19.159767150878906, 19.955440521240234, 20.751113891601562, 21.54678726196289, 22.342458724975586, 23.138132095336914, 23.933805465698242, 24.729476928710938, 25.525150299072266, 26.320823669433594, 27.116497039794922, 27.91217041015625, 28.707843780517578]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 8.0, 8.0, 9.0, 12.0, 11.0, 11.0, 20.0, 16.0, 18.0, 17.0, 24.0, 37.0, 31.0, 31.0, 30.0, 35.0, 41.0, 46.0, 41.0, 27.0, 44.0, 35.0, 41.0, 30.0, 35.0, 51.0, 32.0, 35.0, 29.0, 28.0, 30.0, 28.0, 14.0, 23.0, 14.0, 12.0, 14.0, 4.0, 7.0, 5.0, 8.0, 3.0, 4.0, 0.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.837150573730469, -9.527704238891602, -9.218257904052734, -8.90881061553955, -8.599364280700684, -8.289917945861816, -7.980471611022949, -7.671024799346924, -7.361577987670898, -7.052131652832031, -6.742684841156006, -6.433238506317139, -6.123791694641113, -5.814345359802246, -5.504899024963379, -5.1954522132873535, -4.886005878448486, -4.576559543609619, -4.267112731933594, -3.9576663970947266, -3.648219585418701, -3.338773250579834, -3.0293266773223877, -2.7198801040649414, -2.410433530807495, -2.100986957550049, -1.7915403842926025, -1.4820939302444458, -1.1726473569869995, -0.8632007837295532, -0.5537543296813965, -0.2443077564239502, 0.0651388168334961, 0.37458536028862, 0.6840319037437439, 0.9934784173965454, 1.3029249906539917, 1.612371563911438, 1.9218180179595947, 2.231264591217041, 2.5407111644744873, 2.8501577377319336, 3.15960431098938, 3.469050884246826, 3.7784972190856934, 4.087944030761719, 4.397390365600586, 4.706836700439453, 5.0162835121154785, 5.325729846954346, 5.635176658630371, 5.944622993469238, 6.254069805145264, 6.563516139984131, 6.872962951660156, 7.182409286499023, 7.491855621337891, 7.801301956176758, 8.110748291015625, 8.420195579528809, 8.729641914367676, 9.039088249206543, 9.34853458404541, 9.657981872558594, 9.967428207397461]}, "gradients/decoder.bert.encoder.layer.5.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 5.0, 4.0, 6.0, 13.0, 15.0, 21.0, 28.0, 56.0, 55.0, 93.0, 137.0, 185.0, 274.0, 383.0, 599.0, 900.0, 1304.0, 2167.0, 3492.0, 5621.0, 10378.0, 19156.0, 38941.0, 87611.0, 217238.0, 607038.0, 1418050.0, 1100973.0, 401109.0, 150834.0, 63747.0, 29385.0, 14743.0, 7934.0, 4601.0, 2689.0, 1623.0, 982.0, 682.0, 404.0, 246.0, 162.0, 112.0, 85.0, 71.0, 45.0, 26.0, 30.0, 15.0, 9.0, 5.0, 3.0, 1.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-23.9375, -23.160400390625, -22.38330078125, -21.606201171875, -20.8291015625, -20.052001953125, -19.27490234375, -18.497802734375, -17.720703125, -16.943603515625, -16.16650390625, -15.389404296875, -14.6123046875, -13.835205078125, -13.05810546875, -12.281005859375, -11.50390625, -10.726806640625, -9.94970703125, -9.172607421875, -8.3955078125, -7.618408203125, -6.84130859375, -6.064208984375, -5.287109375, -4.510009765625, -3.73291015625, -2.955810546875, -2.1787109375, -1.401611328125, -0.62451171875, 0.152587890625, 0.9296875, 1.706787109375, 2.48388671875, 3.260986328125, 4.0380859375, 4.815185546875, 5.59228515625, 6.369384765625, 7.146484375, 7.923583984375, 8.70068359375, 9.477783203125, 10.2548828125, 11.031982421875, 11.80908203125, 12.586181640625, 13.36328125, 14.140380859375, 14.91748046875, 15.694580078125, 16.4716796875, 17.248779296875, 18.02587890625, 18.802978515625, 19.580078125, 20.357177734375, 21.13427734375, 21.911376953125, 22.6884765625, 23.465576171875, 24.24267578125, 25.019775390625, 25.796875]}, "gradients/decoder.bert.encoder.layer.5.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 1.0, 3.0, 3.0, 7.0, 7.0, 8.0, 14.0, 17.0, 16.0, 15.0, 22.0, 13.0, 34.0, 26.0, 33.0, 31.0, 36.0, 46.0, 45.0, 47.0, 37.0, 50.0, 50.0, 44.0, 36.0, 40.0, 32.0, 33.0, 43.0, 33.0, 39.0, 29.0, 28.0, 20.0, 12.0, 15.0, 8.0, 6.0, 7.0, 7.0, 7.0, 4.0, 3.0, 2.0, 2.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.171875, -8.8851318359375, -8.598388671875, -8.3116455078125, -8.02490234375, -7.7381591796875, -7.451416015625, -7.1646728515625, -6.8779296875, -6.5911865234375, -6.304443359375, -6.0177001953125, -5.73095703125, -5.4442138671875, -5.157470703125, -4.8707275390625, -4.583984375, -4.2972412109375, -4.010498046875, -3.7237548828125, -3.43701171875, -3.1502685546875, -2.863525390625, -2.5767822265625, -2.2900390625, -2.0032958984375, -1.716552734375, -1.4298095703125, -1.14306640625, -0.8563232421875, -0.569580078125, -0.2828369140625, 0.00390625, 0.2906494140625, 0.577392578125, 0.8641357421875, 1.15087890625, 1.4376220703125, 1.724365234375, 2.0111083984375, 2.2978515625, 2.5845947265625, 2.871337890625, 3.1580810546875, 3.44482421875, 3.7315673828125, 4.018310546875, 4.3050537109375, 4.591796875, 4.8785400390625, 5.165283203125, 5.4520263671875, 5.73876953125, 6.0255126953125, 6.312255859375, 6.5989990234375, 6.8857421875, 7.1724853515625, 7.459228515625, 7.7459716796875, 8.03271484375, 8.3194580078125, 8.606201171875, 8.8929443359375, 9.1796875]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 6.0, 3.0, 6.0, 11.0, 16.0, 27.0, 29.0, 66.0, 82.0, 124.0, 182.0, 320.0, 525.0, 780.0, 1232.0, 2117.0, 3602.0, 6873.0, 13220.0, 26876.0, 59489.0, 145020.0, 392073.0, 1085628.0, 1458504.0, 615320.0, 219290.0, 86389.0, 37562.0, 17827.0, 9117.0, 4944.0, 2826.0, 1634.0, 969.0, 596.0, 371.0, 211.0, 143.0, 85.0, 58.0, 46.0, 36.0, 17.0, 15.0, 10.0, 3.0, 8.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.953125, -26.996337890625, -26.03955078125, -25.082763671875, -24.1259765625, -23.169189453125, -22.21240234375, -21.255615234375, -20.298828125, -19.342041015625, -18.38525390625, -17.428466796875, -16.4716796875, -15.514892578125, -14.55810546875, -13.601318359375, -12.64453125, -11.687744140625, -10.73095703125, -9.774169921875, -8.8173828125, -7.860595703125, -6.90380859375, -5.947021484375, -4.990234375, -4.033447265625, -3.07666015625, -2.119873046875, -1.1630859375, -0.206298828125, 0.75048828125, 1.707275390625, 2.6640625, 3.620849609375, 4.57763671875, 5.534423828125, 6.4912109375, 7.447998046875, 8.40478515625, 9.361572265625, 10.318359375, 11.275146484375, 12.23193359375, 13.188720703125, 14.1455078125, 15.102294921875, 16.05908203125, 17.015869140625, 17.97265625, 18.929443359375, 19.88623046875, 20.843017578125, 21.7998046875, 22.756591796875, 23.71337890625, 24.670166015625, 25.626953125, 26.583740234375, 27.54052734375, 28.497314453125, 29.4541015625, 30.410888671875, 31.36767578125, 32.324462890625, 33.28125]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 3.0, 1.0, 9.0, 6.0, 13.0, 13.0, 22.0, 19.0, 35.0, 41.0, 55.0, 74.0, 100.0, 135.0, 151.0, 214.0, 234.0, 306.0, 311.0, 333.0, 315.0, 326.0, 310.0, 238.0, 199.0, 159.0, 113.0, 76.0, 68.0, 47.0, 40.0, 28.0, 17.0, 14.0, 12.0, 7.0, 7.0, 4.0, 2.0, 3.0, 2.0, 4.0, 3.0, 3.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-6.0, -5.7857666015625, -5.571533203125, -5.3572998046875, -5.14306640625, -4.9288330078125, -4.714599609375, -4.5003662109375, -4.2861328125, -4.0718994140625, -3.857666015625, -3.6434326171875, -3.42919921875, -3.2149658203125, -3.000732421875, -2.7864990234375, -2.572265625, -2.3580322265625, -2.143798828125, -1.9295654296875, -1.71533203125, -1.5010986328125, -1.286865234375, -1.0726318359375, -0.8583984375, -0.6441650390625, -0.429931640625, -0.2156982421875, -0.00146484375, 0.2127685546875, 0.427001953125, 0.6412353515625, 0.85546875, 1.0697021484375, 1.283935546875, 1.4981689453125, 1.71240234375, 1.9266357421875, 2.140869140625, 2.3551025390625, 2.5693359375, 2.7835693359375, 2.997802734375, 3.2120361328125, 3.42626953125, 3.6405029296875, 3.854736328125, 4.0689697265625, 4.283203125, 4.4974365234375, 4.711669921875, 4.9259033203125, 5.14013671875, 5.3543701171875, 5.568603515625, 5.7828369140625, 5.9970703125, 6.2113037109375, 6.425537109375, 6.6397705078125, 6.85400390625, 7.0682373046875, 7.282470703125, 7.4967041015625, 7.7109375]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 6.0, 6.0, 4.0, 12.0, 12.0, 20.0, 21.0, 35.0, 45.0, 59.0, 63.0, 101.0, 82.0, 92.0, 99.0, 77.0, 67.0, 44.0, 36.0, 32.0, 21.0, 18.0, 11.0, 9.0, 7.0, 4.0, 2.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.593488693237305, -22.65788459777832, -21.722280502319336, -20.78667640686035, -19.851070404052734, -18.91546630859375, -17.979862213134766, -17.04425811767578, -16.108654022216797, -15.173049926757812, -14.237445831298828, -13.301840782165527, -12.366236686706543, -11.430632591247559, -10.495027542114258, -9.559423446655273, -8.623819351196289, -7.688215255737305, -6.752610683441162, -5.8170061111450195, -4.881402015686035, -3.945797920227051, -3.010193347930908, -2.0745887756347656, -1.1389846801757812, -0.20338034629821777, 0.7322239875793457, 1.6678283214569092, 2.6034326553344727, 3.539036750793457, 4.4746413230896, 5.410245895385742, 6.345848083496094, 7.281452178955078, 8.217056274414062, 9.152661323547363, 10.088265419006348, 11.023869514465332, 11.959474563598633, 12.895078659057617, 13.830682754516602, 14.766286849975586, 15.70189094543457, 16.637495040893555, 17.573101043701172, 18.508705139160156, 19.44430923461914, 20.379913330078125, 21.31551742553711, 22.251121520996094, 23.186725616455078, 24.122329711914062, 25.057933807373047, 25.99353790283203, 26.92914390563965, 27.864748001098633, 28.800352096557617, 29.7359561920166, 30.671560287475586, 31.60716438293457, 32.54277038574219, 33.47837448120117, 34.413978576660156, 35.34958267211914, 36.285186767578125]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 2.0, 4.0, 3.0, 4.0, 10.0, 0.0, 14.0, 11.0, 13.0, 6.0, 7.0, 20.0, 21.0, 27.0, 20.0, 26.0, 38.0, 27.0, 35.0, 28.0, 38.0, 45.0, 36.0, 32.0, 27.0, 37.0, 32.0, 40.0, 40.0, 25.0, 34.0, 38.0, 38.0, 22.0, 27.0, 15.0, 21.0, 19.0, 16.0, 14.0, 15.0, 16.0, 13.0, 8.0, 12.0, 5.0, 7.0, 6.0, 6.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-8.33753490447998, -8.042204856872559, -7.746875762939453, -7.451545715332031, -7.156216144561768, -6.860886573791504, -6.56555700302124, -6.270227432250977, -5.974897384643555, -5.679567813873291, -5.384238243103027, -5.0889081954956055, -4.793578624725342, -4.498249053955078, -4.2029194831848145, -3.9075896739959717, -3.612260341644287, -3.3169307708740234, -3.0216009616851807, -2.726271390914917, -2.430941581726074, -2.1356120109558105, -1.8402824401855469, -1.544952630996704, -1.2496230602264404, -0.9542933702468872, -0.6589637398719788, -0.3636341094970703, -0.06830441951751709, 0.22702527046203613, 0.5223548412322998, 0.8176846504211426, 1.1130142211914062, 1.4083439111709595, 1.7036736011505127, 1.9990031719207764, 2.294332981109619, 2.589662551879883, 2.8849921226501465, 3.1803219318389893, 3.475651502609253, 3.7709810733795166, 4.066310882568359, 4.361640453338623, 4.656970024108887, 4.952300071716309, 5.247629165649414, 5.542959213256836, 5.8382887840271, 6.133618354797363, 6.428947925567627, 6.724277496337891, 7.0196075439453125, 7.314937114715576, 7.61026668548584, 7.905596733093262, 8.200925827026367, 8.496255874633789, 8.791584968566895, 9.086915016174316, 9.382244110107422, 9.677574157714844, 9.972904205322266, 10.268233299255371, 10.563563346862793]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.weight": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 6.0, 12.0, 7.0, 23.0, 22.0, 45.0, 55.0, 98.0, 119.0, 177.0, 268.0, 362.0, 559.0, 935.0, 1365.0, 2168.0, 3465.0, 5754.0, 10048.0, 17828.0, 33429.0, 62296.0, 115703.0, 191448.0, 226868.0, 165526.0, 94625.0, 51273.0, 27331.0, 15011.0, 8480.0, 4962.0, 2910.0, 1871.0, 1241.0, 761.0, 502.0, 311.0, 217.0, 162.0, 91.0, 76.0, 38.0, 26.0, 28.0, 25.0, 7.0, 10.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-11.4765625, -11.1103515625, -10.744140625, -10.3779296875, -10.01171875, -9.6455078125, -9.279296875, -8.9130859375, -8.546875, -8.1806640625, -7.814453125, -7.4482421875, -7.08203125, -6.7158203125, -6.349609375, -5.9833984375, -5.6171875, -5.2509765625, -4.884765625, -4.5185546875, -4.15234375, -3.7861328125, -3.419921875, -3.0537109375, -2.6875, -2.3212890625, -1.955078125, -1.5888671875, -1.22265625, -0.8564453125, -0.490234375, -0.1240234375, 0.2421875, 0.6083984375, 0.974609375, 1.3408203125, 1.70703125, 2.0732421875, 2.439453125, 2.8056640625, 3.171875, 3.5380859375, 3.904296875, 4.2705078125, 4.63671875, 5.0029296875, 5.369140625, 5.7353515625, 6.1015625, 6.4677734375, 6.833984375, 7.2001953125, 7.56640625, 7.9326171875, 8.298828125, 8.6650390625, 9.03125, 9.3974609375, 9.763671875, 10.1298828125, 10.49609375, 10.8623046875, 11.228515625, 11.5947265625, 11.9609375]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 5.0, 6.0, 2.0, 10.0, 6.0, 11.0, 13.0, 13.0, 21.0, 18.0, 30.0, 23.0, 35.0, 27.0, 45.0, 48.0, 36.0, 38.0, 57.0, 33.0, 43.0, 41.0, 34.0, 48.0, 37.0, 41.0, 41.0, 24.0, 30.0, 33.0, 18.0, 24.0, 19.0, 15.0, 14.0, 12.0, 12.0, 12.0, 4.0, 7.0, 9.0, 1.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.46875, -13.068359375, -12.66796875, -12.267578125, -11.8671875, -11.466796875, -11.06640625, -10.666015625, -10.265625, -9.865234375, -9.46484375, -9.064453125, -8.6640625, -8.263671875, -7.86328125, -7.462890625, -7.0625, -6.662109375, -6.26171875, -5.861328125, -5.4609375, -5.060546875, -4.66015625, -4.259765625, -3.859375, -3.458984375, -3.05859375, -2.658203125, -2.2578125, -1.857421875, -1.45703125, -1.056640625, -0.65625, -0.255859375, 0.14453125, 0.544921875, 0.9453125, 1.345703125, 1.74609375, 2.146484375, 2.546875, 2.947265625, 3.34765625, 3.748046875, 4.1484375, 4.548828125, 4.94921875, 5.349609375, 5.75, 6.150390625, 6.55078125, 6.951171875, 7.3515625, 7.751953125, 8.15234375, 8.552734375, 8.953125, 9.353515625, 9.75390625, 10.154296875, 10.5546875, 10.955078125, 11.35546875, 11.755859375, 12.15625]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 12.0, 13.0, 23.0, 23.0, 23.0, 39.0, 49.0, 76.0, 116.0, 147.0, 217.0, 290.0, 432.0, 549.0, 811.0, 1273.0, 1933.0, 3152.0, 5155.0, 9127.0, 17017.0, 34499.0, 72511.0, 157662.0, 279769.0, 235762.0, 116378.0, 53464.0, 25808.0, 13111.0, 7212.0, 4217.0, 2511.0, 1722.0, 1021.0, 683.0, 489.0, 348.0, 247.0, 183.0, 122.0, 92.0, 72.0, 56.0, 39.0, 35.0, 19.0, 9.0, 15.0, 6.0, 6.0, 5.0, 3.0, 3.0, 3.0, 3.0], "bins": [-15.8046875, -15.3228759765625, -14.841064453125, -14.3592529296875, -13.87744140625, -13.3956298828125, -12.913818359375, -12.4320068359375, -11.9501953125, -11.4683837890625, -10.986572265625, -10.5047607421875, -10.02294921875, -9.5411376953125, -9.059326171875, -8.5775146484375, -8.095703125, -7.6138916015625, -7.132080078125, -6.6502685546875, -6.16845703125, -5.6866455078125, -5.204833984375, -4.7230224609375, -4.2412109375, -3.7593994140625, -3.277587890625, -2.7957763671875, -2.31396484375, -1.8321533203125, -1.350341796875, -0.8685302734375, -0.38671875, 0.0950927734375, 0.576904296875, 1.0587158203125, 1.54052734375, 2.0223388671875, 2.504150390625, 2.9859619140625, 3.4677734375, 3.9495849609375, 4.431396484375, 4.9132080078125, 5.39501953125, 5.8768310546875, 6.358642578125, 6.8404541015625, 7.322265625, 7.8040771484375, 8.285888671875, 8.7677001953125, 9.24951171875, 9.7313232421875, 10.213134765625, 10.6949462890625, 11.1767578125, 11.6585693359375, 12.140380859375, 12.6221923828125, 13.10400390625, 13.5858154296875, 14.067626953125, 14.5494384765625, 15.03125]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 5.0, 5.0, 9.0, 7.0, 8.0, 9.0, 10.0, 14.0, 16.0, 15.0, 16.0, 27.0, 20.0, 33.0, 32.0, 32.0, 37.0, 39.0, 25.0, 42.0, 30.0, 38.0, 44.0, 40.0, 45.0, 40.0, 41.0, 39.0, 30.0, 41.0, 23.0, 26.0, 35.0, 25.0, 13.0, 14.0, 14.0, 16.0, 11.0, 9.0, 9.0, 4.0, 6.0, 4.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-7.76171875, -7.53497314453125, -7.3082275390625, -7.08148193359375, -6.854736328125, -6.62799072265625, -6.4012451171875, -6.17449951171875, -5.94775390625, -5.72100830078125, -5.4942626953125, -5.26751708984375, -5.040771484375, -4.81402587890625, -4.5872802734375, -4.36053466796875, -4.1337890625, -3.90704345703125, -3.6802978515625, -3.45355224609375, -3.226806640625, -3.00006103515625, -2.7733154296875, -2.54656982421875, -2.31982421875, -2.09307861328125, -1.8663330078125, -1.63958740234375, -1.412841796875, -1.18609619140625, -0.9593505859375, -0.73260498046875, -0.505859375, -0.27911376953125, -0.0523681640625, 0.17437744140625, 0.401123046875, 0.62786865234375, 0.8546142578125, 1.08135986328125, 1.30810546875, 1.53485107421875, 1.7615966796875, 1.98834228515625, 2.215087890625, 2.44183349609375, 2.6685791015625, 2.89532470703125, 3.1220703125, 3.34881591796875, 3.5755615234375, 3.80230712890625, 4.029052734375, 4.25579833984375, 4.4825439453125, 4.70928955078125, 4.93603515625, 5.16278076171875, 5.3895263671875, 5.61627197265625, 5.843017578125, 6.06976318359375, 6.2965087890625, 6.52325439453125, 6.75]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 5.0, 6.0, 3.0, 2.0, 4.0, 10.0, 19.0, 22.0, 18.0, 22.0, 35.0, 40.0, 58.0, 85.0, 101.0, 147.0, 220.0, 345.0, 419.0, 562.0, 948.0, 1412.0, 2501.0, 4712.0, 11178.0, 33009.0, 136622.0, 541273.0, 235715.0, 49768.0, 14882.0, 6213.0, 3049.0, 1746.0, 1079.0, 675.0, 438.0, 353.0, 255.0, 148.0, 123.0, 93.0, 63.0, 55.0, 36.0, 30.0, 21.0, 12.0, 13.0, 9.0, 6.0, 4.0, 4.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.0625, -10.676513671875, -10.29052734375, -9.904541015625, -9.5185546875, -9.132568359375, -8.74658203125, -8.360595703125, -7.974609375, -7.588623046875, -7.20263671875, -6.816650390625, -6.4306640625, -6.044677734375, -5.65869140625, -5.272705078125, -4.88671875, -4.500732421875, -4.11474609375, -3.728759765625, -3.3427734375, -2.956787109375, -2.57080078125, -2.184814453125, -1.798828125, -1.412841796875, -1.02685546875, -0.640869140625, -0.2548828125, 0.131103515625, 0.51708984375, 0.903076171875, 1.2890625, 1.675048828125, 2.06103515625, 2.447021484375, 2.8330078125, 3.218994140625, 3.60498046875, 3.990966796875, 4.376953125, 4.762939453125, 5.14892578125, 5.534912109375, 5.9208984375, 6.306884765625, 6.69287109375, 7.078857421875, 7.46484375, 7.850830078125, 8.23681640625, 8.622802734375, 9.0087890625, 9.394775390625, 9.78076171875, 10.166748046875, 10.552734375, 10.938720703125, 11.32470703125, 11.710693359375, 12.0966796875, 12.482666015625, 12.86865234375, 13.254638671875, 13.640625]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 3.0, 4.0, 9.0, 9.0, 20.0, 25.0, 52.0, 99.0, 153.0, 185.0, 158.0, 121.0, 63.0, 44.0, 18.0, 15.0, 8.0, 1.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0007781982421875, -0.0007500648498535156, -0.0007219314575195312, -0.0006937980651855469, -0.0006656646728515625, -0.0006375312805175781, -0.0006093978881835938, -0.0005812644958496094, -0.000553131103515625, -0.0005249977111816406, -0.0004968643188476562, -0.0004687309265136719, -0.0004405975341796875, -0.0004124641418457031, -0.00038433074951171875, -0.0003561973571777344, -0.00032806396484375, -0.0002999305725097656, -0.00027179718017578125, -0.00024366378784179688, -0.0002155303955078125, -0.00018739700317382812, -0.00015926361083984375, -0.00013113021850585938, -0.000102996826171875, -7.486343383789062e-05, -4.673004150390625e-05, -1.8596649169921875e-05, 9.5367431640625e-06, 3.7670135498046875e-05, 6.580352783203125e-05, 9.393692016601562e-05, 0.0001220703125, 0.00015020370483398438, 0.00017833709716796875, 0.00020647048950195312, 0.0002346038818359375, 0.0002627372741699219, 0.00029087066650390625, 0.0003190040588378906, 0.000347137451171875, 0.0003752708435058594, 0.00040340423583984375, 0.0004315376281738281, 0.0004596710205078125, 0.0004878044128417969, 0.0005159378051757812, 0.0005440711975097656, 0.00057220458984375, 0.0006003379821777344, 0.0006284713745117188, 0.0006566047668457031, 0.0006847381591796875, 0.0007128715515136719, 0.0007410049438476562, 0.0007691383361816406, 0.000797271728515625, 0.0008254051208496094, 0.0008535385131835938, 0.0008816719055175781, 0.0009098052978515625, 0.0009379386901855469, 0.0009660720825195312, 0.0009942054748535156, 0.0010223388671875]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 5.0, 10.0, 17.0, 28.0, 36.0, 39.0, 55.0, 70.0, 111.0, 149.0, 207.0, 252.0, 349.0, 447.0, 581.0, 817.0, 1037.0, 1553.0, 2237.0, 3440.0, 6096.0, 13101.0, 34543.0, 109532.0, 329728.0, 351845.0, 121925.0, 37982.0, 14064.0, 6461.0, 3563.0, 2220.0, 1595.0, 1158.0, 875.0, 620.0, 456.0, 338.0, 291.0, 192.0, 137.0, 114.0, 75.0, 68.0, 42.0, 28.0, 18.0, 20.0, 12.0, 4.0, 2.0, 3.0, 4.0, 2.0, 0.0, 3.0], "bins": [-10.7578125, -10.4322509765625, -10.106689453125, -9.7811279296875, -9.45556640625, -9.1300048828125, -8.804443359375, -8.4788818359375, -8.1533203125, -7.8277587890625, -7.502197265625, -7.1766357421875, -6.85107421875, -6.5255126953125, -6.199951171875, -5.8743896484375, -5.548828125, -5.2232666015625, -4.897705078125, -4.5721435546875, -4.24658203125, -3.9210205078125, -3.595458984375, -3.2698974609375, -2.9443359375, -2.6187744140625, -2.293212890625, -1.9676513671875, -1.64208984375, -1.3165283203125, -0.990966796875, -0.6654052734375, -0.33984375, -0.0142822265625, 0.311279296875, 0.6368408203125, 0.96240234375, 1.2879638671875, 1.613525390625, 1.9390869140625, 2.2646484375, 2.5902099609375, 2.915771484375, 3.2413330078125, 3.56689453125, 3.8924560546875, 4.218017578125, 4.5435791015625, 4.869140625, 5.1947021484375, 5.520263671875, 5.8458251953125, 6.17138671875, 6.4969482421875, 6.822509765625, 7.1480712890625, 7.4736328125, 7.7991943359375, 8.124755859375, 8.4503173828125, 8.77587890625, 9.1014404296875, 9.427001953125, 9.7525634765625, 10.078125]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 4.0, 3.0, 11.0, 8.0, 15.0, 11.0, 18.0, 23.0, 31.0, 27.0, 54.0, 58.0, 75.0, 86.0, 108.0, 91.0, 82.0, 65.0, 55.0, 49.0, 29.0, 24.0, 14.0, 18.0, 10.0, 5.0, 9.0, 3.0, 2.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8740234375, -1.8064422607421875, -1.738861083984375, -1.6712799072265625, -1.60369873046875, -1.5361175537109375, -1.468536376953125, -1.4009552001953125, -1.3333740234375, -1.2657928466796875, -1.198211669921875, -1.1306304931640625, -1.06304931640625, -0.9954681396484375, -0.927886962890625, -0.8603057861328125, -0.792724609375, -0.7251434326171875, -0.657562255859375, -0.5899810791015625, -0.52239990234375, -0.4548187255859375, -0.387237548828125, -0.3196563720703125, -0.2520751953125, -0.1844940185546875, -0.116912841796875, -0.0493316650390625, 0.01824951171875, 0.0858306884765625, 0.153411865234375, 0.2209930419921875, 0.28857421875, 0.3561553955078125, 0.423736572265625, 0.4913177490234375, 0.55889892578125, 0.6264801025390625, 0.694061279296875, 0.7616424560546875, 0.8292236328125, 0.8968048095703125, 0.964385986328125, 1.0319671630859375, 1.09954833984375, 1.1671295166015625, 1.234710693359375, 1.3022918701171875, 1.369873046875, 1.4374542236328125, 1.505035400390625, 1.5726165771484375, 1.64019775390625, 1.7077789306640625, 1.775360107421875, 1.8429412841796875, 1.9105224609375, 1.9781036376953125, 2.045684814453125, 2.1132659912109375, 2.18084716796875, 2.2484283447265625, 2.316009521484375, 2.3835906982421875, 2.451171875]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 2.0, 4.0, 2.0, 3.0, 4.0, 6.0, 11.0, 11.0, 12.0, 25.0, 24.0, 35.0, 40.0, 68.0, 77.0, 86.0, 88.0, 95.0, 80.0, 84.0, 61.0, 52.0, 25.0, 26.0, 20.0, 17.0, 14.0, 11.0, 3.0, 4.0, 4.0, 5.0, 1.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.817096710205078, -21.90509605407715, -20.99309539794922, -20.08109474182129, -19.16909408569336, -18.25709342956543, -17.3450927734375, -16.433090209960938, -15.521090507507324, -14.609089851379395, -13.697089195251465, -12.785087585449219, -11.873086929321289, -10.96108627319336, -10.04908561706543, -9.1370849609375, -8.22508430480957, -7.313083648681641, -6.401082992553711, -5.489081859588623, -4.577081203460693, -3.6650805473327637, -2.753079414367676, -1.841078758239746, -0.9290781021118164, -0.017077326774597168, 0.8949234485626221, 1.8069243431091309, 2.7189249992370605, 3.6309256553649902, 4.542926788330078, 5.454927444458008, 6.3669281005859375, 7.278928756713867, 8.190929412841797, 9.102930068969727, 10.014930725097656, 10.926931381225586, 11.838932991027832, 12.750933647155762, 13.662934303283691, 14.574934959411621, 15.48693561553955, 16.398937225341797, 17.310937881469727, 18.222938537597656, 19.134939193725586, 20.046939849853516, 20.958940505981445, 21.870941162109375, 22.782941818237305, 23.694942474365234, 24.606943130493164, 25.518943786621094, 26.430946350097656, 27.342945098876953, 28.254947662353516, 29.166948318481445, 30.078948974609375, 30.990949630737305, 31.902950286865234, 32.8149528503418, 33.726951599121094, 34.638954162597656, 35.55095291137695]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 6.0, 2.0, 1.0, 4.0, 3.0, 2.0, 7.0, 8.0, 11.0, 11.0, 9.0, 11.0, 9.0, 17.0, 19.0, 22.0, 22.0, 26.0, 28.0, 38.0, 31.0, 27.0, 39.0, 43.0, 25.0, 44.0, 36.0, 32.0, 26.0, 39.0, 34.0, 34.0, 31.0, 37.0, 26.0, 34.0, 24.0, 25.0, 25.0, 17.0, 11.0, 15.0, 16.0, 18.0, 13.0, 13.0, 7.0, 8.0, 6.0, 6.0, 7.0, 3.0, 5.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-8.32688045501709, -8.037407875061035, -7.747934341430664, -7.458461284637451, -7.168988227844238, -6.879515171051025, -6.5900421142578125, -6.300569534301758, -6.011096000671387, -5.721622943878174, -5.432149887084961, -5.142676830291748, -4.853203773498535, -4.563730716705322, -4.274257659912109, -3.9847848415374756, -3.695312023162842, -3.405838966369629, -3.116365909576416, -2.826892852783203, -2.5374197959899902, -2.2479467391967773, -1.9584739208221436, -1.6690008640289307, -1.3795278072357178, -1.0900547504425049, -0.8005817532539368, -0.5111087560653687, -0.22163569927215576, 0.06783735752105713, 0.35731029510498047, 0.6467833518981934, 0.9362564086914062, 1.2257294654846191, 1.515202522277832, 1.8046754598617554, 2.094148635864258, 2.3836216926574707, 2.6730945110321045, 2.9625675678253174, 3.2520406246185303, 3.541513681411743, 3.830986738204956, 4.12045955657959, 4.409932613372803, 4.699405670166016, 4.9888787269592285, 5.278351783752441, 5.567824840545654, 5.857297897338867, 6.14677095413208, 6.436244010925293, 6.725717067718506, 7.015190124511719, 7.304662704467773, 7.5941362380981445, 7.883608818054199, 8.173081398010254, 8.462554931640625, 8.75202751159668, 9.04150104522705, 9.330973625183105, 9.620447158813477, 9.909919738769531, 10.199393272399902]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 6.0, 8.0, 13.0, 14.0, 35.0, 47.0, 61.0, 114.0, 194.0, 343.0, 581.0, 1097.0, 1918.0, 3510.0, 6753.0, 12366.0, 23467.0, 43282.0, 79113.0, 131211.0, 187697.0, 197319.0, 150933.0, 94354.0, 52532.0, 28471.0, 15224.0, 8181.0, 4292.0, 2397.0, 1336.0, 707.0, 399.0, 245.0, 133.0, 74.0, 38.0, 25.0, 23.0, 17.0, 6.0, 5.0, 8.0, 4.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0], "bins": [-21.46875, -20.858154296875, -20.24755859375, -19.636962890625, -19.0263671875, -18.415771484375, -17.80517578125, -17.194580078125, -16.583984375, -15.973388671875, -15.36279296875, -14.752197265625, -14.1416015625, -13.531005859375, -12.92041015625, -12.309814453125, -11.69921875, -11.088623046875, -10.47802734375, -9.867431640625, -9.2568359375, -8.646240234375, -8.03564453125, -7.425048828125, -6.814453125, -6.203857421875, -5.59326171875, -4.982666015625, -4.3720703125, -3.761474609375, -3.15087890625, -2.540283203125, -1.9296875, -1.319091796875, -0.70849609375, -0.097900390625, 0.5126953125, 1.123291015625, 1.73388671875, 2.344482421875, 2.955078125, 3.565673828125, 4.17626953125, 4.786865234375, 5.3974609375, 6.008056640625, 6.61865234375, 7.229248046875, 7.83984375, 8.450439453125, 9.06103515625, 9.671630859375, 10.2822265625, 10.892822265625, 11.50341796875, 12.114013671875, 12.724609375, 13.335205078125, 13.94580078125, 14.556396484375, 15.1669921875, 15.777587890625, 16.38818359375, 16.998779296875, 17.609375]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 6.0, 4.0, 7.0, 8.0, 18.0, 12.0, 25.0, 15.0, 24.0, 30.0, 33.0, 49.0, 44.0, 39.0, 58.0, 51.0, 46.0, 59.0, 40.0, 49.0, 52.0, 52.0, 52.0, 31.0, 41.0, 32.0, 20.0, 26.0, 20.0, 13.0, 16.0, 10.0, 13.0, 6.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.859375, -12.398681640625, -11.93798828125, -11.477294921875, -11.0166015625, -10.555908203125, -10.09521484375, -9.634521484375, -9.173828125, -8.713134765625, -8.25244140625, -7.791748046875, -7.3310546875, -6.870361328125, -6.40966796875, -5.948974609375, -5.48828125, -5.027587890625, -4.56689453125, -4.106201171875, -3.6455078125, -3.184814453125, -2.72412109375, -2.263427734375, -1.802734375, -1.342041015625, -0.88134765625, -0.420654296875, 0.0400390625, 0.500732421875, 0.96142578125, 1.422119140625, 1.8828125, 2.343505859375, 2.80419921875, 3.264892578125, 3.7255859375, 4.186279296875, 4.64697265625, 5.107666015625, 5.568359375, 6.029052734375, 6.48974609375, 6.950439453125, 7.4111328125, 7.871826171875, 8.33251953125, 8.793212890625, 9.25390625, 9.714599609375, 10.17529296875, 10.635986328125, 11.0966796875, 11.557373046875, 12.01806640625, 12.478759765625, 12.939453125, 13.400146484375, 13.86083984375, 14.321533203125, 14.7822265625, 15.242919921875, 15.70361328125, 16.164306640625, 16.625]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 7.0, 7.0, 15.0, 36.0, 40.0, 69.0, 90.0, 166.0, 198.0, 322.0, 491.0, 906.0, 1351.0, 2128.0, 3451.0, 5755.0, 9216.0, 15169.0, 24164.0, 38932.0, 60242.0, 89284.0, 121722.0, 147490.0, 147776.0, 123737.0, 90546.0, 60990.0, 39202.0, 24669.0, 15321.0, 9611.0, 5766.0, 3622.0, 2219.0, 1415.0, 891.0, 556.0, 366.0, 217.0, 134.0, 89.0, 66.0, 40.0, 21.0, 20.0, 9.0, 12.0, 9.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.8515625, -12.4234619140625, -11.995361328125, -11.5672607421875, -11.13916015625, -10.7110595703125, -10.282958984375, -9.8548583984375, -9.4267578125, -8.9986572265625, -8.570556640625, -8.1424560546875, -7.71435546875, -7.2862548828125, -6.858154296875, -6.4300537109375, -6.001953125, -5.5738525390625, -5.145751953125, -4.7176513671875, -4.28955078125, -3.8614501953125, -3.433349609375, -3.0052490234375, -2.5771484375, -2.1490478515625, -1.720947265625, -1.2928466796875, -0.86474609375, -0.4366455078125, -0.008544921875, 0.4195556640625, 0.84765625, 1.2757568359375, 1.703857421875, 2.1319580078125, 2.56005859375, 2.9881591796875, 3.416259765625, 3.8443603515625, 4.2724609375, 4.7005615234375, 5.128662109375, 5.5567626953125, 5.98486328125, 6.4129638671875, 6.841064453125, 7.2691650390625, 7.697265625, 8.1253662109375, 8.553466796875, 8.9815673828125, 9.40966796875, 9.8377685546875, 10.265869140625, 10.6939697265625, 11.1220703125, 11.5501708984375, 11.978271484375, 12.4063720703125, 12.83447265625, 13.2625732421875, 13.690673828125, 14.1187744140625, 14.546875]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 5.0, 5.0, 1.0, 4.0, 6.0, 9.0, 14.0, 14.0, 27.0, 19.0, 30.0, 34.0, 24.0, 22.0, 46.0, 48.0, 50.0, 41.0, 40.0, 57.0, 40.0, 47.0, 34.0, 42.0, 33.0, 36.0, 27.0, 33.0, 29.0, 32.0, 25.0, 25.0, 23.0, 15.0, 17.0, 9.0, 11.0, 5.0, 7.0, 10.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.7578125, -6.52874755859375, -6.2996826171875, -6.07061767578125, -5.841552734375, -5.61248779296875, -5.3834228515625, -5.15435791015625, -4.92529296875, -4.69622802734375, -4.4671630859375, -4.23809814453125, -4.009033203125, -3.77996826171875, -3.5509033203125, -3.32183837890625, -3.0927734375, -2.86370849609375, -2.6346435546875, -2.40557861328125, -2.176513671875, -1.94744873046875, -1.7183837890625, -1.48931884765625, -1.26025390625, -1.03118896484375, -0.8021240234375, -0.57305908203125, -0.343994140625, -0.11492919921875, 0.1141357421875, 0.34320068359375, 0.572265625, 0.80133056640625, 1.0303955078125, 1.25946044921875, 1.488525390625, 1.71759033203125, 1.9466552734375, 2.17572021484375, 2.40478515625, 2.63385009765625, 2.8629150390625, 3.09197998046875, 3.321044921875, 3.55010986328125, 3.7791748046875, 4.00823974609375, 4.2373046875, 4.46636962890625, 4.6954345703125, 4.92449951171875, 5.153564453125, 5.38262939453125, 5.6116943359375, 5.84075927734375, 6.06982421875, 6.29888916015625, 6.5279541015625, 6.75701904296875, 6.986083984375, 7.21514892578125, 7.4442138671875, 7.67327880859375, 7.90234375]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 3.0, 6.0, 11.0, 25.0, 23.0, 35.0, 54.0, 69.0, 97.0, 136.0, 208.0, 344.0, 452.0, 659.0, 1033.0, 1577.0, 2503.0, 3927.0, 6525.0, 10733.0, 18270.0, 31246.0, 53871.0, 91598.0, 143655.0, 187235.0, 178077.0, 126762.0, 77669.0, 45479.0, 26292.0, 15411.0, 9095.0, 5667.0, 3453.0, 2175.0, 1375.0, 887.0, 568.0, 413.0, 298.0, 200.0, 122.0, 98.0, 61.0, 47.0, 24.0, 29.0, 20.0, 12.0, 11.0, 10.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.81640625, -6.60235595703125, -6.3883056640625, -6.17425537109375, -5.960205078125, -5.74615478515625, -5.5321044921875, -5.31805419921875, -5.10400390625, -4.88995361328125, -4.6759033203125, -4.46185302734375, -4.247802734375, -4.03375244140625, -3.8197021484375, -3.60565185546875, -3.3916015625, -3.17755126953125, -2.9635009765625, -2.74945068359375, -2.535400390625, -2.32135009765625, -2.1072998046875, -1.89324951171875, -1.67919921875, -1.46514892578125, -1.2510986328125, -1.03704833984375, -0.822998046875, -0.60894775390625, -0.3948974609375, -0.18084716796875, 0.033203125, 0.24725341796875, 0.4613037109375, 0.67535400390625, 0.889404296875, 1.10345458984375, 1.3175048828125, 1.53155517578125, 1.74560546875, 1.95965576171875, 2.1737060546875, 2.38775634765625, 2.601806640625, 2.81585693359375, 3.0299072265625, 3.24395751953125, 3.4580078125, 3.67205810546875, 3.8861083984375, 4.10015869140625, 4.314208984375, 4.52825927734375, 4.7423095703125, 4.95635986328125, 5.17041015625, 5.38446044921875, 5.5985107421875, 5.81256103515625, 6.026611328125, 6.24066162109375, 6.4547119140625, 6.66876220703125, 6.8828125]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 7.0, 9.0, 10.0, 19.0, 13.0, 26.0, 28.0, 37.0, 42.0, 55.0, 66.0, 76.0, 98.0, 87.0, 95.0, 78.0, 66.0, 47.0, 33.0, 26.0, 17.0, 11.0, 11.0, 15.0, 7.0, 8.0, 4.0, 3.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0010080337524414062, -0.0009734034538269043, -0.0009387731552124023, -0.0009041428565979004, -0.0008695125579833984, -0.0008348822593688965, -0.0008002519607543945, -0.0007656216621398926, -0.0007309913635253906, -0.0006963610649108887, -0.0006617307662963867, -0.0006271004676818848, -0.0005924701690673828, -0.0005578398704528809, -0.0005232095718383789, -0.000488579273223877, -0.000453948974609375, -0.00041931867599487305, -0.0003846883773803711, -0.00035005807876586914, -0.0003154277801513672, -0.00028079748153686523, -0.0002461671829223633, -0.00021153688430786133, -0.00017690658569335938, -0.00014227628707885742, -0.00010764598846435547, -7.301568984985352e-05, -3.838539123535156e-05, -3.7550926208496094e-06, 3.0875205993652344e-05, 6.55055046081543e-05, 0.00010013580322265625, 0.0001347661018371582, 0.00016939640045166016, 0.0002040266990661621, 0.00023865699768066406, 0.000273287296295166, 0.00030791759490966797, 0.0003425478935241699, 0.0003771781921386719, 0.00041180849075317383, 0.0004464387893676758, 0.00048106908798217773, 0.0005156993865966797, 0.0005503296852111816, 0.0005849599838256836, 0.0006195902824401855, 0.0006542205810546875, 0.0006888508796691895, 0.0007234811782836914, 0.0007581114768981934, 0.0007927417755126953, 0.0008273720741271973, 0.0008620023727416992, 0.0008966326713562012, 0.0009312629699707031, 0.0009658932685852051, 0.001000523567199707, 0.001035153865814209, 0.001069784164428711, 0.0011044144630432129, 0.0011390447616577148, 0.0011736750602722168, 0.0012083053588867188]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 14.0, 5.0, 12.0, 24.0, 44.0, 45.0, 125.0, 156.0, 259.0, 425.0, 690.0, 1103.0, 1941.0, 3354.0, 5920.0, 10659.0, 19632.0, 37116.0, 71023.0, 128020.0, 198449.0, 217044.0, 157031.0, 90380.0, 48526.0, 25189.0, 13611.0, 7529.0, 4221.0, 2491.0, 1452.0, 773.0, 515.0, 305.0, 171.0, 108.0, 81.0, 42.0, 32.0, 15.0, 17.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.0859375, -8.82781982421875, -8.5697021484375, -8.31158447265625, -8.053466796875, -7.79534912109375, -7.5372314453125, -7.27911376953125, -7.02099609375, -6.76287841796875, -6.5047607421875, -6.24664306640625, -5.988525390625, -5.73040771484375, -5.4722900390625, -5.21417236328125, -4.9560546875, -4.69793701171875, -4.4398193359375, -4.18170166015625, -3.923583984375, -3.66546630859375, -3.4073486328125, -3.14923095703125, -2.89111328125, -2.63299560546875, -2.3748779296875, -2.11676025390625, -1.858642578125, -1.60052490234375, -1.3424072265625, -1.08428955078125, -0.826171875, -0.56805419921875, -0.3099365234375, -0.05181884765625, 0.206298828125, 0.46441650390625, 0.7225341796875, 0.98065185546875, 1.23876953125, 1.49688720703125, 1.7550048828125, 2.01312255859375, 2.271240234375, 2.52935791015625, 2.7874755859375, 3.04559326171875, 3.3037109375, 3.56182861328125, 3.8199462890625, 4.07806396484375, 4.336181640625, 4.59429931640625, 4.8524169921875, 5.11053466796875, 5.36865234375, 5.62677001953125, 5.8848876953125, 6.14300537109375, 6.401123046875, 6.65924072265625, 6.9173583984375, 7.17547607421875, 7.43359375]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 9.0, 7.0, 6.0, 8.0, 18.0, 10.0, 21.0, 17.0, 18.0, 25.0, 25.0, 26.0, 34.0, 36.0, 50.0, 39.0, 72.0, 56.0, 57.0, 40.0, 38.0, 43.0, 60.0, 47.0, 29.0, 27.0, 24.0, 28.0, 17.0, 19.0, 22.0, 10.0, 10.0, 7.0, 7.0, 11.0, 15.0, 4.0, 5.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.046875, -1.983001708984375, -1.91912841796875, -1.855255126953125, -1.7913818359375, -1.727508544921875, -1.66363525390625, -1.599761962890625, -1.535888671875, -1.472015380859375, -1.40814208984375, -1.344268798828125, -1.2803955078125, -1.216522216796875, -1.15264892578125, -1.088775634765625, -1.02490234375, -0.961029052734375, -0.89715576171875, -0.833282470703125, -0.7694091796875, -0.705535888671875, -0.64166259765625, -0.577789306640625, -0.513916015625, -0.450042724609375, -0.38616943359375, -0.322296142578125, -0.2584228515625, -0.194549560546875, -0.13067626953125, -0.066802978515625, -0.0029296875, 0.060943603515625, 0.12481689453125, 0.188690185546875, 0.2525634765625, 0.316436767578125, 0.38031005859375, 0.444183349609375, 0.508056640625, 0.571929931640625, 0.63580322265625, 0.699676513671875, 0.7635498046875, 0.827423095703125, 0.89129638671875, 0.955169677734375, 1.01904296875, 1.082916259765625, 1.14678955078125, 1.210662841796875, 1.2745361328125, 1.338409423828125, 1.40228271484375, 1.466156005859375, 1.530029296875, 1.593902587890625, 1.65777587890625, 1.721649169921875, 1.7855224609375, 1.849395751953125, 1.91326904296875, 1.977142333984375, 2.041015625]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 3.0, 3.0, 6.0, 6.0, 12.0, 8.0, 15.0, 25.0, 22.0, 24.0, 38.0, 49.0, 52.0, 71.0, 85.0, 77.0, 80.0, 79.0, 67.0, 64.0, 50.0, 40.0, 27.0, 17.0, 14.0, 16.0, 8.0, 15.0, 6.0, 6.0, 2.0, 3.0, 3.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.304981231689453, -20.486417770385742, -19.66785430908203, -18.84929084777832, -18.03072738647461, -17.2121639251709, -16.393600463867188, -15.575037002563477, -14.756473541259766, -13.937910079956055, -13.119346618652344, -12.300783157348633, -11.482219696044922, -10.663656234741211, -9.8450927734375, -9.026529312133789, -8.207964897155762, -7.389401435852051, -6.57083797454834, -5.752274513244629, -4.933711051940918, -4.115147113800049, -3.296583652496338, -2.478020191192627, -1.659456729888916, -0.8408932089805603, -0.02232968807220459, 0.7962338924407959, 1.6147973537445068, 2.433361053466797, 3.251924514770508, 4.070487976074219, 4.88905143737793, 5.707614898681641, 6.526178359985352, 7.3447418212890625, 8.163305282592773, 8.981868743896484, 9.800432205200195, 10.618995666503906, 11.437559127807617, 12.256122589111328, 13.074686050415039, 13.89324951171875, 14.711812973022461, 15.530376434326172, 16.348939895629883, 17.167503356933594, 17.986068725585938, 18.80463218688965, 19.62319564819336, 20.44175910949707, 21.26032257080078, 22.078886032104492, 22.897449493408203, 23.716012954711914, 24.534576416015625, 25.353139877319336, 26.171703338623047, 26.990266799926758, 27.80883026123047, 28.62739372253418, 29.44595718383789, 30.2645206451416, 31.083084106445312]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.bias": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 2.0, 7.0, 6.0, 7.0, 6.0, 9.0, 10.0, 8.0, 15.0, 8.0, 12.0, 17.0, 17.0, 18.0, 21.0, 25.0, 25.0, 26.0, 26.0, 40.0, 40.0, 31.0, 32.0, 39.0, 41.0, 29.0, 34.0, 39.0, 37.0, 25.0, 34.0, 25.0, 31.0, 33.0, 25.0, 30.0, 14.0, 19.0, 15.0, 21.0, 11.0, 14.0, 12.0, 15.0, 9.0, 8.0, 9.0, 5.0, 6.0, 3.0, 7.0, 5.0, 1.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.12578010559082, -7.842883110046387, -7.559986114501953, -7.2770891189575195, -6.994192123413086, -6.711295127868652, -6.428398609161377, -6.145501613616943, -5.86260461807251, -5.579707622528076, -5.296810626983643, -5.013913631439209, -4.731017112731934, -4.4481201171875, -4.165223121643066, -3.882326126098633, -3.599429130554199, -3.3165321350097656, -3.033635139465332, -2.7507383823394775, -2.467841386795044, -2.1849443912506104, -1.9020475149154663, -1.6191506385803223, -1.3362536430358887, -1.053356647491455, -0.770459771156311, -0.4875628352165222, -0.2046658992767334, 0.0782310962677002, 0.36112797260284424, 0.6440248489379883, 0.9269227981567383, 1.2098197937011719, 1.492716670036316, 1.77561354637146, 2.0585105419158936, 2.341407537460327, 2.6243042945861816, 2.9072012901306152, 3.190098285675049, 3.4729952812194824, 3.755892276763916, 4.03878927230835, 4.321685791015625, 4.604582786560059, 4.887479782104492, 5.170376777648926, 5.453273773193359, 5.736170768737793, 6.019067764282227, 6.30196475982666, 6.584861755371094, 6.867758750915527, 7.150655269622803, 7.433552265167236, 7.71644926071167, 7.9993462562561035, 8.282242774963379, 8.565139770507812, 8.848036766052246, 9.13093376159668, 9.413830757141113, 9.696727752685547, 9.97962474822998]}, "gradients/decoder.bert.encoder.layer.4.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 11.0, 11.0, 17.0, 25.0, 32.0, 61.0, 72.0, 98.0, 174.0, 278.0, 433.0, 628.0, 995.0, 1662.0, 2646.0, 4622.0, 8258.0, 15521.0, 30661.0, 68161.0, 168702.0, 477298.0, 1261938.0, 1326379.0, 509489.0, 177687.0, 70531.0, 31608.0, 15910.0, 8404.0, 4574.0, 2772.0, 1672.0, 970.0, 704.0, 409.0, 293.0, 188.0, 112.0, 72.0, 67.0, 46.0, 27.0, 20.0, 14.0, 11.0, 10.0, 9.0, 3.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-23.828125, -22.912841796875, -21.99755859375, -21.082275390625, -20.1669921875, -19.251708984375, -18.33642578125, -17.421142578125, -16.505859375, -15.590576171875, -14.67529296875, -13.760009765625, -12.8447265625, -11.929443359375, -11.01416015625, -10.098876953125, -9.18359375, -8.268310546875, -7.35302734375, -6.437744140625, -5.5224609375, -4.607177734375, -3.69189453125, -2.776611328125, -1.861328125, -0.946044921875, -0.03076171875, 0.884521484375, 1.7998046875, 2.715087890625, 3.63037109375, 4.545654296875, 5.4609375, 6.376220703125, 7.29150390625, 8.206787109375, 9.1220703125, 10.037353515625, 10.95263671875, 11.867919921875, 12.783203125, 13.698486328125, 14.61376953125, 15.529052734375, 16.4443359375, 17.359619140625, 18.27490234375, 19.190185546875, 20.10546875, 21.020751953125, 21.93603515625, 22.851318359375, 23.7666015625, 24.681884765625, 25.59716796875, 26.512451171875, 27.427734375, 28.343017578125, 29.25830078125, 30.173583984375, 31.0888671875, 32.004150390625, 32.91943359375, 33.834716796875, 34.75]}, "gradients/decoder.bert.encoder.layer.4.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 2.0, 1.0, 7.0, 9.0, 10.0, 12.0, 6.0, 12.0, 21.0, 19.0, 18.0, 23.0, 30.0, 24.0, 30.0, 23.0, 36.0, 47.0, 37.0, 27.0, 41.0, 45.0, 43.0, 41.0, 39.0, 25.0, 33.0, 27.0, 26.0, 43.0, 21.0, 29.0, 41.0, 24.0, 13.0, 13.0, 16.0, 11.0, 10.0, 7.0, 10.0, 7.0, 7.0, 4.0, 8.0, 7.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 3.0], "bins": [-8.546875, -8.2864990234375, -8.026123046875, -7.7657470703125, -7.50537109375, -7.2449951171875, -6.984619140625, -6.7242431640625, -6.4638671875, -6.2034912109375, -5.943115234375, -5.6827392578125, -5.42236328125, -5.1619873046875, -4.901611328125, -4.6412353515625, -4.380859375, -4.1204833984375, -3.860107421875, -3.5997314453125, -3.33935546875, -3.0789794921875, -2.818603515625, -2.5582275390625, -2.2978515625, -2.0374755859375, -1.777099609375, -1.5167236328125, -1.25634765625, -0.9959716796875, -0.735595703125, -0.4752197265625, -0.21484375, 0.0455322265625, 0.305908203125, 0.5662841796875, 0.82666015625, 1.0870361328125, 1.347412109375, 1.6077880859375, 1.8681640625, 2.1285400390625, 2.388916015625, 2.6492919921875, 2.90966796875, 3.1700439453125, 3.430419921875, 3.6907958984375, 3.951171875, 4.2115478515625, 4.471923828125, 4.7322998046875, 4.99267578125, 5.2530517578125, 5.513427734375, 5.7738037109375, 6.0341796875, 6.2945556640625, 6.554931640625, 6.8153076171875, 7.07568359375, 7.3360595703125, 7.596435546875, 7.8568115234375, 8.1171875]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 6.0, 9.0, 19.0, 20.0, 41.0, 54.0, 81.0, 120.0, 192.0, 262.0, 415.0, 621.0, 940.0, 1511.0, 2455.0, 3966.0, 6461.0, 11046.0, 19797.0, 37157.0, 76500.0, 172742.0, 427564.0, 1036005.0, 1302501.0, 628555.0, 248436.0, 105454.0, 49958.0, 26005.0, 14232.0, 8156.0, 4864.0, 2877.0, 1896.0, 1160.0, 765.0, 479.0, 317.0, 214.0, 143.0, 96.0, 54.0, 48.0, 34.0, 13.0, 19.0, 8.0, 12.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-30.140625, -29.1748046875, -28.208984375, -27.2431640625, -26.27734375, -25.3115234375, -24.345703125, -23.3798828125, -22.4140625, -21.4482421875, -20.482421875, -19.5166015625, -18.55078125, -17.5849609375, -16.619140625, -15.6533203125, -14.6875, -13.7216796875, -12.755859375, -11.7900390625, -10.82421875, -9.8583984375, -8.892578125, -7.9267578125, -6.9609375, -5.9951171875, -5.029296875, -4.0634765625, -3.09765625, -2.1318359375, -1.166015625, -0.2001953125, 0.765625, 1.7314453125, 2.697265625, 3.6630859375, 4.62890625, 5.5947265625, 6.560546875, 7.5263671875, 8.4921875, 9.4580078125, 10.423828125, 11.3896484375, 12.35546875, 13.3212890625, 14.287109375, 15.2529296875, 16.21875, 17.1845703125, 18.150390625, 19.1162109375, 20.08203125, 21.0478515625, 22.013671875, 22.9794921875, 23.9453125, 24.9111328125, 25.876953125, 26.8427734375, 27.80859375, 28.7744140625, 29.740234375, 30.7060546875, 31.671875]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 5.0, 12.0, 15.0, 16.0, 34.0, 27.0, 39.0, 45.0, 55.0, 95.0, 109.0, 172.0, 178.0, 230.0, 244.0, 305.0, 340.0, 351.0, 350.0, 293.0, 244.0, 198.0, 136.0, 132.0, 104.0, 71.0, 55.0, 40.0, 40.0, 27.0, 19.0, 18.0, 17.0, 14.0, 10.0, 7.0, 9.0, 4.0, 2.0, 3.0, 6.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.171875, -6.9295654296875, -6.687255859375, -6.4449462890625, -6.20263671875, -5.9603271484375, -5.718017578125, -5.4757080078125, -5.2333984375, -4.9910888671875, -4.748779296875, -4.5064697265625, -4.26416015625, -4.0218505859375, -3.779541015625, -3.5372314453125, -3.294921875, -3.0526123046875, -2.810302734375, -2.5679931640625, -2.32568359375, -2.0833740234375, -1.841064453125, -1.5987548828125, -1.3564453125, -1.1141357421875, -0.871826171875, -0.6295166015625, -0.38720703125, -0.1448974609375, 0.097412109375, 0.3397216796875, 0.58203125, 0.8243408203125, 1.066650390625, 1.3089599609375, 1.55126953125, 1.7935791015625, 2.035888671875, 2.2781982421875, 2.5205078125, 2.7628173828125, 3.005126953125, 3.2474365234375, 3.48974609375, 3.7320556640625, 3.974365234375, 4.2166748046875, 4.458984375, 4.7012939453125, 4.943603515625, 5.1859130859375, 5.42822265625, 5.6705322265625, 5.912841796875, 6.1551513671875, 6.3974609375, 6.6397705078125, 6.882080078125, 7.1243896484375, 7.36669921875, 7.6090087890625, 7.851318359375, 8.0936279296875, 8.3359375]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 1.0, 3.0, 2.0, 9.0, 4.0, 7.0, 15.0, 15.0, 21.0, 22.0, 30.0, 34.0, 46.0, 49.0, 64.0, 63.0, 61.0, 70.0, 71.0, 57.0, 56.0, 47.0, 39.0, 39.0, 32.0, 33.0, 19.0, 16.0, 15.0, 14.0, 13.0, 5.0, 3.0, 5.0, 8.0, 0.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-25.447826385498047, -24.647003173828125, -23.846179962158203, -23.04535675048828, -22.24453353881836, -21.443710327148438, -20.642887115478516, -19.842063903808594, -19.041240692138672, -18.24041748046875, -17.439594268798828, -16.638771057128906, -15.837947845458984, -15.037124633789062, -14.23630142211914, -13.435478210449219, -12.634654998779297, -11.833831787109375, -11.033008575439453, -10.232185363769531, -9.43136215209961, -8.630538940429688, -7.829715728759766, -7.028892517089844, -6.228069305419922, -5.42724609375, -4.626422882080078, -3.8255996704101562, -3.0247764587402344, -2.2239532470703125, -1.4231300354003906, -0.6223068237304688, 0.17851829528808594, 0.9793415069580078, 1.7801647186279297, 2.5809879302978516, 3.3818111419677734, 4.182634353637695, 4.983457565307617, 5.784280776977539, 6.585103988647461, 7.385927200317383, 8.186750411987305, 8.987573623657227, 9.788396835327148, 10.58922004699707, 11.390043258666992, 12.190866470336914, 12.991689682006836, 13.792512893676758, 14.59333610534668, 15.394159317016602, 16.194982528686523, 16.995805740356445, 17.796628952026367, 18.59745216369629, 19.39827537536621, 20.199098587036133, 20.999921798706055, 21.800745010375977, 22.6015682220459, 23.40239143371582, 24.203214645385742, 25.004037857055664, 25.804861068725586]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 5.0, 6.0, 7.0, 8.0, 12.0, 9.0, 7.0, 10.0, 15.0, 15.0, 13.0, 31.0, 16.0, 25.0, 33.0, 21.0, 22.0, 36.0, 32.0, 36.0, 40.0, 33.0, 36.0, 52.0, 37.0, 38.0, 36.0, 36.0, 34.0, 29.0, 31.0, 32.0, 28.0, 19.0, 15.0, 31.0, 13.0, 24.0, 19.0, 7.0, 7.0, 12.0, 7.0, 7.0, 4.0, 5.0, 7.0, 2.0, 3.0, 0.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-10.708602905273438, -10.358699798583984, -10.008796691894531, -9.658893585205078, -9.308990478515625, -8.959087371826172, -8.609184265136719, -8.25928020477295, -7.909377098083496, -7.559473991394043, -7.20957088470459, -6.859667778015137, -6.509764194488525, -6.159861087799072, -5.809957981109619, -5.460054397583008, -5.110151767730713, -4.76024866104126, -4.410345554351807, -4.060441970825195, -3.710538864135742, -3.360635757446289, -3.010732650756836, -2.6608293056488037, -2.3109261989593506, -1.961022973060608, -1.6111197471618652, -1.261216640472412, -0.9113134145736694, -0.5614101886749268, -0.21150708198547363, 0.1383962631225586, 0.4882993698120117, 0.8382025957107544, 1.188105821609497, 1.5380089282989502, 1.8879121541976929, 2.2378153800964355, 2.5877184867858887, 2.937621831893921, 3.287524938583374, 3.637428045272827, 3.9873313903808594, 4.3372344970703125, 4.687137603759766, 5.037040710449219, 5.386943817138672, 5.736847400665283, 6.086750507354736, 6.4366536140441895, 6.786556720733643, 7.136460304260254, 7.486363410949707, 7.83626651763916, 8.186169624328613, 8.536072731018066, 8.88597583770752, 9.235878944396973, 9.585782051086426, 9.935685157775879, 10.285588264465332, 10.635492324829102, 10.985395431518555, 11.335298538208008, 11.685201644897461]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 3.0, 6.0, 11.0, 8.0, 19.0, 28.0, 52.0, 80.0, 104.0, 171.0, 273.0, 390.0, 592.0, 1022.0, 1614.0, 2505.0, 4082.0, 6533.0, 10528.0, 16583.0, 26884.0, 43193.0, 68205.0, 103074.0, 143221.0, 165996.0, 148239.0, 109478.0, 72930.0, 46417.0, 28922.0, 17791.0, 10988.0, 6894.0, 4383.0, 2710.0, 1752.0, 1004.0, 670.0, 416.0, 269.0, 175.0, 127.0, 82.0, 53.0, 25.0, 17.0, 19.0, 7.0, 11.0, 5.0, 1.0, 1.0, 1.0, 3.0], "bins": [-9.265625, -8.99761962890625, -8.7296142578125, -8.46160888671875, -8.193603515625, -7.92559814453125, -7.6575927734375, -7.38958740234375, -7.12158203125, -6.85357666015625, -6.5855712890625, -6.31756591796875, -6.049560546875, -5.78155517578125, -5.5135498046875, -5.24554443359375, -4.9775390625, -4.70953369140625, -4.4415283203125, -4.17352294921875, -3.905517578125, -3.63751220703125, -3.3695068359375, -3.10150146484375, -2.83349609375, -2.56549072265625, -2.2974853515625, -2.02947998046875, -1.761474609375, -1.49346923828125, -1.2254638671875, -0.95745849609375, -0.689453125, -0.42144775390625, -0.1534423828125, 0.11456298828125, 0.382568359375, 0.65057373046875, 0.9185791015625, 1.18658447265625, 1.45458984375, 1.72259521484375, 1.9906005859375, 2.25860595703125, 2.526611328125, 2.79461669921875, 3.0626220703125, 3.33062744140625, 3.5986328125, 3.86663818359375, 4.1346435546875, 4.40264892578125, 4.670654296875, 4.93865966796875, 5.2066650390625, 5.47467041015625, 5.74267578125, 6.01068115234375, 6.2786865234375, 6.54669189453125, 6.814697265625, 7.08270263671875, 7.3507080078125, 7.61871337890625, 7.88671875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 7.0, 1.0, 2.0, 8.0, 11.0, 9.0, 15.0, 16.0, 15.0, 21.0, 19.0, 26.0, 31.0, 15.0, 27.0, 29.0, 34.0, 48.0, 46.0, 45.0, 38.0, 51.0, 32.0, 43.0, 39.0, 42.0, 41.0, 37.0, 37.0, 24.0, 28.0, 32.0, 29.0, 23.0, 10.0, 11.0, 11.0, 11.0, 9.0, 15.0, 7.0, 6.0, 2.0, 2.0, 0.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.53125, -14.0760498046875, -13.620849609375, -13.1656494140625, -12.71044921875, -12.2552490234375, -11.800048828125, -11.3448486328125, -10.8896484375, -10.4344482421875, -9.979248046875, -9.5240478515625, -9.06884765625, -8.6136474609375, -8.158447265625, -7.7032470703125, -7.248046875, -6.7928466796875, -6.337646484375, -5.8824462890625, -5.42724609375, -4.9720458984375, -4.516845703125, -4.0616455078125, -3.6064453125, -3.1512451171875, -2.696044921875, -2.2408447265625, -1.78564453125, -1.3304443359375, -0.875244140625, -0.4200439453125, 0.03515625, 0.4903564453125, 0.945556640625, 1.4007568359375, 1.85595703125, 2.3111572265625, 2.766357421875, 3.2215576171875, 3.6767578125, 4.1319580078125, 4.587158203125, 5.0423583984375, 5.49755859375, 5.9527587890625, 6.407958984375, 6.8631591796875, 7.318359375, 7.7735595703125, 8.228759765625, 8.6839599609375, 9.13916015625, 9.5943603515625, 10.049560546875, 10.5047607421875, 10.9599609375, 11.4151611328125, 11.870361328125, 12.3255615234375, 12.78076171875, 13.2359619140625, 13.691162109375, 14.1463623046875, 14.6015625]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 8.0, 8.0, 10.0, 15.0, 13.0, 38.0, 39.0, 78.0, 100.0, 150.0, 176.0, 262.0, 360.0, 493.0, 795.0, 1075.0, 1569.0, 2320.0, 3388.0, 5233.0, 7959.0, 12989.0, 20994.0, 34490.0, 56805.0, 91906.0, 142709.0, 186567.0, 169408.0, 116961.0, 73402.0, 44425.0, 27172.0, 16558.0, 10325.0, 6603.0, 4131.0, 2884.0, 1855.0, 1237.0, 866.0, 641.0, 438.0, 307.0, 227.0, 175.0, 124.0, 94.0, 64.0, 42.0, 25.0, 22.0, 14.0, 7.0, 6.0, 2.0, 4.0, 1.0], "bins": [-10.9453125, -10.62109375, -10.296875, -9.97265625, -9.6484375, -9.32421875, -9.0, -8.67578125, -8.3515625, -8.02734375, -7.703125, -7.37890625, -7.0546875, -6.73046875, -6.40625, -6.08203125, -5.7578125, -5.43359375, -5.109375, -4.78515625, -4.4609375, -4.13671875, -3.8125, -3.48828125, -3.1640625, -2.83984375, -2.515625, -2.19140625, -1.8671875, -1.54296875, -1.21875, -0.89453125, -0.5703125, -0.24609375, 0.078125, 0.40234375, 0.7265625, 1.05078125, 1.375, 1.69921875, 2.0234375, 2.34765625, 2.671875, 2.99609375, 3.3203125, 3.64453125, 3.96875, 4.29296875, 4.6171875, 4.94140625, 5.265625, 5.58984375, 5.9140625, 6.23828125, 6.5625, 6.88671875, 7.2109375, 7.53515625, 7.859375, 8.18359375, 8.5078125, 8.83203125, 9.15625, 9.48046875, 9.8046875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 0.0, 2.0, 2.0, 5.0, 6.0, 10.0, 4.0, 9.0, 9.0, 7.0, 14.0, 8.0, 11.0, 24.0, 15.0, 14.0, 25.0, 27.0, 37.0, 31.0, 25.0, 30.0, 41.0, 35.0, 37.0, 30.0, 36.0, 25.0, 31.0, 43.0, 39.0, 31.0, 39.0, 26.0, 22.0, 29.0, 29.0, 35.0, 25.0, 22.0, 15.0, 19.0, 17.0, 15.0, 14.0, 10.0, 3.0, 9.0, 6.0, 3.0, 3.0, 3.0, 4.0, 1.0, 0.0, 2.0, 2.0], "bins": [-8.140625, -7.90020751953125, -7.6597900390625, -7.41937255859375, -7.178955078125, -6.93853759765625, -6.6981201171875, -6.45770263671875, -6.21728515625, -5.97686767578125, -5.7364501953125, -5.49603271484375, -5.255615234375, -5.01519775390625, -4.7747802734375, -4.53436279296875, -4.2939453125, -4.05352783203125, -3.8131103515625, -3.57269287109375, -3.332275390625, -3.09185791015625, -2.8514404296875, -2.61102294921875, -2.37060546875, -2.13018798828125, -1.8897705078125, -1.64935302734375, -1.408935546875, -1.16851806640625, -0.9281005859375, -0.68768310546875, -0.447265625, -0.20684814453125, 0.0335693359375, 0.27398681640625, 0.514404296875, 0.75482177734375, 0.9952392578125, 1.23565673828125, 1.47607421875, 1.71649169921875, 1.9569091796875, 2.19732666015625, 2.437744140625, 2.67816162109375, 2.9185791015625, 3.15899658203125, 3.3994140625, 3.63983154296875, 3.8802490234375, 4.12066650390625, 4.361083984375, 4.60150146484375, 4.8419189453125, 5.08233642578125, 5.32275390625, 5.56317138671875, 5.8035888671875, 6.04400634765625, 6.284423828125, 6.52484130859375, 6.7652587890625, 7.00567626953125, 7.24609375]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 4.0, 0.0, 6.0, 8.0, 10.0, 12.0, 21.0, 39.0, 39.0, 88.0, 125.0, 246.0, 420.0, 767.0, 1490.0, 2730.0, 5229.0, 10250.0, 21736.0, 48052.0, 110235.0, 240599.0, 307740.0, 164736.0, 72136.0, 31741.0, 14937.0, 7176.0, 3607.0, 1976.0, 1019.0, 611.0, 308.0, 181.0, 115.0, 73.0, 44.0, 25.0, 11.0, 8.0, 5.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.234375, -5.049072265625, -4.86376953125, -4.678466796875, -4.4931640625, -4.307861328125, -4.12255859375, -3.937255859375, -3.751953125, -3.566650390625, -3.38134765625, -3.196044921875, -3.0107421875, -2.825439453125, -2.64013671875, -2.454833984375, -2.26953125, -2.084228515625, -1.89892578125, -1.713623046875, -1.5283203125, -1.343017578125, -1.15771484375, -0.972412109375, -0.787109375, -0.601806640625, -0.41650390625, -0.231201171875, -0.0458984375, 0.139404296875, 0.32470703125, 0.510009765625, 0.6953125, 0.880615234375, 1.06591796875, 1.251220703125, 1.4365234375, 1.621826171875, 1.80712890625, 1.992431640625, 2.177734375, 2.363037109375, 2.54833984375, 2.733642578125, 2.9189453125, 3.104248046875, 3.28955078125, 3.474853515625, 3.66015625, 3.845458984375, 4.03076171875, 4.216064453125, 4.4013671875, 4.586669921875, 4.77197265625, 4.957275390625, 5.142578125, 5.327880859375, 5.51318359375, 5.698486328125, 5.8837890625, 6.069091796875, 6.25439453125, 6.439697265625, 6.625]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 4.0, 1.0, 0.0, 3.0, 10.0, 1.0, 7.0, 7.0, 12.0, 17.0, 13.0, 18.0, 16.0, 24.0, 21.0, 31.0, 52.0, 30.0, 46.0, 49.0, 62.0, 43.0, 50.0, 58.0, 47.0, 57.0, 47.0, 40.0, 35.0, 38.0, 28.0, 34.0, 20.0, 16.0, 21.0, 13.0, 4.0, 3.0, 10.0, 5.0, 5.0, 4.0, 2.0, 1.0, 2.0, 7.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00022029876708984375, -0.00021200254559516907, -0.00020370632410049438, -0.0001954101026058197, -0.00018711388111114502, -0.00017881765961647034, -0.00017052143812179565, -0.00016222521662712097, -0.0001539289951324463, -0.0001456327736377716, -0.00013733655214309692, -0.00012904033064842224, -0.00012074410915374756, -0.00011244788765907288, -0.0001041516661643982, -9.585544466972351e-05, -8.755922317504883e-05, -7.926300168037415e-05, -7.096678018569946e-05, -6.267055869102478e-05, -5.43743371963501e-05, -4.6078115701675415e-05, -3.778189420700073e-05, -2.948567271232605e-05, -2.1189451217651367e-05, -1.2893229722976685e-05, -4.597008228302002e-06, 3.6992132663726807e-06, 1.1995434761047363e-05, 2.0291656255722046e-05, 2.858787775039673e-05, 3.688409924507141e-05, 4.5180320739746094e-05, 5.3476542234420776e-05, 6.177276372909546e-05, 7.006898522377014e-05, 7.836520671844482e-05, 8.666142821311951e-05, 9.495764970779419e-05, 0.00010325387120246887, 0.00011155009269714355, 0.00011984631419181824, 0.00012814253568649292, 0.0001364387571811676, 0.00014473497867584229, 0.00015303120017051697, 0.00016132742166519165, 0.00016962364315986633, 0.00017791986465454102, 0.0001862160861492157, 0.00019451230764389038, 0.00020280852913856506, 0.00021110475063323975, 0.00021940097212791443, 0.0002276971936225891, 0.0002359934151172638, 0.0002442896366119385, 0.00025258585810661316, 0.00026088207960128784, 0.0002691783010959625, 0.0002774745225906372, 0.0002857707440853119, 0.00029406696557998657, 0.00030236318707466125, 0.00031065940856933594]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 5.0, 5.0, 11.0, 10.0, 23.0, 48.0, 72.0, 110.0, 135.0, 227.0, 333.0, 472.0, 751.0, 1168.0, 1811.0, 2839.0, 4731.0, 7748.0, 13070.0, 21623.0, 36817.0, 62274.0, 101260.0, 151602.0, 182473.0, 163745.0, 115738.0, 72532.0, 42676.0, 25442.0, 15042.0, 9008.0, 5477.0, 3396.0, 2054.0, 1336.0, 898.0, 544.0, 371.0, 227.0, 132.0, 104.0, 82.0, 49.0, 35.0, 18.0, 16.0, 8.0, 10.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.02734375, -3.90008544921875, -3.7728271484375, -3.64556884765625, -3.518310546875, -3.39105224609375, -3.2637939453125, -3.13653564453125, -3.00927734375, -2.88201904296875, -2.7547607421875, -2.62750244140625, -2.500244140625, -2.37298583984375, -2.2457275390625, -2.11846923828125, -1.9912109375, -1.86395263671875, -1.7366943359375, -1.60943603515625, -1.482177734375, -1.35491943359375, -1.2276611328125, -1.10040283203125, -0.97314453125, -0.84588623046875, -0.7186279296875, -0.59136962890625, -0.464111328125, -0.33685302734375, -0.2095947265625, -0.08233642578125, 0.044921875, 0.17218017578125, 0.2994384765625, 0.42669677734375, 0.553955078125, 0.68121337890625, 0.8084716796875, 0.93572998046875, 1.06298828125, 1.19024658203125, 1.3175048828125, 1.44476318359375, 1.572021484375, 1.69927978515625, 1.8265380859375, 1.95379638671875, 2.0810546875, 2.20831298828125, 2.3355712890625, 2.46282958984375, 2.590087890625, 2.71734619140625, 2.8446044921875, 2.97186279296875, 3.09912109375, 3.22637939453125, 3.3536376953125, 3.48089599609375, 3.608154296875, 3.73541259765625, 3.8626708984375, 3.98992919921875, 4.1171875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 3.0, 7.0, 2.0, 6.0, 1.0, 7.0, 10.0, 15.0, 25.0, 24.0, 24.0, 31.0, 29.0, 41.0, 47.0, 57.0, 62.0, 65.0, 54.0, 58.0, 56.0, 38.0, 47.0, 57.0, 52.0, 35.0, 24.0, 30.0, 22.0, 25.0, 12.0, 6.0, 9.0, 6.0, 7.0, 6.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2919921875, -1.2513885498046875, -1.210784912109375, -1.1701812744140625, -1.12957763671875, -1.0889739990234375, -1.048370361328125, -1.0077667236328125, -0.9671630859375, -0.9265594482421875, -0.885955810546875, -0.8453521728515625, -0.80474853515625, -0.7641448974609375, -0.723541259765625, -0.6829376220703125, -0.642333984375, -0.6017303466796875, -0.561126708984375, -0.5205230712890625, -0.47991943359375, -0.4393157958984375, -0.398712158203125, -0.3581085205078125, -0.3175048828125, -0.2769012451171875, -0.236297607421875, -0.1956939697265625, -0.15509033203125, -0.1144866943359375, -0.073883056640625, -0.0332794189453125, 0.00732421875, 0.0479278564453125, 0.088531494140625, 0.1291351318359375, 0.16973876953125, 0.2103424072265625, 0.250946044921875, 0.2915496826171875, 0.3321533203125, 0.3727569580078125, 0.413360595703125, 0.4539642333984375, 0.49456787109375, 0.5351715087890625, 0.575775146484375, 0.6163787841796875, 0.656982421875, 0.6975860595703125, 0.738189697265625, 0.7787933349609375, 0.81939697265625, 0.8600006103515625, 0.900604248046875, 0.9412078857421875, 0.9818115234375, 1.0224151611328125, 1.063018798828125, 1.1036224365234375, 1.14422607421875, 1.1848297119140625, 1.225433349609375, 1.2660369873046875, 1.306640625]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 3.0, 7.0, 7.0, 7.0, 17.0, 18.0, 27.0, 24.0, 37.0, 37.0, 44.0, 64.0, 64.0, 56.0, 75.0, 80.0, 69.0, 51.0, 50.0, 41.0, 40.0, 31.0, 33.0, 24.0, 19.0, 11.0, 13.0, 10.0, 9.0, 4.0, 5.0, 4.0, 3.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.555706024169922, -24.733627319335938, -23.911548614501953, -23.08946990966797, -22.267393112182617, -21.445314407348633, -20.62323570251465, -19.801156997680664, -18.979080200195312, -18.157001495361328, -17.334922790527344, -16.51284408569336, -15.690767288208008, -14.868688583374023, -14.046609878540039, -13.224531173706055, -12.40245246887207, -11.580373764038086, -10.758296012878418, -9.936217308044434, -9.114139556884766, -8.292060852050781, -7.469982147216797, -6.647903919219971, -5.8258256912231445, -5.003747463226318, -4.181669235229492, -3.359590530395508, -2.5375123023986816, -1.7154340744018555, -0.8933553695678711, -0.07127714157104492, 0.7508029937744141, 1.5728813409805298, 2.3949596881866455, 3.217038154602051, 4.039116382598877, 4.861194610595703, 5.6832733154296875, 6.505351543426514, 7.32742977142334, 8.149508476257324, 8.971586227416992, 9.793664932250977, 10.615743637084961, 11.437821388244629, 12.259900093078613, 13.081977844238281, 13.904056549072266, 14.72613525390625, 15.548213005065918, 16.37029266357422, 17.19236946105957, 18.014448165893555, 18.83652687072754, 19.658605575561523, 20.480682373046875, 21.30276107788086, 22.124839782714844, 22.946918487548828, 23.76899528503418, 24.591073989868164, 25.41315269470215, 26.235231399536133, 27.057310104370117]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 5.0, 6.0, 8.0, 7.0, 6.0, 12.0, 8.0, 5.0, 15.0, 22.0, 11.0, 23.0, 24.0, 22.0, 30.0, 25.0, 25.0, 32.0, 30.0, 36.0, 39.0, 37.0, 42.0, 45.0, 44.0, 38.0, 44.0, 30.0, 33.0, 28.0, 37.0, 29.0, 33.0, 15.0, 22.0, 26.0, 18.0, 20.0, 15.0, 9.0, 11.0, 8.0, 6.0, 4.0, 7.0, 6.0, 4.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.9366455078125, -10.581901550292969, -10.227157592773438, -9.872413635253906, -9.517669677734375, -9.162925720214844, -8.808181762695312, -8.453437805175781, -8.09869384765625, -7.743949890136719, -7.3892059326171875, -7.034461975097656, -6.679718017578125, -6.324974060058594, -5.9702301025390625, -5.615486145019531, -5.260741710662842, -4.9059977531433105, -4.551253795623779, -4.196509838104248, -3.841765880584717, -3.4870219230651855, -3.132277727127075, -2.777533769607544, -2.4227898120880127, -2.0680458545684814, -1.7133018970489502, -1.3585578203201294, -1.0038138628005981, -0.6490699052810669, -0.2943258285522461, 0.060418128967285156, 0.4151620864868164, 0.7699060440063477, 1.124650001525879, 1.4793940782546997, 1.834138035774231, 2.1888818740844727, 2.543626070022583, 2.8983700275421143, 3.2531139850616455, 3.6078579425811768, 3.962601900100708, 4.317346096038818, 4.67209005355835, 5.026834011077881, 5.381577968597412, 5.736321926116943, 6.091065883636475, 6.445809841156006, 6.800553798675537, 7.155297756195068, 7.5100417137146, 7.864785671234131, 8.21953010559082, 8.574274063110352, 8.929018020629883, 9.283761978149414, 9.638505935668945, 9.993249893188477, 10.347993850708008, 10.702737808227539, 11.05748176574707, 11.412225723266602, 11.766969680786133]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 1.0, 2.0, 6.0, 10.0, 7.0, 20.0, 34.0, 49.0, 84.0, 138.0, 231.0, 449.0, 802.0, 1488.0, 2742.0, 5180.0, 9959.0, 19488.0, 37824.0, 72366.0, 129224.0, 194359.0, 212137.0, 159983.0, 95271.0, 51515.0, 26454.0, 13637.0, 7094.0, 3668.0, 1859.0, 1100.0, 599.0, 328.0, 173.0, 107.0, 76.0, 36.0, 25.0, 10.0, 11.0, 6.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.109375, -17.3916015625, -16.673828125, -15.9560546875, -15.23828125, -14.5205078125, -13.802734375, -13.0849609375, -12.3671875, -11.6494140625, -10.931640625, -10.2138671875, -9.49609375, -8.7783203125, -8.060546875, -7.3427734375, -6.625, -5.9072265625, -5.189453125, -4.4716796875, -3.75390625, -3.0361328125, -2.318359375, -1.6005859375, -0.8828125, -0.1650390625, 0.552734375, 1.2705078125, 1.98828125, 2.7060546875, 3.423828125, 4.1416015625, 4.859375, 5.5771484375, 6.294921875, 7.0126953125, 7.73046875, 8.4482421875, 9.166015625, 9.8837890625, 10.6015625, 11.3193359375, 12.037109375, 12.7548828125, 13.47265625, 14.1904296875, 14.908203125, 15.6259765625, 16.34375, 17.0615234375, 17.779296875, 18.4970703125, 19.21484375, 19.9326171875, 20.650390625, 21.3681640625, 22.0859375, 22.8037109375, 23.521484375, 24.2392578125, 24.95703125, 25.6748046875, 26.392578125, 27.1103515625, 27.828125]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 3.0, 4.0, 6.0, 4.0, 7.0, 14.0, 17.0, 9.0, 17.0, 25.0, 26.0, 32.0, 33.0, 34.0, 35.0, 47.0, 47.0, 55.0, 49.0, 52.0, 64.0, 49.0, 51.0, 41.0, 46.0, 41.0, 40.0, 29.0, 19.0, 24.0, 11.0, 22.0, 11.0, 12.0, 6.0, 8.0, 6.0, 4.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.7421875, -13.2271728515625, -12.712158203125, -12.1971435546875, -11.68212890625, -11.1671142578125, -10.652099609375, -10.1370849609375, -9.6220703125, -9.1070556640625, -8.592041015625, -8.0770263671875, -7.56201171875, -7.0469970703125, -6.531982421875, -6.0169677734375, -5.501953125, -4.9869384765625, -4.471923828125, -3.9569091796875, -3.44189453125, -2.9268798828125, -2.411865234375, -1.8968505859375, -1.3818359375, -0.8668212890625, -0.351806640625, 0.1632080078125, 0.67822265625, 1.1932373046875, 1.708251953125, 2.2232666015625, 2.73828125, 3.2532958984375, 3.768310546875, 4.2833251953125, 4.79833984375, 5.3133544921875, 5.828369140625, 6.3433837890625, 6.8583984375, 7.3734130859375, 7.888427734375, 8.4034423828125, 8.91845703125, 9.4334716796875, 9.948486328125, 10.4635009765625, 10.978515625, 11.4935302734375, 12.008544921875, 12.5235595703125, 13.03857421875, 13.5535888671875, 14.068603515625, 14.5836181640625, 15.0986328125, 15.6136474609375, 16.128662109375, 16.6436767578125, 17.15869140625, 17.6737060546875, 18.188720703125, 18.7037353515625, 19.21875]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 3.0, 6.0, 9.0, 10.0, 10.0, 16.0, 31.0, 43.0, 50.0, 81.0, 137.0, 176.0, 244.0, 431.0, 655.0, 1096.0, 1768.0, 2692.0, 4593.0, 7528.0, 12824.0, 21552.0, 36137.0, 58430.0, 91425.0, 130338.0, 159247.0, 157719.0, 127942.0, 89520.0, 56859.0, 34742.0, 20928.0, 12507.0, 7345.0, 4345.0, 2624.0, 1623.0, 1070.0, 640.0, 401.0, 257.0, 176.0, 95.0, 84.0, 49.0, 34.0, 32.0, 15.0, 12.0, 7.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.640625, -16.103271484375, -15.56591796875, -15.028564453125, -14.4912109375, -13.953857421875, -13.41650390625, -12.879150390625, -12.341796875, -11.804443359375, -11.26708984375, -10.729736328125, -10.1923828125, -9.655029296875, -9.11767578125, -8.580322265625, -8.04296875, -7.505615234375, -6.96826171875, -6.430908203125, -5.8935546875, -5.356201171875, -4.81884765625, -4.281494140625, -3.744140625, -3.206787109375, -2.66943359375, -2.132080078125, -1.5947265625, -1.057373046875, -0.52001953125, 0.017333984375, 0.5546875, 1.092041015625, 1.62939453125, 2.166748046875, 2.7041015625, 3.241455078125, 3.77880859375, 4.316162109375, 4.853515625, 5.390869140625, 5.92822265625, 6.465576171875, 7.0029296875, 7.540283203125, 8.07763671875, 8.614990234375, 9.15234375, 9.689697265625, 10.22705078125, 10.764404296875, 11.3017578125, 11.839111328125, 12.37646484375, 12.913818359375, 13.451171875, 13.988525390625, 14.52587890625, 15.063232421875, 15.6005859375, 16.137939453125, 16.67529296875, 17.212646484375, 17.75]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 7.0, 6.0, 2.0, 9.0, 9.0, 14.0, 21.0, 27.0, 18.0, 24.0, 20.0, 32.0, 35.0, 37.0, 38.0, 47.0, 40.0, 38.0, 39.0, 46.0, 50.0, 52.0, 36.0, 37.0, 39.0, 41.0, 31.0, 34.0, 31.0, 20.0, 24.0, 21.0, 19.0, 7.0, 7.0, 10.0, 7.0, 6.0, 5.0, 7.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-10.1484375, -9.869873046875, -9.59130859375, -9.312744140625, -9.0341796875, -8.755615234375, -8.47705078125, -8.198486328125, -7.919921875, -7.641357421875, -7.36279296875, -7.084228515625, -6.8056640625, -6.527099609375, -6.24853515625, -5.969970703125, -5.69140625, -5.412841796875, -5.13427734375, -4.855712890625, -4.5771484375, -4.298583984375, -4.02001953125, -3.741455078125, -3.462890625, -3.184326171875, -2.90576171875, -2.627197265625, -2.3486328125, -2.070068359375, -1.79150390625, -1.512939453125, -1.234375, -0.955810546875, -0.67724609375, -0.398681640625, -0.1201171875, 0.158447265625, 0.43701171875, 0.715576171875, 0.994140625, 1.272705078125, 1.55126953125, 1.829833984375, 2.1083984375, 2.386962890625, 2.66552734375, 2.944091796875, 3.22265625, 3.501220703125, 3.77978515625, 4.058349609375, 4.3369140625, 4.615478515625, 4.89404296875, 5.172607421875, 5.451171875, 5.729736328125, 6.00830078125, 6.286865234375, 6.5654296875, 6.843994140625, 7.12255859375, 7.401123046875, 7.6796875]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 6.0, 2.0, 5.0, 3.0, 6.0, 9.0, 20.0, 11.0, 38.0, 39.0, 53.0, 65.0, 117.0, 171.0, 248.0, 389.0, 566.0, 879.0, 1264.0, 2104.0, 3368.0, 5531.0, 9089.0, 15358.0, 26618.0, 46491.0, 80911.0, 133196.0, 187871.0, 190885.0, 138996.0, 85266.0, 49098.0, 28163.0, 16397.0, 9691.0, 5835.0, 3530.0, 2208.0, 1387.0, 889.0, 598.0, 384.0, 242.0, 168.0, 129.0, 80.0, 59.0, 39.0, 34.0, 17.0, 22.0, 8.0, 6.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0], "bins": [-9.8828125, -9.574462890625, -9.26611328125, -8.957763671875, -8.6494140625, -8.341064453125, -8.03271484375, -7.724365234375, -7.416015625, -7.107666015625, -6.79931640625, -6.490966796875, -6.1826171875, -5.874267578125, -5.56591796875, -5.257568359375, -4.94921875, -4.640869140625, -4.33251953125, -4.024169921875, -3.7158203125, -3.407470703125, -3.09912109375, -2.790771484375, -2.482421875, -2.174072265625, -1.86572265625, -1.557373046875, -1.2490234375, -0.940673828125, -0.63232421875, -0.323974609375, -0.015625, 0.292724609375, 0.60107421875, 0.909423828125, 1.2177734375, 1.526123046875, 1.83447265625, 2.142822265625, 2.451171875, 2.759521484375, 3.06787109375, 3.376220703125, 3.6845703125, 3.992919921875, 4.30126953125, 4.609619140625, 4.91796875, 5.226318359375, 5.53466796875, 5.843017578125, 6.1513671875, 6.459716796875, 6.76806640625, 7.076416015625, 7.384765625, 7.693115234375, 8.00146484375, 8.309814453125, 8.6181640625, 8.926513671875, 9.23486328125, 9.543212890625, 9.8515625]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 5.0, 12.0, 5.0, 7.0, 14.0, 16.0, 24.0, 24.0, 36.0, 39.0, 52.0, 63.0, 66.0, 72.0, 67.0, 78.0, 75.0, 72.0, 51.0, 44.0, 40.0, 24.0, 26.0, 22.0, 14.0, 13.0, 7.0, 7.0, 8.0, 4.0, 7.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010194778442382812, -0.0009839534759521484, -0.0009484291076660156, -0.0009129047393798828, -0.00087738037109375, -0.0008418560028076172, -0.0008063316345214844, -0.0007708072662353516, -0.0007352828979492188, -0.0006997585296630859, -0.0006642341613769531, -0.0006287097930908203, -0.0005931854248046875, -0.0005576610565185547, -0.0005221366882324219, -0.00048661231994628906, -0.00045108795166015625, -0.00041556358337402344, -0.0003800392150878906, -0.0003445148468017578, -0.000308990478515625, -0.0002734661102294922, -0.00023794174194335938, -0.00020241737365722656, -0.00016689300537109375, -0.00013136863708496094, -9.584426879882812e-05, -6.031990051269531e-05, -2.47955322265625e-05, 1.0728836059570312e-05, 4.6253204345703125e-05, 8.177757263183594e-05, 0.00011730194091796875, 0.00015282630920410156, 0.00018835067749023438, 0.0002238750457763672, 0.0002593994140625, 0.0002949237823486328, 0.0003304481506347656, 0.00036597251892089844, 0.00040149688720703125, 0.00043702125549316406, 0.0004725456237792969, 0.0005080699920654297, 0.0005435943603515625, 0.0005791187286376953, 0.0006146430969238281, 0.0006501674652099609, 0.0006856918334960938, 0.0007212162017822266, 0.0007567405700683594, 0.0007922649383544922, 0.000827789306640625, 0.0008633136749267578, 0.0008988380432128906, 0.0009343624114990234, 0.0009698867797851562, 0.001005411148071289, 0.0010409355163574219, 0.0010764598846435547, 0.0011119842529296875, 0.0011475086212158203, 0.0011830329895019531, 0.001218557357788086, 0.0012540817260742188]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 4.0, 12.0, 10.0, 12.0, 14.0, 21.0, 43.0, 41.0, 86.0, 111.0, 134.0, 188.0, 225.0, 366.0, 493.0, 742.0, 1049.0, 1493.0, 2277.0, 3376.0, 5444.0, 8563.0, 14185.0, 23690.0, 41421.0, 73108.0, 120616.0, 174719.0, 191127.0, 150579.0, 96073.0, 56547.0, 32069.0, 18698.0, 11016.0, 6800.0, 4271.0, 2850.0, 1843.0, 1211.0, 889.0, 637.0, 443.0, 310.0, 204.0, 162.0, 105.0, 67.0, 68.0, 52.0, 29.0, 28.0, 13.0, 8.0, 12.0, 5.0, 2.0, 1.0, 3.0, 3.0], "bins": [-9.96875, -9.6597900390625, -9.350830078125, -9.0418701171875, -8.73291015625, -8.4239501953125, -8.114990234375, -7.8060302734375, -7.4970703125, -7.1881103515625, -6.879150390625, -6.5701904296875, -6.26123046875, -5.9522705078125, -5.643310546875, -5.3343505859375, -5.025390625, -4.7164306640625, -4.407470703125, -4.0985107421875, -3.78955078125, -3.4805908203125, -3.171630859375, -2.8626708984375, -2.5537109375, -2.2447509765625, -1.935791015625, -1.6268310546875, -1.31787109375, -1.0089111328125, -0.699951171875, -0.3909912109375, -0.08203125, 0.2269287109375, 0.535888671875, 0.8448486328125, 1.15380859375, 1.4627685546875, 1.771728515625, 2.0806884765625, 2.3896484375, 2.6986083984375, 3.007568359375, 3.3165283203125, 3.62548828125, 3.9344482421875, 4.243408203125, 4.5523681640625, 4.861328125, 5.1702880859375, 5.479248046875, 5.7882080078125, 6.09716796875, 6.4061279296875, 6.715087890625, 7.0240478515625, 7.3330078125, 7.6419677734375, 7.950927734375, 8.2598876953125, 8.56884765625, 8.8778076171875, 9.186767578125, 9.4957275390625, 9.8046875]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 4.0, 3.0, 4.0, 3.0, 2.0, 6.0, 5.0, 11.0, 20.0, 20.0, 18.0, 47.0, 32.0, 40.0, 50.0, 43.0, 58.0, 60.0, 60.0, 65.0, 55.0, 55.0, 54.0, 42.0, 43.0, 38.0, 30.0, 24.0, 19.0, 22.0, 18.0, 9.0, 12.0, 7.0, 4.0, 5.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.982421875, -2.89495849609375, -2.8074951171875, -2.72003173828125, -2.632568359375, -2.54510498046875, -2.4576416015625, -2.37017822265625, -2.28271484375, -2.19525146484375, -2.1077880859375, -2.02032470703125, -1.932861328125, -1.84539794921875, -1.7579345703125, -1.67047119140625, -1.5830078125, -1.49554443359375, -1.4080810546875, -1.32061767578125, -1.233154296875, -1.14569091796875, -1.0582275390625, -0.97076416015625, -0.88330078125, -0.79583740234375, -0.7083740234375, -0.62091064453125, -0.533447265625, -0.44598388671875, -0.3585205078125, -0.27105712890625, -0.18359375, -0.09613037109375, -0.0086669921875, 0.07879638671875, 0.166259765625, 0.25372314453125, 0.3411865234375, 0.42864990234375, 0.51611328125, 0.60357666015625, 0.6910400390625, 0.77850341796875, 0.865966796875, 0.95343017578125, 1.0408935546875, 1.12835693359375, 1.2158203125, 1.30328369140625, 1.3907470703125, 1.47821044921875, 1.565673828125, 1.65313720703125, 1.7406005859375, 1.82806396484375, 1.91552734375, 2.00299072265625, 2.0904541015625, 2.17791748046875, 2.265380859375, 2.35284423828125, 2.4403076171875, 2.52777099609375, 2.615234375]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 2.0, 4.0, 2.0, 7.0, 7.0, 9.0, 14.0, 15.0, 17.0, 29.0, 28.0, 39.0, 46.0, 43.0, 55.0, 69.0, 62.0, 69.0, 61.0, 49.0, 56.0, 63.0, 42.0, 42.0, 36.0, 30.0, 19.0, 14.0, 14.0, 11.0, 7.0, 10.0, 13.0, 5.0, 1.0, 2.0, 5.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-26.586084365844727, -25.78007698059082, -24.97406768798828, -24.168060302734375, -23.362051010131836, -22.55604362487793, -21.75003433227539, -20.944026947021484, -20.138019561767578, -19.332012176513672, -18.526002883911133, -17.719995498657227, -16.913986206054688, -16.10797882080078, -15.301970481872559, -14.495962142944336, -13.689952850341797, -12.883944511413574, -12.077936172485352, -11.271928787231445, -10.465919494628906, -9.659912109375, -8.853903770446777, -8.047895431518555, -7.241887092590332, -6.435878753662109, -5.629870414733887, -4.823862552642822, -4.0178542137146, -3.211845874786377, -2.4058380126953125, -1.5998296737670898, -0.7938213348388672, 0.012186884880065918, 0.818195104598999, 1.6242032051086426, 2.4302115440368652, 3.236219882965088, 4.042227745056152, 4.848236083984375, 5.654244422912598, 6.46025276184082, 7.266261100769043, 8.072269439697266, 8.878276824951172, 9.684286117553711, 10.490293502807617, 11.29630184173584, 12.102310180664062, 12.908318519592285, 13.714326858520508, 14.520334243774414, 15.326343536376953, 16.13235092163086, 16.938358306884766, 17.744367599487305, 18.550376892089844, 19.35638427734375, 20.16239356994629, 20.968400955200195, 21.774410247802734, 22.58041763305664, 23.386425018310547, 24.192434310913086, 24.998441696166992]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 1.0, 0.0, 2.0, 8.0, 6.0, 9.0, 4.0, 5.0, 8.0, 10.0, 11.0, 15.0, 20.0, 22.0, 25.0, 14.0, 21.0, 28.0, 27.0, 30.0, 33.0, 46.0, 36.0, 35.0, 35.0, 47.0, 42.0, 44.0, 41.0, 37.0, 22.0, 34.0, 39.0, 31.0, 24.0, 26.0, 20.0, 20.0, 20.0, 19.0, 12.0, 8.0, 18.0, 9.0, 7.0, 8.0, 7.0, 4.0, 8.0, 4.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-11.53162956237793, -11.173201560974121, -10.814773559570312, -10.456345558166504, -10.097917556762695, -9.73948860168457, -9.381060600280762, -9.022632598876953, -8.664204597473145, -8.305776596069336, -7.947348594665527, -7.5889201164245605, -7.230492115020752, -6.872064113616943, -6.513635635375977, -6.155207633972168, -5.796779632568359, -5.438351631164551, -5.079923629760742, -4.721495151519775, -4.363067150115967, -4.004639148712158, -3.6462109088897705, -3.287782669067383, -2.929354667663574, -2.5709266662597656, -2.212498426437378, -1.8540703058242798, -1.4956421852111816, -1.1372140645980835, -0.7787859439849854, -0.42035770416259766, -0.06193065643310547, 0.2964974641799927, 0.6549255847930908, 1.013353705406189, 1.371781826019287, 1.7302099466323853, 2.0886380672454834, 2.447066307067871, 2.8054943084716797, 3.1639223098754883, 3.522350549697876, 3.8807787895202637, 4.239206790924072, 4.597634792327881, 4.956063270568848, 5.314491271972656, 5.672919273376465, 6.031347274780273, 6.389775276184082, 6.748203754425049, 7.106631755828857, 7.465059757232666, 7.823488235473633, 8.181916236877441, 8.54034423828125, 8.898772239685059, 9.257200241088867, 9.615628242492676, 9.974056243896484, 10.33248519897461, 10.690913200378418, 11.049341201782227, 11.407769203186035]}, "gradients/decoder.bert.encoder.layer.3.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 5.0, 10.0, 15.0, 16.0, 39.0, 59.0, 63.0, 84.0, 120.0, 200.0, 263.0, 442.0, 657.0, 959.0, 1489.0, 2370.0, 3817.0, 6401.0, 11086.0, 20727.0, 40907.0, 87016.0, 202355.0, 506477.0, 1131189.0, 1206890.0, 562011.0, 220409.0, 93614.0, 43576.0, 21949.0, 11726.0, 6697.0, 3803.0, 2432.0, 1518.0, 976.0, 602.0, 446.0, 288.0, 175.0, 113.0, 93.0, 75.0, 38.0, 25.0, 25.0, 14.0, 9.0, 2.0, 4.0, 4.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-27.03125, -26.06787109375, -25.1044921875, -24.14111328125, -23.177734375, -22.21435546875, -21.2509765625, -20.28759765625, -19.32421875, -18.36083984375, -17.3974609375, -16.43408203125, -15.470703125, -14.50732421875, -13.5439453125, -12.58056640625, -11.6171875, -10.65380859375, -9.6904296875, -8.72705078125, -7.763671875, -6.80029296875, -5.8369140625, -4.87353515625, -3.91015625, -2.94677734375, -1.9833984375, -1.02001953125, -0.056640625, 0.90673828125, 1.8701171875, 2.83349609375, 3.796875, 4.76025390625, 5.7236328125, 6.68701171875, 7.650390625, 8.61376953125, 9.5771484375, 10.54052734375, 11.50390625, 12.46728515625, 13.4306640625, 14.39404296875, 15.357421875, 16.32080078125, 17.2841796875, 18.24755859375, 19.2109375, 20.17431640625, 21.1376953125, 22.10107421875, 23.064453125, 24.02783203125, 24.9912109375, 25.95458984375, 26.91796875, 27.88134765625, 28.8447265625, 29.80810546875, 30.771484375, 31.73486328125, 32.6982421875, 33.66162109375, 34.625]}, "gradients/decoder.bert.encoder.layer.3.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 0.0, 5.0, 4.0, 6.0, 7.0, 10.0, 8.0, 10.0, 9.0, 17.0, 5.0, 11.0, 13.0, 17.0, 21.0, 20.0, 15.0, 23.0, 30.0, 19.0, 33.0, 35.0, 39.0, 32.0, 42.0, 46.0, 41.0, 30.0, 34.0, 35.0, 55.0, 33.0, 42.0, 26.0, 29.0, 17.0, 27.0, 16.0, 30.0, 20.0, 16.0, 8.0, 15.0, 12.0, 8.0, 4.0, 9.0, 4.0, 3.0, 3.0, 1.0, 2.0, 5.0, 5.0, 2.0, 0.0, 1.0, 2.0], "bins": [-9.515625, -9.224365234375, -8.93310546875, -8.641845703125, -8.3505859375, -8.059326171875, -7.76806640625, -7.476806640625, -7.185546875, -6.894287109375, -6.60302734375, -6.311767578125, -6.0205078125, -5.729248046875, -5.43798828125, -5.146728515625, -4.85546875, -4.564208984375, -4.27294921875, -3.981689453125, -3.6904296875, -3.399169921875, -3.10791015625, -2.816650390625, -2.525390625, -2.234130859375, -1.94287109375, -1.651611328125, -1.3603515625, -1.069091796875, -0.77783203125, -0.486572265625, -0.1953125, 0.095947265625, 0.38720703125, 0.678466796875, 0.9697265625, 1.260986328125, 1.55224609375, 1.843505859375, 2.134765625, 2.426025390625, 2.71728515625, 3.008544921875, 3.2998046875, 3.591064453125, 3.88232421875, 4.173583984375, 4.46484375, 4.756103515625, 5.04736328125, 5.338623046875, 5.6298828125, 5.921142578125, 6.21240234375, 6.503662109375, 6.794921875, 7.086181640625, 7.37744140625, 7.668701171875, 7.9599609375, 8.251220703125, 8.54248046875, 8.833740234375, 9.125]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 5.0, 8.0, 6.0, 10.0, 12.0, 16.0, 35.0, 37.0, 54.0, 77.0, 90.0, 179.0, 214.0, 294.0, 416.0, 654.0, 1005.0, 1597.0, 2577.0, 4284.0, 7173.0, 12487.0, 23043.0, 44672.0, 90940.0, 199664.0, 467754.0, 1025652.0, 1194052.0, 617783.0, 261357.0, 116548.0, 55524.0, 28471.0, 15467.0, 8581.0, 5022.0, 3055.0, 1887.0, 1196.0, 766.0, 538.0, 311.0, 252.0, 172.0, 123.0, 78.0, 47.0, 33.0, 29.0, 16.0, 12.0, 9.0, 8.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-37.90625, -36.76318359375, -35.6201171875, -34.47705078125, -33.333984375, -32.19091796875, -31.0478515625, -29.90478515625, -28.76171875, -27.61865234375, -26.4755859375, -25.33251953125, -24.189453125, -23.04638671875, -21.9033203125, -20.76025390625, -19.6171875, -18.47412109375, -17.3310546875, -16.18798828125, -15.044921875, -13.90185546875, -12.7587890625, -11.61572265625, -10.47265625, -9.32958984375, -8.1865234375, -7.04345703125, -5.900390625, -4.75732421875, -3.6142578125, -2.47119140625, -1.328125, -0.18505859375, 0.9580078125, 2.10107421875, 3.244140625, 4.38720703125, 5.5302734375, 6.67333984375, 7.81640625, 8.95947265625, 10.1025390625, 11.24560546875, 12.388671875, 13.53173828125, 14.6748046875, 15.81787109375, 16.9609375, 18.10400390625, 19.2470703125, 20.39013671875, 21.533203125, 22.67626953125, 23.8193359375, 24.96240234375, 26.10546875, 27.24853515625, 28.3916015625, 29.53466796875, 30.677734375, 31.82080078125, 32.9638671875, 34.10693359375, 35.25]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 13.0, 7.0, 10.0, 10.0, 15.0, 19.0, 22.0, 36.0, 43.0, 56.0, 100.0, 102.0, 113.0, 150.0, 200.0, 243.0, 289.0, 288.0, 294.0, 308.0, 329.0, 268.0, 225.0, 204.0, 144.0, 120.0, 99.0, 88.0, 51.0, 47.0, 40.0, 30.0, 25.0, 15.0, 12.0, 21.0, 10.0, 7.0, 4.0, 4.0, 4.0, 3.0, 7.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.578125, -8.2950439453125, -8.011962890625, -7.7288818359375, -7.44580078125, -7.1627197265625, -6.879638671875, -6.5965576171875, -6.3134765625, -6.0303955078125, -5.747314453125, -5.4642333984375, -5.18115234375, -4.8980712890625, -4.614990234375, -4.3319091796875, -4.048828125, -3.7657470703125, -3.482666015625, -3.1995849609375, -2.91650390625, -2.6334228515625, -2.350341796875, -2.0672607421875, -1.7841796875, -1.5010986328125, -1.218017578125, -0.9349365234375, -0.65185546875, -0.3687744140625, -0.085693359375, 0.1973876953125, 0.48046875, 0.7635498046875, 1.046630859375, 1.3297119140625, 1.61279296875, 1.8958740234375, 2.178955078125, 2.4620361328125, 2.7451171875, 3.0281982421875, 3.311279296875, 3.5943603515625, 3.87744140625, 4.1605224609375, 4.443603515625, 4.7266845703125, 5.009765625, 5.2928466796875, 5.575927734375, 5.8590087890625, 6.14208984375, 6.4251708984375, 6.708251953125, 6.9913330078125, 7.2744140625, 7.5574951171875, 7.840576171875, 8.1236572265625, 8.40673828125, 8.6898193359375, 8.972900390625, 9.2559814453125, 9.5390625]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 4.0, 1.0, 6.0, 5.0, 3.0, 11.0, 18.0, 11.0, 15.0, 16.0, 18.0, 24.0, 41.0, 32.0, 35.0, 32.0, 60.0, 73.0, 53.0, 50.0, 63.0, 61.0, 63.0, 39.0, 41.0, 44.0, 20.0, 19.0, 29.0, 27.0, 17.0, 12.0, 9.0, 11.0, 8.0, 4.0, 5.0, 7.0, 2.0, 2.0, 6.0, 1.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-28.729507446289062, -27.8569393157959, -26.984371185302734, -26.11180305480957, -25.239234924316406, -24.36666488647461, -23.494098663330078, -22.62152862548828, -21.748960494995117, -20.876392364501953, -20.00382423400879, -19.131256103515625, -18.25868797302246, -17.386119842529297, -16.5135498046875, -15.640981674194336, -14.768414497375488, -13.895846366882324, -13.02327823638916, -12.15070915222168, -11.278141021728516, -10.405572891235352, -9.533004760742188, -8.660436630249023, -7.787868022918701, -6.915299892425537, -6.042731285095215, -5.170163154602051, -4.297595024108887, -3.4250264167785645, -2.5524582862854004, -1.6798896789550781, -0.8073215484619141, 0.06524676084518433, 0.9378150701522827, 1.8103833198547363, 2.6829516887664795, 3.5555200576782227, 4.428088188171387, 5.300656795501709, 6.173224925994873, 7.045793056488037, 7.918361663818359, 8.790929794311523, 9.663497924804688, 10.536066055297852, 11.408634185791016, 12.281203269958496, 13.15377140045166, 14.026339530944824, 14.898907661437988, 15.771476745605469, 16.644044876098633, 17.516613006591797, 18.38918113708496, 19.261749267578125, 20.13431739807129, 21.006885528564453, 21.879453659057617, 22.75202178955078, 23.624589920043945, 24.49715805053711, 25.369728088378906, 26.24229621887207, 27.114864349365234]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 2.0, 6.0, 5.0, 3.0, 8.0, 7.0, 10.0, 16.0, 14.0, 10.0, 12.0, 17.0, 14.0, 21.0, 18.0, 27.0, 39.0, 33.0, 35.0, 38.0, 36.0, 41.0, 32.0, 31.0, 38.0, 30.0, 43.0, 37.0, 46.0, 35.0, 31.0, 35.0, 34.0, 35.0, 31.0, 26.0, 19.0, 20.0, 19.0, 11.0, 12.0, 9.0, 5.0, 7.0, 4.0, 3.0, 1.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-12.919206619262695, -12.46863842010498, -12.01806926727295, -11.567501068115234, -11.116931915283203, -10.666363716125488, -10.215795516967773, -9.765226364135742, -9.314658164978027, -8.864089965820312, -8.413520812988281, -7.962952613830566, -7.512383937835693, -7.06181526184082, -6.6112470626831055, -6.160678386688232, -5.710109710693359, -5.259541034698486, -4.808972358703613, -4.358404159545898, -3.9078354835510254, -3.4572668075561523, -3.0066983699798584, -2.5561299324035645, -2.1055612564086914, -1.654992699623108, -1.2044241428375244, -0.7538555860519409, -0.3032870292663574, 0.14728164672851562, 0.5978500843048096, 1.0484185218811035, 1.4989862442016602, 1.9495548009872437, 2.400123357772827, 2.850691795349121, 3.301260471343994, 3.751829147338867, 4.202397346496582, 4.652966022491455, 5.103534698486328, 5.554103374481201, 6.004672050476074, 6.455240249633789, 6.905808925628662, 7.356377601623535, 7.80694580078125, 8.257514953613281, 8.708083152770996, 9.158651351928711, 9.609220504760742, 10.059788703918457, 10.510356903076172, 10.960926055908203, 11.411494255065918, 11.862062454223633, 12.312631607055664, 12.763199806213379, 13.21376895904541, 13.664337158203125, 14.114906311035156, 14.565474510192871, 15.016042709350586, 15.466611862182617, 15.917180061340332]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 4.0, 8.0, 10.0, 11.0, 24.0, 30.0, 37.0, 44.0, 75.0, 110.0, 178.0, 241.0, 383.0, 564.0, 894.0, 1429.0, 2271.0, 3848.0, 6357.0, 11174.0, 19267.0, 34310.0, 59987.0, 102008.0, 157984.0, 197521.0, 171634.0, 115424.0, 68894.0, 39555.0, 22758.0, 12829.0, 7445.0, 4261.0, 2563.0, 1517.0, 991.0, 644.0, 450.0, 270.0, 183.0, 112.0, 69.0, 61.0, 35.0, 40.0, 16.0, 12.0, 13.0, 4.0, 6.0, 0.0, 4.0, 2.0, 5.0, 1.0, 2.0], "bins": [-13.46875, -13.055908203125, -12.64306640625, -12.230224609375, -11.8173828125, -11.404541015625, -10.99169921875, -10.578857421875, -10.166015625, -9.753173828125, -9.34033203125, -8.927490234375, -8.5146484375, -8.101806640625, -7.68896484375, -7.276123046875, -6.86328125, -6.450439453125, -6.03759765625, -5.624755859375, -5.2119140625, -4.799072265625, -4.38623046875, -3.973388671875, -3.560546875, -3.147705078125, -2.73486328125, -2.322021484375, -1.9091796875, -1.496337890625, -1.08349609375, -0.670654296875, -0.2578125, 0.155029296875, 0.56787109375, 0.980712890625, 1.3935546875, 1.806396484375, 2.21923828125, 2.632080078125, 3.044921875, 3.457763671875, 3.87060546875, 4.283447265625, 4.6962890625, 5.109130859375, 5.52197265625, 5.934814453125, 6.34765625, 6.760498046875, 7.17333984375, 7.586181640625, 7.9990234375, 8.411865234375, 8.82470703125, 9.237548828125, 9.650390625, 10.063232421875, 10.47607421875, 10.888916015625, 11.3017578125, 11.714599609375, 12.12744140625, 12.540283203125, 12.953125]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 5.0, 2.0, 7.0, 4.0, 7.0, 14.0, 13.0, 21.0, 11.0, 14.0, 22.0, 27.0, 36.0, 30.0, 32.0, 41.0, 45.0, 40.0, 47.0, 40.0, 47.0, 52.0, 43.0, 45.0, 48.0, 39.0, 39.0, 44.0, 28.0, 30.0, 28.0, 19.0, 19.0, 9.0, 14.0, 13.0, 5.0, 6.0, 6.0, 8.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-19.625, -19.0390625, -18.453125, -17.8671875, -17.28125, -16.6953125, -16.109375, -15.5234375, -14.9375, -14.3515625, -13.765625, -13.1796875, -12.59375, -12.0078125, -11.421875, -10.8359375, -10.25, -9.6640625, -9.078125, -8.4921875, -7.90625, -7.3203125, -6.734375, -6.1484375, -5.5625, -4.9765625, -4.390625, -3.8046875, -3.21875, -2.6328125, -2.046875, -1.4609375, -0.875, -0.2890625, 0.296875, 0.8828125, 1.46875, 2.0546875, 2.640625, 3.2265625, 3.8125, 4.3984375, 4.984375, 5.5703125, 6.15625, 6.7421875, 7.328125, 7.9140625, 8.5, 9.0859375, 9.671875, 10.2578125, 10.84375, 11.4296875, 12.015625, 12.6015625, 13.1875, 13.7734375, 14.359375, 14.9453125, 15.53125, 16.1171875, 16.703125, 17.2890625, 17.875]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 0.0, 6.0, 7.0, 7.0, 9.0, 17.0, 21.0, 35.0, 39.0, 76.0, 96.0, 145.0, 192.0, 277.0, 401.0, 543.0, 722.0, 1045.0, 1697.0, 2364.0, 3652.0, 6019.0, 9909.0, 17444.0, 30944.0, 57335.0, 106197.0, 186184.0, 236937.0, 170766.0, 95407.0, 51447.0, 27991.0, 15608.0, 8947.0, 5536.0, 3491.0, 2210.0, 1467.0, 997.0, 720.0, 472.0, 331.0, 236.0, 181.0, 137.0, 85.0, 58.0, 45.0, 27.0, 34.0, 18.0, 12.0, 5.0, 5.0, 6.0, 3.0, 4.0, 0.0, 3.0], "bins": [-16.578125, -16.066650390625, -15.55517578125, -15.043701171875, -14.5322265625, -14.020751953125, -13.50927734375, -12.997802734375, -12.486328125, -11.974853515625, -11.46337890625, -10.951904296875, -10.4404296875, -9.928955078125, -9.41748046875, -8.906005859375, -8.39453125, -7.883056640625, -7.37158203125, -6.860107421875, -6.3486328125, -5.837158203125, -5.32568359375, -4.814208984375, -4.302734375, -3.791259765625, -3.27978515625, -2.768310546875, -2.2568359375, -1.745361328125, -1.23388671875, -0.722412109375, -0.2109375, 0.300537109375, 0.81201171875, 1.323486328125, 1.8349609375, 2.346435546875, 2.85791015625, 3.369384765625, 3.880859375, 4.392333984375, 4.90380859375, 5.415283203125, 5.9267578125, 6.438232421875, 6.94970703125, 7.461181640625, 7.97265625, 8.484130859375, 8.99560546875, 9.507080078125, 10.0185546875, 10.530029296875, 11.04150390625, 11.552978515625, 12.064453125, 12.575927734375, 13.08740234375, 13.598876953125, 14.1103515625, 14.621826171875, 15.13330078125, 15.644775390625, 16.15625]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 4.0, 5.0, 5.0, 7.0, 15.0, 11.0, 12.0, 9.0, 5.0, 22.0, 29.0, 21.0, 34.0, 32.0, 38.0, 40.0, 52.0, 52.0, 40.0, 45.0, 59.0, 46.0, 42.0, 40.0, 45.0, 32.0, 41.0, 32.0, 28.0, 24.0, 18.0, 20.0, 14.0, 18.0, 14.0, 14.0, 11.0, 9.0, 8.0, 3.0, 8.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.7109375, -9.372314453125, -9.03369140625, -8.695068359375, -8.3564453125, -8.017822265625, -7.67919921875, -7.340576171875, -7.001953125, -6.663330078125, -6.32470703125, -5.986083984375, -5.6474609375, -5.308837890625, -4.97021484375, -4.631591796875, -4.29296875, -3.954345703125, -3.61572265625, -3.277099609375, -2.9384765625, -2.599853515625, -2.26123046875, -1.922607421875, -1.583984375, -1.245361328125, -0.90673828125, -0.568115234375, -0.2294921875, 0.109130859375, 0.44775390625, 0.786376953125, 1.125, 1.463623046875, 1.80224609375, 2.140869140625, 2.4794921875, 2.818115234375, 3.15673828125, 3.495361328125, 3.833984375, 4.172607421875, 4.51123046875, 4.849853515625, 5.1884765625, 5.527099609375, 5.86572265625, 6.204345703125, 6.54296875, 6.881591796875, 7.22021484375, 7.558837890625, 7.8974609375, 8.236083984375, 8.57470703125, 8.913330078125, 9.251953125, 9.590576171875, 9.92919921875, 10.267822265625, 10.6064453125, 10.945068359375, 11.28369140625, 11.622314453125, 11.9609375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 8.0, 5.0, 8.0, 8.0, 18.0, 24.0, 33.0, 49.0, 63.0, 110.0, 192.0, 286.0, 457.0, 816.0, 1299.0, 2294.0, 4141.0, 7708.0, 14416.0, 28782.0, 59462.0, 124599.0, 242529.0, 270900.0, 149112.0, 70377.0, 33854.0, 16900.0, 8769.0, 4839.0, 2593.0, 1562.0, 906.0, 560.0, 319.0, 193.0, 120.0, 84.0, 47.0, 43.0, 20.0, 20.0, 12.0, 7.0, 4.0, 4.0, 5.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.9140625, -6.6766357421875, -6.439208984375, -6.2017822265625, -5.96435546875, -5.7269287109375, -5.489501953125, -5.2520751953125, -5.0146484375, -4.7772216796875, -4.539794921875, -4.3023681640625, -4.06494140625, -3.8275146484375, -3.590087890625, -3.3526611328125, -3.115234375, -2.8778076171875, -2.640380859375, -2.4029541015625, -2.16552734375, -1.9281005859375, -1.690673828125, -1.4532470703125, -1.2158203125, -0.9783935546875, -0.740966796875, -0.5035400390625, -0.26611328125, -0.0286865234375, 0.208740234375, 0.4461669921875, 0.68359375, 0.9210205078125, 1.158447265625, 1.3958740234375, 1.63330078125, 1.8707275390625, 2.108154296875, 2.3455810546875, 2.5830078125, 2.8204345703125, 3.057861328125, 3.2952880859375, 3.53271484375, 3.7701416015625, 4.007568359375, 4.2449951171875, 4.482421875, 4.7198486328125, 4.957275390625, 5.1947021484375, 5.43212890625, 5.6695556640625, 5.906982421875, 6.1444091796875, 6.3818359375, 6.6192626953125, 6.856689453125, 7.0941162109375, 7.33154296875, 7.5689697265625, 7.806396484375, 8.0438232421875, 8.28125]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 5.0, 5.0, 4.0, 9.0, 13.0, 15.0, 20.0, 26.0, 41.0, 42.0, 56.0, 57.0, 86.0, 98.0, 81.0, 69.0, 85.0, 74.0, 50.0, 43.0, 37.0, 17.0, 23.0, 16.0, 8.0, 10.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006275177001953125, -0.0006091967225074768, -0.0005908757448196411, -0.0005725547671318054, -0.0005542337894439697, -0.000535912811756134, -0.0005175918340682983, -0.0004992708563804626, -0.00048094987869262695, -0.00046262890100479126, -0.00044430792331695557, -0.0004259869456291199, -0.0004076659679412842, -0.0003893449902534485, -0.0003710240125656128, -0.0003527030348777771, -0.0003343820571899414, -0.0003160610795021057, -0.00029774010181427, -0.0002794191241264343, -0.00026109814643859863, -0.00024277716875076294, -0.00022445619106292725, -0.00020613521337509155, -0.00018781423568725586, -0.00016949325799942017, -0.00015117228031158447, -0.00013285130262374878, -0.00011453032493591309, -9.620934724807739e-05, -7.78883695602417e-05, -5.9567391872406006e-05, -4.124641418457031e-05, -2.292543649673462e-05, -4.604458808898926e-06, 1.3716518878936768e-05, 3.203749656677246e-05, 5.0358474254608154e-05, 6.867945194244385e-05, 8.700042963027954e-05, 0.00010532140731811523, 0.00012364238500595093, 0.00014196336269378662, 0.00016028434038162231, 0.000178605318069458, 0.0001969262957572937, 0.0002152472734451294, 0.0002335682511329651, 0.0002518892288208008, 0.0002702102065086365, 0.00028853118419647217, 0.00030685216188430786, 0.00032517313957214355, 0.00034349411725997925, 0.00036181509494781494, 0.00038013607263565063, 0.00039845705032348633, 0.000416778028011322, 0.0004350990056991577, 0.0004534199833869934, 0.0004717409610748291, 0.0004900619387626648, 0.0005083829164505005, 0.0005267038941383362, 0.0005450248718261719]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 3.0, 8.0, 16.0, 14.0, 13.0, 25.0, 44.0, 78.0, 116.0, 169.0, 270.0, 368.0, 573.0, 884.0, 1370.0, 2226.0, 3564.0, 5674.0, 9347.0, 14794.0, 25067.0, 40996.0, 66863.0, 106444.0, 151599.0, 174914.0, 154667.0, 110087.0, 69088.0, 42370.0, 25667.0, 15652.0, 9512.0, 5829.0, 3743.0, 2274.0, 1436.0, 975.0, 611.0, 420.0, 263.0, 184.0, 117.0, 83.0, 39.0, 42.0, 24.0, 14.0, 9.0, 7.0, 4.0, 3.0, 4.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.359375, -5.17156982421875, -4.9837646484375, -4.79595947265625, -4.608154296875, -4.42034912109375, -4.2325439453125, -4.04473876953125, -3.85693359375, -3.66912841796875, -3.4813232421875, -3.29351806640625, -3.105712890625, -2.91790771484375, -2.7301025390625, -2.54229736328125, -2.3544921875, -2.16668701171875, -1.9788818359375, -1.79107666015625, -1.603271484375, -1.41546630859375, -1.2276611328125, -1.03985595703125, -0.85205078125, -0.66424560546875, -0.4764404296875, -0.28863525390625, -0.100830078125, 0.08697509765625, 0.2747802734375, 0.46258544921875, 0.650390625, 0.83819580078125, 1.0260009765625, 1.21380615234375, 1.401611328125, 1.58941650390625, 1.7772216796875, 1.96502685546875, 2.15283203125, 2.34063720703125, 2.5284423828125, 2.71624755859375, 2.904052734375, 3.09185791015625, 3.2796630859375, 3.46746826171875, 3.6552734375, 3.84307861328125, 4.0308837890625, 4.21868896484375, 4.406494140625, 4.59429931640625, 4.7821044921875, 4.96990966796875, 5.15771484375, 5.34552001953125, 5.5333251953125, 5.72113037109375, 5.908935546875, 6.09674072265625, 6.2845458984375, 6.47235107421875, 6.66015625]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 2.0, 0.0, 3.0, 10.0, 13.0, 12.0, 19.0, 21.0, 13.0, 19.0, 28.0, 30.0, 45.0, 28.0, 43.0, 45.0, 54.0, 61.0, 60.0, 50.0, 35.0, 40.0, 43.0, 43.0, 46.0, 25.0, 34.0, 36.0, 29.0, 19.0, 13.0, 15.0, 18.0, 9.0, 10.0, 7.0, 8.0, 1.0, 1.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.673828125, -1.621368408203125, -1.56890869140625, -1.516448974609375, -1.4639892578125, -1.411529541015625, -1.35906982421875, -1.306610107421875, -1.254150390625, -1.201690673828125, -1.14923095703125, -1.096771240234375, -1.0443115234375, -0.991851806640625, -0.93939208984375, -0.886932373046875, -0.83447265625, -0.782012939453125, -0.72955322265625, -0.677093505859375, -0.6246337890625, -0.572174072265625, -0.51971435546875, -0.467254638671875, -0.414794921875, -0.362335205078125, -0.30987548828125, -0.257415771484375, -0.2049560546875, -0.152496337890625, -0.10003662109375, -0.047576904296875, 0.0048828125, 0.057342529296875, 0.10980224609375, 0.162261962890625, 0.2147216796875, 0.267181396484375, 0.31964111328125, 0.372100830078125, 0.424560546875, 0.477020263671875, 0.52947998046875, 0.581939697265625, 0.6343994140625, 0.686859130859375, 0.73931884765625, 0.791778564453125, 0.84423828125, 0.896697998046875, 0.94915771484375, 1.001617431640625, 1.0540771484375, 1.106536865234375, 1.15899658203125, 1.211456298828125, 1.263916015625, 1.316375732421875, 1.36883544921875, 1.421295166015625, 1.4737548828125, 1.526214599609375, 1.57867431640625, 1.631134033203125, 1.68359375]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 4.0, 4.0, 5.0, 10.0, 14.0, 12.0, 14.0, 11.0, 28.0, 23.0, 33.0, 32.0, 39.0, 46.0, 55.0, 49.0, 63.0, 53.0, 67.0, 65.0, 57.0, 49.0, 41.0, 39.0, 23.0, 24.0, 26.0, 23.0, 21.0, 14.0, 11.0, 6.0, 5.0, 5.0, 4.0, 6.0, 4.0, 3.0, 1.0, 3.0, 7.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-29.114336013793945, -28.23215675354004, -27.3499755859375, -26.467796325683594, -25.585617065429688, -24.70343780517578, -23.821256637573242, -22.939077377319336, -22.05689811706543, -21.174718856811523, -20.292537689208984, -19.410358428955078, -18.528179168701172, -17.645999908447266, -16.763818740844727, -15.88163948059082, -14.999459266662598, -14.117279052734375, -13.235099792480469, -12.352919578552246, -11.47074031829834, -10.588560104370117, -9.706380844116211, -8.824200630187988, -7.942020893096924, -7.059841156005859, -6.177661418914795, -5.2954816818237305, -4.413301467895508, -3.5311217308044434, -2.648941993713379, -1.7667622566223145, -0.88458251953125, -0.0024027228355407715, 0.8797770738601685, 1.7619569301605225, 2.644136667251587, 3.5263166427612305, 4.408496379852295, 5.290676116943359, 6.172855854034424, 7.055035591125488, 7.937215328216553, 8.819395065307617, 9.70157527923584, 10.583755493164062, 11.465934753417969, 12.348114013671875, 13.230294227600098, 14.11247444152832, 14.994653701782227, 15.87683391571045, 16.759014129638672, 17.641193389892578, 18.523372650146484, 19.40555191040039, 20.28773307800293, 21.169912338256836, 22.052093505859375, 22.93427276611328, 23.816452026367188, 24.698631286621094, 25.580812454223633, 26.46299171447754, 27.345170974731445]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 3.0, 7.0, 6.0, 5.0, 8.0, 8.0, 14.0, 14.0, 14.0, 11.0, 11.0, 18.0, 24.0, 17.0, 25.0, 30.0, 34.0, 38.0, 40.0, 37.0, 36.0, 36.0, 35.0, 35.0, 35.0, 37.0, 45.0, 35.0, 43.0, 29.0, 40.0, 34.0, 30.0, 31.0, 29.0, 17.0, 19.0, 15.0, 19.0, 13.0, 11.0, 4.0, 5.0, 5.0, 4.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.912052154541016, -12.462684631347656, -12.013318061828613, -11.563950538635254, -11.114583969116211, -10.665216445922852, -10.215848922729492, -9.76648235321045, -9.317115783691406, -8.867748260498047, -8.418381690979004, -7.9690141677856445, -7.519647598266602, -7.070280075073242, -6.620913028717041, -6.17154598236084, -5.7221784591674805, -5.272811412811279, -4.823444366455078, -4.374076843261719, -3.9247100353240967, -3.4753429889678955, -3.0259757041931152, -2.576608657836914, -2.127241611480713, -1.6778745651245117, -1.228507399559021, -0.7791402339935303, -0.3297731876373291, 0.11959385871887207, 0.5689611434936523, 1.0183281898498535, 1.467696189880371, 1.9170632362365723, 2.3664302825927734, 2.8157975673675537, 3.265164613723755, 3.714531660079956, 4.163898944854736, 4.6132659912109375, 5.062633037567139, 5.51200008392334, 5.961367130279541, 6.410734176635742, 6.860101699829102, 7.3094682693481445, 7.758835792541504, 8.208202362060547, 8.657569885253906, 9.106937408447266, 9.556303977966309, 10.005671501159668, 10.455038070678711, 10.90440559387207, 11.35377311706543, 11.803139686584473, 12.252506256103516, 12.701873779296875, 13.151240348815918, 13.600607872009277, 14.04997444152832, 14.49934196472168, 14.948709487915039, 15.398076057434082, 15.847443580627441]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 5.0, 7.0, 7.0, 14.0, 24.0, 27.0, 53.0, 84.0, 113.0, 168.0, 244.0, 401.0, 632.0, 993.0, 1507.0, 2376.0, 3612.0, 5752.0, 8887.0, 13819.0, 21611.0, 33372.0, 51637.0, 76165.0, 105933.0, 133440.0, 143924.0, 130768.0, 102125.0, 72940.0, 48751.0, 31721.0, 20711.0, 13174.0, 8422.0, 5373.0, 3456.0, 2190.0, 1454.0, 919.0, 623.0, 387.0, 262.0, 156.0, 125.0, 71.0, 52.0, 36.0, 18.0, 14.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-16.890625, -16.31689453125, -15.7431640625, -15.16943359375, -14.595703125, -14.02197265625, -13.4482421875, -12.87451171875, -12.30078125, -11.72705078125, -11.1533203125, -10.57958984375, -10.005859375, -9.43212890625, -8.8583984375, -8.28466796875, -7.7109375, -7.13720703125, -6.5634765625, -5.98974609375, -5.416015625, -4.84228515625, -4.2685546875, -3.69482421875, -3.12109375, -2.54736328125, -1.9736328125, -1.39990234375, -0.826171875, -0.25244140625, 0.3212890625, 0.89501953125, 1.46875, 2.04248046875, 2.6162109375, 3.18994140625, 3.763671875, 4.33740234375, 4.9111328125, 5.48486328125, 6.05859375, 6.63232421875, 7.2060546875, 7.77978515625, 8.353515625, 8.92724609375, 9.5009765625, 10.07470703125, 10.6484375, 11.22216796875, 11.7958984375, 12.36962890625, 12.943359375, 13.51708984375, 14.0908203125, 14.66455078125, 15.23828125, 15.81201171875, 16.3857421875, 16.95947265625, 17.533203125, 18.10693359375, 18.6806640625, 19.25439453125, 19.828125]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 4.0, 3.0, 6.0, 4.0, 9.0, 11.0, 11.0, 11.0, 15.0, 14.0, 19.0, 29.0, 25.0, 30.0, 38.0, 33.0, 42.0, 33.0, 41.0, 45.0, 37.0, 41.0, 39.0, 43.0, 49.0, 45.0, 33.0, 52.0, 36.0, 27.0, 32.0, 23.0, 16.0, 25.0, 17.0, 20.0, 10.0, 9.0, 1.0, 10.0, 3.0, 6.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-17.1875, -16.646240234375, -16.10498046875, -15.563720703125, -15.0224609375, -14.481201171875, -13.93994140625, -13.398681640625, -12.857421875, -12.316162109375, -11.77490234375, -11.233642578125, -10.6923828125, -10.151123046875, -9.60986328125, -9.068603515625, -8.52734375, -7.986083984375, -7.44482421875, -6.903564453125, -6.3623046875, -5.821044921875, -5.27978515625, -4.738525390625, -4.197265625, -3.656005859375, -3.11474609375, -2.573486328125, -2.0322265625, -1.490966796875, -0.94970703125, -0.408447265625, 0.1328125, 0.674072265625, 1.21533203125, 1.756591796875, 2.2978515625, 2.839111328125, 3.38037109375, 3.921630859375, 4.462890625, 5.004150390625, 5.54541015625, 6.086669921875, 6.6279296875, 7.169189453125, 7.71044921875, 8.251708984375, 8.79296875, 9.334228515625, 9.87548828125, 10.416748046875, 10.9580078125, 11.499267578125, 12.04052734375, 12.581787109375, 13.123046875, 13.664306640625, 14.20556640625, 14.746826171875, 15.2880859375, 15.829345703125, 16.37060546875, 16.911865234375, 17.453125]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 9.0, 5.0, 22.0, 23.0, 26.0, 51.0, 68.0, 114.0, 178.0, 259.0, 406.0, 579.0, 926.0, 1500.0, 2307.0, 3770.0, 6196.0, 10354.0, 17192.0, 28598.0, 46367.0, 73544.0, 110327.0, 146516.0, 162154.0, 144047.0, 107484.0, 71367.0, 44570.0, 27120.0, 16809.0, 9820.0, 6014.0, 3631.0, 2265.0, 1361.0, 892.0, 583.0, 404.0, 238.0, 147.0, 104.0, 76.0, 37.0, 38.0, 21.0, 14.0, 10.0, 7.0, 8.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-22.0625, -21.3828125, -20.703125, -20.0234375, -19.34375, -18.6640625, -17.984375, -17.3046875, -16.625, -15.9453125, -15.265625, -14.5859375, -13.90625, -13.2265625, -12.546875, -11.8671875, -11.1875, -10.5078125, -9.828125, -9.1484375, -8.46875, -7.7890625, -7.109375, -6.4296875, -5.75, -5.0703125, -4.390625, -3.7109375, -3.03125, -2.3515625, -1.671875, -0.9921875, -0.3125, 0.3671875, 1.046875, 1.7265625, 2.40625, 3.0859375, 3.765625, 4.4453125, 5.125, 5.8046875, 6.484375, 7.1640625, 7.84375, 8.5234375, 9.203125, 9.8828125, 10.5625, 11.2421875, 11.921875, 12.6015625, 13.28125, 13.9609375, 14.640625, 15.3203125, 16.0, 16.6796875, 17.359375, 18.0390625, 18.71875, 19.3984375, 20.078125, 20.7578125, 21.4375]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 11.0, 6.0, 3.0, 3.0, 13.0, 14.0, 14.0, 19.0, 28.0, 16.0, 26.0, 33.0, 35.0, 42.0, 35.0, 34.0, 48.0, 45.0, 58.0, 59.0, 45.0, 48.0, 49.0, 47.0, 41.0, 34.0, 31.0, 25.0, 22.0, 24.0, 23.0, 21.0, 15.0, 10.0, 8.0, 9.0, 5.0, 8.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.953125, -13.56005859375, -13.1669921875, -12.77392578125, -12.380859375, -11.98779296875, -11.5947265625, -11.20166015625, -10.80859375, -10.41552734375, -10.0224609375, -9.62939453125, -9.236328125, -8.84326171875, -8.4501953125, -8.05712890625, -7.6640625, -7.27099609375, -6.8779296875, -6.48486328125, -6.091796875, -5.69873046875, -5.3056640625, -4.91259765625, -4.51953125, -4.12646484375, -3.7333984375, -3.34033203125, -2.947265625, -2.55419921875, -2.1611328125, -1.76806640625, -1.375, -0.98193359375, -0.5888671875, -0.19580078125, 0.197265625, 0.59033203125, 0.9833984375, 1.37646484375, 1.76953125, 2.16259765625, 2.5556640625, 2.94873046875, 3.341796875, 3.73486328125, 4.1279296875, 4.52099609375, 4.9140625, 5.30712890625, 5.7001953125, 6.09326171875, 6.486328125, 6.87939453125, 7.2724609375, 7.66552734375, 8.05859375, 8.45166015625, 8.8447265625, 9.23779296875, 9.630859375, 10.02392578125, 10.4169921875, 10.81005859375, 11.203125]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 6.0, 7.0, 4.0, 7.0, 9.0, 22.0, 31.0, 32.0, 42.0, 53.0, 89.0, 121.0, 213.0, 303.0, 524.0, 885.0, 1516.0, 2975.0, 6465.0, 14783.0, 38466.0, 115647.0, 342180.0, 341950.0, 115594.0, 38528.0, 14823.0, 6341.0, 3078.0, 1559.0, 872.0, 506.0, 282.0, 207.0, 131.0, 78.0, 58.0, 49.0, 34.0, 25.0, 11.0, 17.0, 13.0, 2.0, 12.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-32.21875, -31.2119140625, -30.205078125, -29.1982421875, -28.19140625, -27.1845703125, -26.177734375, -25.1708984375, -24.1640625, -23.1572265625, -22.150390625, -21.1435546875, -20.13671875, -19.1298828125, -18.123046875, -17.1162109375, -16.109375, -15.1025390625, -14.095703125, -13.0888671875, -12.08203125, -11.0751953125, -10.068359375, -9.0615234375, -8.0546875, -7.0478515625, -6.041015625, -5.0341796875, -4.02734375, -3.0205078125, -2.013671875, -1.0068359375, 0.0, 1.0068359375, 2.013671875, 3.0205078125, 4.02734375, 5.0341796875, 6.041015625, 7.0478515625, 8.0546875, 9.0615234375, 10.068359375, 11.0751953125, 12.08203125, 13.0888671875, 14.095703125, 15.1025390625, 16.109375, 17.1162109375, 18.123046875, 19.1298828125, 20.13671875, 21.1435546875, 22.150390625, 23.1572265625, 24.1640625, 25.1708984375, 26.177734375, 27.1845703125, 28.19140625, 29.1982421875, 30.205078125, 31.2119140625, 32.21875]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 12.0, 9.0, 8.0, 12.0, 17.0, 49.0, 63.0, 110.0, 175.0, 183.0, 130.0, 91.0, 50.0, 31.0, 17.0, 8.0, 6.0, 4.0, 7.0, 1.0, 7.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.005340576171875, -0.005217015743255615, -0.0050934553146362305, -0.004969894886016846, -0.004846334457397461, -0.004722774028778076, -0.004599213600158691, -0.004475653171539307, -0.004352092742919922, -0.004228532314300537, -0.004104971885681152, -0.003981411457061768, -0.003857851028442383, -0.003734290599822998, -0.0036107301712036133, -0.0034871697425842285, -0.0033636093139648438, -0.003240048885345459, -0.0031164884567260742, -0.0029929280281066895, -0.0028693675994873047, -0.00274580717086792, -0.002622246742248535, -0.0024986863136291504, -0.0023751258850097656, -0.002251565456390381, -0.002128005027770996, -0.0020044445991516113, -0.0018808841705322266, -0.0017573237419128418, -0.001633763313293457, -0.0015102028846740723, -0.0013866424560546875, -0.0012630820274353027, -0.001139521598815918, -0.0010159611701965332, -0.0008924007415771484, -0.0007688403129577637, -0.0006452798843383789, -0.0005217194557189941, -0.0003981590270996094, -0.0002745985984802246, -0.00015103816986083984, -2.7477741241455078e-05, 9.608268737792969e-05, 0.00021964311599731445, 0.0003432035446166992, 0.000466763973236084, 0.0005903244018554688, 0.0007138848304748535, 0.0008374452590942383, 0.000961005687713623, 0.0010845661163330078, 0.0012081265449523926, 0.0013316869735717773, 0.0014552474021911621, 0.0015788078308105469, 0.0017023682594299316, 0.0018259286880493164, 0.0019494891166687012, 0.002073049545288086, 0.0021966099739074707, 0.0023201704025268555, 0.0024437308311462402, 0.002567291259765625]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 5.0, 6.0, 13.0, 16.0, 22.0, 24.0, 47.0, 70.0, 97.0, 167.0, 219.0, 365.0, 511.0, 854.0, 1310.0, 2161.0, 3502.0, 5789.0, 11030.0, 21588.0, 45769.0, 107532.0, 242739.0, 307724.0, 163404.0, 68109.0, 30809.0, 15001.0, 7904.0, 4423.0, 2701.0, 1738.0, 955.0, 646.0, 421.0, 306.0, 206.0, 116.0, 93.0, 65.0, 31.0, 23.0, 21.0, 11.0, 8.0, 6.0, 5.0, 0.0, 3.0, 2.0, 1.0], "bins": [-27.96875, -27.197021484375, -26.42529296875, -25.653564453125, -24.8818359375, -24.110107421875, -23.33837890625, -22.566650390625, -21.794921875, -21.023193359375, -20.25146484375, -19.479736328125, -18.7080078125, -17.936279296875, -17.16455078125, -16.392822265625, -15.62109375, -14.849365234375, -14.07763671875, -13.305908203125, -12.5341796875, -11.762451171875, -10.99072265625, -10.218994140625, -9.447265625, -8.675537109375, -7.90380859375, -7.132080078125, -6.3603515625, -5.588623046875, -4.81689453125, -4.045166015625, -3.2734375, -2.501708984375, -1.72998046875, -0.958251953125, -0.1865234375, 0.585205078125, 1.35693359375, 2.128662109375, 2.900390625, 3.672119140625, 4.44384765625, 5.215576171875, 5.9873046875, 6.759033203125, 7.53076171875, 8.302490234375, 9.07421875, 9.845947265625, 10.61767578125, 11.389404296875, 12.1611328125, 12.932861328125, 13.70458984375, 14.476318359375, 15.248046875, 16.019775390625, 16.79150390625, 17.563232421875, 18.3349609375, 19.106689453125, 19.87841796875, 20.650146484375, 21.421875]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 7.0, 5.0, 4.0, 2.0, 9.0, 18.0, 17.0, 30.0, 33.0, 37.0, 50.0, 52.0, 53.0, 77.0, 67.0, 90.0, 73.0, 64.0, 75.0, 56.0, 33.0, 32.0, 25.0, 16.0, 23.0, 14.0, 11.0, 5.0, 10.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.2109375, -7.0006103515625, -6.790283203125, -6.5799560546875, -6.36962890625, -6.1593017578125, -5.948974609375, -5.7386474609375, -5.5283203125, -5.3179931640625, -5.107666015625, -4.8973388671875, -4.68701171875, -4.4766845703125, -4.266357421875, -4.0560302734375, -3.845703125, -3.6353759765625, -3.425048828125, -3.2147216796875, -3.00439453125, -2.7940673828125, -2.583740234375, -2.3734130859375, -2.1630859375, -1.9527587890625, -1.742431640625, -1.5321044921875, -1.32177734375, -1.1114501953125, -0.901123046875, -0.6907958984375, -0.48046875, -0.2701416015625, -0.059814453125, 0.1505126953125, 0.36083984375, 0.5711669921875, 0.781494140625, 0.9918212890625, 1.2021484375, 1.4124755859375, 1.622802734375, 1.8331298828125, 2.04345703125, 2.2537841796875, 2.464111328125, 2.6744384765625, 2.884765625, 3.0950927734375, 3.305419921875, 3.5157470703125, 3.72607421875, 3.9364013671875, 4.146728515625, 4.3570556640625, 4.5673828125, 4.7777099609375, 4.988037109375, 5.1983642578125, 5.40869140625, 5.6190185546875, 5.829345703125, 6.0396728515625, 6.25]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 6.0, 3.0, 16.0, 5.0, 12.0, 16.0, 18.0, 13.0, 23.0, 35.0, 40.0, 39.0, 56.0, 53.0, 54.0, 71.0, 57.0, 69.0, 59.0, 58.0, 59.0, 45.0, 25.0, 38.0, 25.0, 13.0, 17.0, 13.0, 13.0, 6.0, 6.0, 8.0, 6.0, 5.0, 3.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.932640075683594, -28.98223876953125, -28.031837463378906, -27.08143424987793, -26.131032943725586, -25.180631637573242, -24.2302303314209, -23.279827117919922, -22.329425811767578, -21.379024505615234, -20.42862319946289, -19.478219985961914, -18.52781867980957, -17.577417373657227, -16.627016067504883, -15.676613807678223, -14.726212501525879, -13.775811195373535, -12.825408935546875, -11.875007629394531, -10.924605369567871, -9.974204063415527, -9.023801803588867, -8.073400497436523, -7.1229987144470215, -6.1725969314575195, -5.222195148468018, -4.271793365478516, -3.3213918209075928, -2.37099027633667, -1.420588493347168, -0.470186710357666, 0.48021507263183594, 1.430616855621338, 2.38101863861084, 3.3314201831817627, 4.281822204589844, 5.2322235107421875, 6.1826252937316895, 7.133027076721191, 8.083429336547852, 9.033830642700195, 9.984232902526855, 10.9346342086792, 11.88503646850586, 12.835437774658203, 13.785839080810547, 14.736241340637207, 15.68664264678955, 16.63704490661621, 17.587446212768555, 18.5378475189209, 19.488248825073242, 20.43865203857422, 21.389053344726562, 22.339454650878906, 23.28985595703125, 24.240257263183594, 25.190658569335938, 26.141061782836914, 27.091463088989258, 28.0418643951416, 28.992265701293945, 29.942668914794922, 30.893070220947266]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 8.0, 6.0, 4.0, 7.0, 7.0, 12.0, 8.0, 12.0, 18.0, 19.0, 25.0, 17.0, 18.0, 25.0, 19.0, 15.0, 27.0, 19.0, 33.0, 36.0, 43.0, 41.0, 28.0, 32.0, 41.0, 41.0, 36.0, 45.0, 31.0, 35.0, 31.0, 26.0, 29.0, 33.0, 27.0, 24.0, 21.0, 23.0, 9.0, 20.0, 6.0, 12.0, 8.0, 8.0, 7.0, 2.0, 0.0, 5.0, 4.0, 2.0, 3.0, 1.0, 3.0], "bins": [-15.10141658782959, -14.670954704284668, -14.240493774414062, -13.81003189086914, -13.379570007324219, -12.949108123779297, -12.518647193908691, -12.08818531036377, -11.657724380493164, -11.227262496948242, -10.796801567077637, -10.366339683532715, -9.935877799987793, -9.505416870117188, -9.074954986572266, -8.644493103027344, -8.214031219482422, -7.783569812774658, -7.353107929229736, -6.922646522521973, -6.492184638977051, -6.061723232269287, -5.631261825561523, -5.200799942016602, -4.770338535308838, -4.339877128601074, -3.9094152450561523, -3.4789538383483887, -3.048492193222046, -2.618030548095703, -2.1875691413879395, -1.7571074962615967, -1.326645851135254, -0.8961842656135559, -0.4657226800918579, -0.03526115417480469, 0.3952004909515381, 0.8256621360778809, 1.2561235427856445, 1.6865851879119873, 2.11704683303833, 2.547508478164673, 2.9779701232910156, 3.4084315299987793, 3.838893175125122, 4.269354820251465, 4.6998162269592285, 5.130277633666992, 5.560739517211914, 5.991200923919678, 6.4216628074646, 6.852124214172363, 7.282586097717285, 7.713047504425049, 8.143508911132812, 8.573970794677734, 9.004432678222656, 9.434894561767578, 9.865355491638184, 10.295817375183105, 10.726279258728027, 11.156740188598633, 11.587202072143555, 12.017663955688477, 12.448124885559082]}, "gradients/decoder.bert.encoder.layer.2.output.dense.weight": {"_type": "histogram", "values": [6.0, 10.0, 8.0, 14.0, 22.0, 31.0, 38.0, 67.0, 59.0, 104.0, 146.0, 172.0, 289.0, 425.0, 584.0, 835.0, 1248.0, 1839.0, 2813.0, 4104.0, 6404.0, 10299.0, 17048.0, 28523.0, 50450.0, 93648.0, 183404.0, 374914.0, 724937.0, 1017857.0, 796489.0, 427548.0, 210119.0, 104868.0, 55538.0, 30835.0, 18044.0, 10947.0, 6753.0, 4234.0, 2730.0, 1826.0, 1216.0, 899.0, 582.0, 411.0, 297.0, 167.0, 148.0, 106.0, 74.0, 45.0, 35.0, 29.0, 15.0, 11.0, 11.0, 7.0, 7.0, 4.0, 5.0, 2.0, 2.0, 2.0], "bins": [-28.140625, -27.189697265625, -26.23876953125, -25.287841796875, -24.3369140625, -23.385986328125, -22.43505859375, -21.484130859375, -20.533203125, -19.582275390625, -18.63134765625, -17.680419921875, -16.7294921875, -15.778564453125, -14.82763671875, -13.876708984375, -12.92578125, -11.974853515625, -11.02392578125, -10.072998046875, -9.1220703125, -8.171142578125, -7.22021484375, -6.269287109375, -5.318359375, -4.367431640625, -3.41650390625, -2.465576171875, -1.5146484375, -0.563720703125, 0.38720703125, 1.338134765625, 2.2890625, 3.239990234375, 4.19091796875, 5.141845703125, 6.0927734375, 7.043701171875, 7.99462890625, 8.945556640625, 9.896484375, 10.847412109375, 11.79833984375, 12.749267578125, 13.7001953125, 14.651123046875, 15.60205078125, 16.552978515625, 17.50390625, 18.454833984375, 19.40576171875, 20.356689453125, 21.3076171875, 22.258544921875, 23.20947265625, 24.160400390625, 25.111328125, 26.062255859375, 27.01318359375, 27.964111328125, 28.9150390625, 29.865966796875, 30.81689453125, 31.767822265625, 32.71875]}, "gradients/decoder.bert.encoder.layer.2.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 0.0, 3.0, 4.0, 7.0, 7.0, 5.0, 5.0, 15.0, 17.0, 18.0, 14.0, 12.0, 20.0, 16.0, 23.0, 19.0, 28.0, 21.0, 32.0, 35.0, 28.0, 28.0, 36.0, 40.0, 27.0, 43.0, 40.0, 41.0, 34.0, 43.0, 33.0, 32.0, 32.0, 26.0, 31.0, 28.0, 24.0, 19.0, 16.0, 13.0, 11.0, 17.0, 16.0, 4.0, 8.0, 8.0, 8.0, 7.0, 2.0, 1.0, 2.0, 0.0, 5.0, 0.0, 3.0, 3.0, 1.0], "bins": [-12.375, -11.996826171875, -11.61865234375, -11.240478515625, -10.8623046875, -10.484130859375, -10.10595703125, -9.727783203125, -9.349609375, -8.971435546875, -8.59326171875, -8.215087890625, -7.8369140625, -7.458740234375, -7.08056640625, -6.702392578125, -6.32421875, -5.946044921875, -5.56787109375, -5.189697265625, -4.8115234375, -4.433349609375, -4.05517578125, -3.677001953125, -3.298828125, -2.920654296875, -2.54248046875, -2.164306640625, -1.7861328125, -1.407958984375, -1.02978515625, -0.651611328125, -0.2734375, 0.104736328125, 0.48291015625, 0.861083984375, 1.2392578125, 1.617431640625, 1.99560546875, 2.373779296875, 2.751953125, 3.130126953125, 3.50830078125, 3.886474609375, 4.2646484375, 4.642822265625, 5.02099609375, 5.399169921875, 5.77734375, 6.155517578125, 6.53369140625, 6.911865234375, 7.2900390625, 7.668212890625, 8.04638671875, 8.424560546875, 8.802734375, 9.180908203125, 9.55908203125, 9.937255859375, 10.3154296875, 10.693603515625, 11.07177734375, 11.449951171875, 11.828125]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 5.0, 8.0, 18.0, 19.0, 30.0, 53.0, 80.0, 112.0, 134.0, 214.0, 263.0, 516.0, 642.0, 1015.0, 1639.0, 2511.0, 4025.0, 6452.0, 10721.0, 18083.0, 31593.0, 56477.0, 104166.0, 201484.0, 399547.0, 756170.0, 1022737.0, 747595.0, 394021.0, 198512.0, 102911.0, 55323.0, 30856.0, 17862.0, 10675.0, 6460.0, 3935.0, 2478.0, 1646.0, 1079.0, 725.0, 472.0, 316.0, 201.0, 159.0, 113.0, 77.0, 53.0, 41.0, 28.0, 17.0, 8.0, 7.0, 5.0, 2.0, 2.0], "bins": [-42.0, -40.7822265625, -39.564453125, -38.3466796875, -37.12890625, -35.9111328125, -34.693359375, -33.4755859375, -32.2578125, -31.0400390625, -29.822265625, -28.6044921875, -27.38671875, -26.1689453125, -24.951171875, -23.7333984375, -22.515625, -21.2978515625, -20.080078125, -18.8623046875, -17.64453125, -16.4267578125, -15.208984375, -13.9912109375, -12.7734375, -11.5556640625, -10.337890625, -9.1201171875, -7.90234375, -6.6845703125, -5.466796875, -4.2490234375, -3.03125, -1.8134765625, -0.595703125, 0.6220703125, 1.83984375, 3.0576171875, 4.275390625, 5.4931640625, 6.7109375, 7.9287109375, 9.146484375, 10.3642578125, 11.58203125, 12.7998046875, 14.017578125, 15.2353515625, 16.453125, 17.6708984375, 18.888671875, 20.1064453125, 21.32421875, 22.5419921875, 23.759765625, 24.9775390625, 26.1953125, 27.4130859375, 28.630859375, 29.8486328125, 31.06640625, 32.2841796875, 33.501953125, 34.7197265625, 35.9375]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 4.0, 6.0, 10.0, 10.0, 15.0, 22.0, 23.0, 29.0, 54.0, 58.0, 71.0, 104.0, 103.0, 143.0, 163.0, 200.0, 244.0, 254.0, 291.0, 289.0, 295.0, 259.0, 243.0, 216.0, 187.0, 137.0, 117.0, 92.0, 92.0, 66.0, 72.0, 40.0, 48.0, 21.0, 30.0, 11.0, 11.0, 9.0, 12.0, 11.0, 2.0, 4.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.4921875, -9.1533203125, -8.814453125, -8.4755859375, -8.13671875, -7.7978515625, -7.458984375, -7.1201171875, -6.78125, -6.4423828125, -6.103515625, -5.7646484375, -5.42578125, -5.0869140625, -4.748046875, -4.4091796875, -4.0703125, -3.7314453125, -3.392578125, -3.0537109375, -2.71484375, -2.3759765625, -2.037109375, -1.6982421875, -1.359375, -1.0205078125, -0.681640625, -0.3427734375, -0.00390625, 0.3349609375, 0.673828125, 1.0126953125, 1.3515625, 1.6904296875, 2.029296875, 2.3681640625, 2.70703125, 3.0458984375, 3.384765625, 3.7236328125, 4.0625, 4.4013671875, 4.740234375, 5.0791015625, 5.41796875, 5.7568359375, 6.095703125, 6.4345703125, 6.7734375, 7.1123046875, 7.451171875, 7.7900390625, 8.12890625, 8.4677734375, 8.806640625, 9.1455078125, 9.484375, 9.8232421875, 10.162109375, 10.5009765625, 10.83984375, 11.1787109375, 11.517578125, 11.8564453125, 12.1953125]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 5.0, 11.0, 14.0, 8.0, 15.0, 15.0, 24.0, 30.0, 44.0, 52.0, 56.0, 55.0, 69.0, 70.0, 86.0, 59.0, 59.0, 71.0, 45.0, 46.0, 34.0, 23.0, 23.0, 17.0, 13.0, 8.0, 8.0, 3.0, 11.0, 6.0, 8.0, 3.0, 2.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-44.60175323486328, -43.22584533691406, -41.84994125366211, -40.47403335571289, -39.09812927246094, -37.72222137451172, -36.3463134765625, -34.97040939331055, -33.594505310058594, -32.218597412109375, -30.842693328857422, -29.466785430908203, -28.09088134765625, -26.71497344970703, -25.339067459106445, -23.96316146850586, -22.58725357055664, -21.211347579956055, -19.83544158935547, -18.45953369140625, -17.083629608154297, -15.707722663879395, -14.331815719604492, -12.955909729003906, -11.58000373840332, -10.204097747802734, -8.828191757202148, -7.452284812927246, -6.07637882232666, -4.700472831726074, -3.324565887451172, -1.948659896850586, -0.5727500915527344, 0.8031561374664307, 2.1790623664855957, 3.55496883392334, 4.930874824523926, 6.306780815124512, 7.682687759399414, 9.05859375, 10.434499740600586, 11.810405731201172, 13.186311721801758, 14.56221866607666, 15.938124656677246, 17.314029693603516, 18.689937591552734, 20.06584358215332, 21.441749572753906, 22.817655563354492, 24.193561553955078, 25.569469451904297, 26.94537353515625, 28.32128143310547, 29.697187423706055, 31.07309341430664, 32.448997497558594, 33.82490539550781, 35.200809478759766, 36.576717376708984, 37.95262145996094, 39.328529357910156, 40.704437255859375, 42.08034133911133, 43.45624923706055]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 2.0, 1.0, 3.0, 7.0, 2.0, 8.0, 11.0, 7.0, 11.0, 8.0, 15.0, 20.0, 22.0, 14.0, 19.0, 21.0, 37.0, 40.0, 38.0, 27.0, 37.0, 43.0, 37.0, 51.0, 45.0, 37.0, 46.0, 36.0, 43.0, 46.0, 31.0, 42.0, 33.0, 22.0, 29.0, 16.0, 19.0, 13.0, 13.0, 14.0, 8.0, 9.0, 7.0, 6.0, 3.0, 6.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-19.908977508544922, -19.299041748046875, -18.68910789489746, -18.079172134399414, -17.46923828125, -16.859302520751953, -16.24936866760254, -15.639432907104492, -15.029498100280762, -14.419563293457031, -13.8096284866333, -13.19969367980957, -12.589757919311523, -11.97982406616211, -11.369888305664062, -10.759953498840332, -10.150018692016602, -9.540083885192871, -8.93014907836914, -8.32021427154541, -7.7102789878845215, -7.100344181060791, -6.490408897399902, -5.880474090576172, -5.270539283752441, -4.660604476928711, -4.0506696701049805, -3.440734386444092, -2.8307995796203613, -2.220864772796631, -1.6109297275543213, -1.0009946823120117, -0.39105796813964844, 0.21887695789337158, 0.8288118839263916, 1.4387468099594116, 2.0486817359924316, 2.658616542816162, 3.2685515880584717, 3.8784866333007812, 4.488421440124512, 5.098356246948242, 5.708291053771973, 6.318226337432861, 6.928161144256592, 7.538095951080322, 8.148031234741211, 8.757966041564941, 9.367900848388672, 9.977835655212402, 10.587770462036133, 11.197705268859863, 11.807640075683594, 12.41757583618164, 13.027510643005371, 13.637445449829102, 14.247380256652832, 14.857315063476562, 15.467249870300293, 16.077184677124023, 16.68712043762207, 17.297054290771484, 17.90699005126953, 18.516925811767578, 19.126859664916992]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 3.0, 4.0, 9.0, 11.0, 11.0, 15.0, 23.0, 29.0, 52.0, 67.0, 103.0, 173.0, 263.0, 463.0, 729.0, 1154.0, 2086.0, 3557.0, 6674.0, 12440.0, 23712.0, 46946.0, 90648.0, 165019.0, 234085.0, 204354.0, 121901.0, 64378.0, 32654.0, 17028.0, 8654.0, 4811.0, 2532.0, 1580.0, 826.0, 592.0, 358.0, 226.0, 133.0, 83.0, 59.0, 39.0, 29.0, 16.0, 15.0, 7.0, 4.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.53125, -19.88427734375, -19.2373046875, -18.59033203125, -17.943359375, -17.29638671875, -16.6494140625, -16.00244140625, -15.35546875, -14.70849609375, -14.0615234375, -13.41455078125, -12.767578125, -12.12060546875, -11.4736328125, -10.82666015625, -10.1796875, -9.53271484375, -8.8857421875, -8.23876953125, -7.591796875, -6.94482421875, -6.2978515625, -5.65087890625, -5.00390625, -4.35693359375, -3.7099609375, -3.06298828125, -2.416015625, -1.76904296875, -1.1220703125, -0.47509765625, 0.171875, 0.81884765625, 1.4658203125, 2.11279296875, 2.759765625, 3.40673828125, 4.0537109375, 4.70068359375, 5.34765625, 5.99462890625, 6.6416015625, 7.28857421875, 7.935546875, 8.58251953125, 9.2294921875, 9.87646484375, 10.5234375, 11.17041015625, 11.8173828125, 12.46435546875, 13.111328125, 13.75830078125, 14.4052734375, 15.05224609375, 15.69921875, 16.34619140625, 16.9931640625, 17.64013671875, 18.287109375, 18.93408203125, 19.5810546875, 20.22802734375, 20.875]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 6.0, 6.0, 3.0, 10.0, 6.0, 9.0, 7.0, 14.0, 11.0, 23.0, 15.0, 21.0, 23.0, 24.0, 34.0, 38.0, 27.0, 50.0, 34.0, 46.0, 42.0, 47.0, 42.0, 59.0, 42.0, 28.0, 45.0, 42.0, 40.0, 30.0, 30.0, 18.0, 22.0, 20.0, 21.0, 16.0, 11.0, 6.0, 7.0, 6.0, 9.0, 2.0, 2.0, 9.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0], "bins": [-24.078125, -23.36474609375, -22.6513671875, -21.93798828125, -21.224609375, -20.51123046875, -19.7978515625, -19.08447265625, -18.37109375, -17.65771484375, -16.9443359375, -16.23095703125, -15.517578125, -14.80419921875, -14.0908203125, -13.37744140625, -12.6640625, -11.95068359375, -11.2373046875, -10.52392578125, -9.810546875, -9.09716796875, -8.3837890625, -7.67041015625, -6.95703125, -6.24365234375, -5.5302734375, -4.81689453125, -4.103515625, -3.39013671875, -2.6767578125, -1.96337890625, -1.25, -0.53662109375, 0.1767578125, 0.89013671875, 1.603515625, 2.31689453125, 3.0302734375, 3.74365234375, 4.45703125, 5.17041015625, 5.8837890625, 6.59716796875, 7.310546875, 8.02392578125, 8.7373046875, 9.45068359375, 10.1640625, 10.87744140625, 11.5908203125, 12.30419921875, 13.017578125, 13.73095703125, 14.4443359375, 15.15771484375, 15.87109375, 16.58447265625, 17.2978515625, 18.01123046875, 18.724609375, 19.43798828125, 20.1513671875, 20.86474609375, 21.578125]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 2.0, 2.0, 8.0, 14.0, 18.0, 26.0, 20.0, 35.0, 58.0, 69.0, 106.0, 150.0, 208.0, 307.0, 461.0, 637.0, 1008.0, 1488.0, 2343.0, 3739.0, 6211.0, 10920.0, 19573.0, 37521.0, 72875.0, 138790.0, 229829.0, 228871.0, 137996.0, 71866.0, 36771.0, 19151.0, 10623.0, 6225.0, 3707.0, 2340.0, 1498.0, 967.0, 626.0, 468.0, 295.0, 225.0, 155.0, 108.0, 76.0, 50.0, 38.0, 23.0, 21.0, 13.0, 8.0, 12.0, 5.0, 3.0, 3.0, 3.0], "bins": [-24.578125, -23.875732421875, -23.17333984375, -22.470947265625, -21.7685546875, -21.066162109375, -20.36376953125, -19.661376953125, -18.958984375, -18.256591796875, -17.55419921875, -16.851806640625, -16.1494140625, -15.447021484375, -14.74462890625, -14.042236328125, -13.33984375, -12.637451171875, -11.93505859375, -11.232666015625, -10.5302734375, -9.827880859375, -9.12548828125, -8.423095703125, -7.720703125, -7.018310546875, -6.31591796875, -5.613525390625, -4.9111328125, -4.208740234375, -3.50634765625, -2.803955078125, -2.1015625, -1.399169921875, -0.69677734375, 0.005615234375, 0.7080078125, 1.410400390625, 2.11279296875, 2.815185546875, 3.517578125, 4.219970703125, 4.92236328125, 5.624755859375, 6.3271484375, 7.029541015625, 7.73193359375, 8.434326171875, 9.13671875, 9.839111328125, 10.54150390625, 11.243896484375, 11.9462890625, 12.648681640625, 13.35107421875, 14.053466796875, 14.755859375, 15.458251953125, 16.16064453125, 16.863037109375, 17.5654296875, 18.267822265625, 18.97021484375, 19.672607421875, 20.375]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 8.0, 6.0, 4.0, 7.0, 6.0, 5.0, 12.0, 12.0, 22.0, 20.0, 21.0, 21.0, 27.0, 21.0, 31.0, 35.0, 38.0, 37.0, 47.0, 46.0, 50.0, 32.0, 45.0, 39.0, 32.0, 47.0, 35.0, 35.0, 34.0, 31.0, 27.0, 35.0, 17.0, 20.0, 19.0, 20.0, 10.0, 17.0, 9.0, 6.0, 7.0, 6.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.703125, -12.2801513671875, -11.857177734375, -11.4342041015625, -11.01123046875, -10.5882568359375, -10.165283203125, -9.7423095703125, -9.3193359375, -8.8963623046875, -8.473388671875, -8.0504150390625, -7.62744140625, -7.2044677734375, -6.781494140625, -6.3585205078125, -5.935546875, -5.5125732421875, -5.089599609375, -4.6666259765625, -4.24365234375, -3.8206787109375, -3.397705078125, -2.9747314453125, -2.5517578125, -2.1287841796875, -1.705810546875, -1.2828369140625, -0.85986328125, -0.4368896484375, -0.013916015625, 0.4090576171875, 0.83203125, 1.2550048828125, 1.677978515625, 2.1009521484375, 2.52392578125, 2.9468994140625, 3.369873046875, 3.7928466796875, 4.2158203125, 4.6387939453125, 5.061767578125, 5.4847412109375, 5.90771484375, 6.3306884765625, 6.753662109375, 7.1766357421875, 7.599609375, 8.0225830078125, 8.445556640625, 8.8685302734375, 9.29150390625, 9.7144775390625, 10.137451171875, 10.5604248046875, 10.9833984375, 11.4063720703125, 11.829345703125, 12.2523193359375, 12.67529296875, 13.0982666015625, 13.521240234375, 13.9442138671875, 14.3671875]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 4.0, 6.0, 8.0, 9.0, 11.0, 16.0, 34.0, 28.0, 72.0, 90.0, 117.0, 211.0, 331.0, 411.0, 646.0, 984.0, 1712.0, 2579.0, 4350.0, 7260.0, 12144.0, 21578.0, 39509.0, 74092.0, 141039.0, 238310.0, 223527.0, 126829.0, 67450.0, 36007.0, 20125.0, 11226.0, 6736.0, 4178.0, 2501.0, 1526.0, 978.0, 654.0, 416.0, 261.0, 209.0, 116.0, 88.0, 57.0, 41.0, 21.0, 19.0, 16.0, 10.0, 7.0, 8.0, 1.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.5, -8.2159423828125, -7.931884765625, -7.6478271484375, -7.36376953125, -7.0797119140625, -6.795654296875, -6.5115966796875, -6.2275390625, -5.9434814453125, -5.659423828125, -5.3753662109375, -5.09130859375, -4.8072509765625, -4.523193359375, -4.2391357421875, -3.955078125, -3.6710205078125, -3.386962890625, -3.1029052734375, -2.81884765625, -2.5347900390625, -2.250732421875, -1.9666748046875, -1.6826171875, -1.3985595703125, -1.114501953125, -0.8304443359375, -0.54638671875, -0.2623291015625, 0.021728515625, 0.3057861328125, 0.58984375, 0.8739013671875, 1.157958984375, 1.4420166015625, 1.72607421875, 2.0101318359375, 2.294189453125, 2.5782470703125, 2.8623046875, 3.1463623046875, 3.430419921875, 3.7144775390625, 3.99853515625, 4.2825927734375, 4.566650390625, 4.8507080078125, 5.134765625, 5.4188232421875, 5.702880859375, 5.9869384765625, 6.27099609375, 6.5550537109375, 6.839111328125, 7.1231689453125, 7.4072265625, 7.6912841796875, 7.975341796875, 8.2593994140625, 8.54345703125, 8.8275146484375, 9.111572265625, 9.3956298828125, 9.6796875]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 4.0, 10.0, 8.0, 10.0, 6.0, 18.0, 23.0, 28.0, 23.0, 49.0, 54.0, 49.0, 82.0, 90.0, 81.0, 90.0, 68.0, 85.0, 57.0, 47.0, 31.0, 23.0, 20.0, 8.0, 14.0, 8.0, 4.0, 3.0, 7.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0010890960693359375, -0.001062937080860138, -0.0010367780923843384, -0.0010106191039085388, -0.0009844601154327393, -0.0009583011269569397, -0.0009321421384811401, -0.0009059831500053406, -0.000879824161529541, -0.0008536651730537415, -0.0008275061845779419, -0.0008013471961021423, -0.0007751882076263428, -0.0007490292191505432, -0.0007228702306747437, -0.0006967112421989441, -0.0006705522537231445, -0.000644393265247345, -0.0006182342767715454, -0.0005920752882957458, -0.0005659162998199463, -0.0005397573113441467, -0.0005135983228683472, -0.0004874393343925476, -0.00046128034591674805, -0.0004351213574409485, -0.0004089623689651489, -0.00038280338048934937, -0.0003566443920135498, -0.00033048540353775024, -0.0003043264150619507, -0.0002781674265861511, -0.00025200843811035156, -0.000225849449634552, -0.00019969046115875244, -0.00017353147268295288, -0.00014737248420715332, -0.00012121349573135376, -9.50545072555542e-05, -6.889551877975464e-05, -4.273653030395508e-05, -1.6577541828155518e-05, 9.581446647644043e-06, 3.5740435123443604e-05, 6.189942359924316e-05, 8.805841207504272e-05, 0.00011421740055084229, 0.00014037638902664185, 0.0001665353775024414, 0.00019269436597824097, 0.00021885335445404053, 0.0002450123429298401, 0.00027117133140563965, 0.0002973303198814392, 0.00032348930835723877, 0.00034964829683303833, 0.0003758072853088379, 0.00040196627378463745, 0.000428125262260437, 0.00045428425073623657, 0.00048044323921203613, 0.0005066022276878357, 0.0005327612161636353, 0.0005589202046394348, 0.0005850791931152344]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 5.0, 14.0, 22.0, 18.0, 41.0, 67.0, 87.0, 116.0, 207.0, 335.0, 536.0, 826.0, 1241.0, 2039.0, 3355.0, 5399.0, 8793.0, 14640.0, 24744.0, 42429.0, 72384.0, 119859.0, 173297.0, 189904.0, 150367.0, 97256.0, 57374.0, 33343.0, 19633.0, 11671.0, 7044.0, 4266.0, 2701.0, 1696.0, 1034.0, 641.0, 415.0, 265.0, 165.0, 122.0, 73.0, 41.0, 28.0, 23.0, 11.0, 11.0, 4.0, 3.0, 3.0, 2.0, 3.0, 0.0, 2.0, 3.0], "bins": [-9.765625, -9.47216796875, -9.1787109375, -8.88525390625, -8.591796875, -8.29833984375, -8.0048828125, -7.71142578125, -7.41796875, -7.12451171875, -6.8310546875, -6.53759765625, -6.244140625, -5.95068359375, -5.6572265625, -5.36376953125, -5.0703125, -4.77685546875, -4.4833984375, -4.18994140625, -3.896484375, -3.60302734375, -3.3095703125, -3.01611328125, -2.72265625, -2.42919921875, -2.1357421875, -1.84228515625, -1.548828125, -1.25537109375, -0.9619140625, -0.66845703125, -0.375, -0.08154296875, 0.2119140625, 0.50537109375, 0.798828125, 1.09228515625, 1.3857421875, 1.67919921875, 1.97265625, 2.26611328125, 2.5595703125, 2.85302734375, 3.146484375, 3.43994140625, 3.7333984375, 4.02685546875, 4.3203125, 4.61376953125, 4.9072265625, 5.20068359375, 5.494140625, 5.78759765625, 6.0810546875, 6.37451171875, 6.66796875, 6.96142578125, 7.2548828125, 7.54833984375, 7.841796875, 8.13525390625, 8.4287109375, 8.72216796875, 9.015625]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 5.0, 3.0, 7.0, 5.0, 6.0, 14.0, 11.0, 15.0, 10.0, 17.0, 18.0, 24.0, 23.0, 26.0, 24.0, 28.0, 30.0, 47.0, 51.0, 57.0, 42.0, 45.0, 48.0, 42.0, 37.0, 35.0, 44.0, 31.0, 41.0, 31.0, 24.0, 24.0, 20.0, 18.0, 18.0, 11.0, 17.0, 12.0, 9.0, 5.0, 2.0, 8.0, 11.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-2.29296875, -2.22393798828125, -2.1549072265625, -2.08587646484375, -2.016845703125, -1.94781494140625, -1.8787841796875, -1.80975341796875, -1.74072265625, -1.67169189453125, -1.6026611328125, -1.53363037109375, -1.464599609375, -1.39556884765625, -1.3265380859375, -1.25750732421875, -1.1884765625, -1.11944580078125, -1.0504150390625, -0.98138427734375, -0.912353515625, -0.84332275390625, -0.7742919921875, -0.70526123046875, -0.63623046875, -0.56719970703125, -0.4981689453125, -0.42913818359375, -0.360107421875, -0.29107666015625, -0.2220458984375, -0.15301513671875, -0.083984375, -0.01495361328125, 0.0540771484375, 0.12310791015625, 0.192138671875, 0.26116943359375, 0.3302001953125, 0.39923095703125, 0.46826171875, 0.53729248046875, 0.6063232421875, 0.67535400390625, 0.744384765625, 0.81341552734375, 0.8824462890625, 0.95147705078125, 1.0205078125, 1.08953857421875, 1.1585693359375, 1.22760009765625, 1.296630859375, 1.36566162109375, 1.4346923828125, 1.50372314453125, 1.57275390625, 1.64178466796875, 1.7108154296875, 1.77984619140625, 1.848876953125, 1.91790771484375, 1.9869384765625, 2.05596923828125, 2.125]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 2.0, 8.0, 10.0, 12.0, 11.0, 11.0, 9.0, 19.0, 28.0, 34.0, 48.0, 55.0, 48.0, 64.0, 61.0, 92.0, 75.0, 60.0, 63.0, 62.0, 46.0, 44.0, 28.0, 19.0, 21.0, 13.0, 9.0, 14.0, 4.0, 13.0, 8.0, 6.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.70714569091797, -43.313541412353516, -41.91993713378906, -40.526329040527344, -39.13272476196289, -37.73912048339844, -36.345516204833984, -34.95191192626953, -33.55830383300781, -32.16469955444336, -30.771093368530273, -29.37748908996582, -27.983882904052734, -26.59027862548828, -25.196674346923828, -23.803068161010742, -22.40946388244629, -21.015859603881836, -19.62225341796875, -18.228649139404297, -16.83504295349121, -15.441438674926758, -14.047833442687988, -12.654228210449219, -11.26062297821045, -9.86701774597168, -8.47341251373291, -7.079807758331299, -5.686202526092529, -4.29259729385376, -2.8989925384521484, -1.505387306213379, -0.11178207397460938, 1.2818230390548706, 2.6754281520843506, 4.069033145904541, 5.4626383781433105, 6.85624361038208, 8.249848365783691, 9.643453598022461, 11.03705883026123, 12.4306640625, 13.82426929473877, 15.217874526977539, 16.611478805541992, 18.005084991455078, 19.39868927001953, 20.792293548583984, 22.18589973449707, 23.579504013061523, 24.97311019897461, 26.366714477539062, 27.76032066345215, 29.1539249420166, 30.547531127929688, 31.94113540649414, 33.334739685058594, 34.72834396362305, 36.1219482421875, 37.51555633544922, 38.90916061401367, 40.302764892578125, 41.69636917114258, 43.08997344970703, 44.48358154296875]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 1.0, 4.0, 3.0, 4.0, 5.0, 9.0, 9.0, 6.0, 11.0, 13.0, 11.0, 26.0, 15.0, 16.0, 22.0, 29.0, 39.0, 32.0, 36.0, 31.0, 40.0, 35.0, 46.0, 44.0, 48.0, 42.0, 41.0, 35.0, 48.0, 41.0, 35.0, 35.0, 28.0, 26.0, 28.0, 18.0, 17.0, 15.0, 7.0, 14.0, 11.0, 6.0, 5.0, 6.0, 5.0, 5.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-19.435171127319336, -18.831344604492188, -18.22751808166504, -17.62369155883789, -17.019865036010742, -16.416038513183594, -15.812211990356445, -15.208385467529297, -14.604558944702148, -14.000732421875, -13.396905899047852, -12.793079376220703, -12.189252853393555, -11.585426330566406, -10.981599807739258, -10.37777328491211, -9.773947715759277, -9.170121192932129, -8.56629467010498, -7.962468147277832, -7.358641624450684, -6.754815101623535, -6.150989055633545, -5.5471625328063965, -4.943336009979248, -4.3395094871521, -3.735682964324951, -3.131856679916382, -2.5280301570892334, -1.924203634262085, -1.3203773498535156, -0.7165508270263672, -0.11272430419921875, 0.4911021590232849, 1.0949286222457886, 1.6987550258636475, 2.302581548690796, 2.9064080715179443, 3.5102343559265137, 4.114060878753662, 4.7178874015808105, 5.321713924407959, 5.925540447235107, 6.529366493225098, 7.133193016052246, 7.7370195388793945, 8.340846061706543, 8.944672584533691, 9.54849910736084, 10.152325630187988, 10.756152153015137, 11.359978675842285, 11.963805198669434, 12.567631721496582, 13.171457290649414, 13.775283813476562, 14.379110336303711, 14.98293685913086, 15.586763381958008, 16.190589904785156, 16.794416427612305, 17.398242950439453, 18.0020694732666, 18.60589599609375, 19.2097225189209]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 4.0, 1.0, 1.0, 3.0, 8.0, 17.0, 14.0, 27.0, 50.0, 51.0, 90.0, 118.0, 193.0, 280.0, 473.0, 706.0, 1112.0, 1653.0, 2653.0, 4246.0, 6877.0, 11074.0, 17710.0, 28271.0, 43554.0, 66369.0, 95733.0, 124681.0, 143461.0, 139065.0, 115462.0, 84940.0, 57685.0, 37799.0, 23874.0, 15018.0, 9376.0, 5728.0, 3767.0, 2324.0, 1427.0, 941.0, 604.0, 388.0, 246.0, 155.0, 97.0, 92.0, 56.0, 31.0, 23.0, 17.0, 11.0, 6.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.34375, -20.628173828125, -19.91259765625, -19.197021484375, -18.4814453125, -17.765869140625, -17.05029296875, -16.334716796875, -15.619140625, -14.903564453125, -14.18798828125, -13.472412109375, -12.7568359375, -12.041259765625, -11.32568359375, -10.610107421875, -9.89453125, -9.178955078125, -8.46337890625, -7.747802734375, -7.0322265625, -6.316650390625, -5.60107421875, -4.885498046875, -4.169921875, -3.454345703125, -2.73876953125, -2.023193359375, -1.3076171875, -0.592041015625, 0.12353515625, 0.839111328125, 1.5546875, 2.270263671875, 2.98583984375, 3.701416015625, 4.4169921875, 5.132568359375, 5.84814453125, 6.563720703125, 7.279296875, 7.994873046875, 8.71044921875, 9.426025390625, 10.1416015625, 10.857177734375, 11.57275390625, 12.288330078125, 13.00390625, 13.719482421875, 14.43505859375, 15.150634765625, 15.8662109375, 16.581787109375, 17.29736328125, 18.012939453125, 18.728515625, 19.444091796875, 20.15966796875, 20.875244140625, 21.5908203125, 22.306396484375, 23.02197265625, 23.737548828125, 24.453125]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 1.0, 1.0, 11.0, 8.0, 10.0, 13.0, 14.0, 11.0, 18.0, 29.0, 23.0, 31.0, 34.0, 25.0, 31.0, 35.0, 42.0, 40.0, 42.0, 65.0, 46.0, 43.0, 37.0, 42.0, 39.0, 48.0, 41.0, 27.0, 25.0, 38.0, 17.0, 17.0, 14.0, 10.0, 18.0, 13.0, 12.0, 12.0, 4.0, 2.0, 8.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-23.875, -23.161865234375, -22.44873046875, -21.735595703125, -21.0224609375, -20.309326171875, -19.59619140625, -18.883056640625, -18.169921875, -17.456787109375, -16.74365234375, -16.030517578125, -15.3173828125, -14.604248046875, -13.89111328125, -13.177978515625, -12.46484375, -11.751708984375, -11.03857421875, -10.325439453125, -9.6123046875, -8.899169921875, -8.18603515625, -7.472900390625, -6.759765625, -6.046630859375, -5.33349609375, -4.620361328125, -3.9072265625, -3.194091796875, -2.48095703125, -1.767822265625, -1.0546875, -0.341552734375, 0.37158203125, 1.084716796875, 1.7978515625, 2.510986328125, 3.22412109375, 3.937255859375, 4.650390625, 5.363525390625, 6.07666015625, 6.789794921875, 7.5029296875, 8.216064453125, 8.92919921875, 9.642333984375, 10.35546875, 11.068603515625, 11.78173828125, 12.494873046875, 13.2080078125, 13.921142578125, 14.63427734375, 15.347412109375, 16.060546875, 16.773681640625, 17.48681640625, 18.199951171875, 18.9130859375, 19.626220703125, 20.33935546875, 21.052490234375, 21.765625]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 5.0, 5.0, 4.0, 4.0, 14.0, 13.0, 28.0, 33.0, 43.0, 93.0, 115.0, 158.0, 283.0, 392.0, 610.0, 955.0, 1517.0, 2406.0, 3886.0, 6120.0, 9550.0, 14720.0, 22577.0, 34967.0, 51612.0, 74038.0, 100231.0, 124486.0, 135388.0, 125727.0, 103497.0, 77112.0, 54242.0, 36407.0, 24107.0, 15633.0, 10110.0, 6361.0, 4095.0, 2548.0, 1573.0, 1000.0, 665.0, 432.0, 281.0, 176.0, 100.0, 83.0, 51.0, 35.0, 20.0, 16.0, 18.0, 7.0, 2.0, 10.0, 4.0, 1.0, 4.0, 2.0], "bins": [-23.609375, -22.88427734375, -22.1591796875, -21.43408203125, -20.708984375, -19.98388671875, -19.2587890625, -18.53369140625, -17.80859375, -17.08349609375, -16.3583984375, -15.63330078125, -14.908203125, -14.18310546875, -13.4580078125, -12.73291015625, -12.0078125, -11.28271484375, -10.5576171875, -9.83251953125, -9.107421875, -8.38232421875, -7.6572265625, -6.93212890625, -6.20703125, -5.48193359375, -4.7568359375, -4.03173828125, -3.306640625, -2.58154296875, -1.8564453125, -1.13134765625, -0.40625, 0.31884765625, 1.0439453125, 1.76904296875, 2.494140625, 3.21923828125, 3.9443359375, 4.66943359375, 5.39453125, 6.11962890625, 6.8447265625, 7.56982421875, 8.294921875, 9.02001953125, 9.7451171875, 10.47021484375, 11.1953125, 11.92041015625, 12.6455078125, 13.37060546875, 14.095703125, 14.82080078125, 15.5458984375, 16.27099609375, 16.99609375, 17.72119140625, 18.4462890625, 19.17138671875, 19.896484375, 20.62158203125, 21.3466796875, 22.07177734375, 22.796875]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 2.0, 2.0, 5.0, 4.0, 2.0, 3.0, 10.0, 11.0, 9.0, 9.0, 12.0, 13.0, 14.0, 19.0, 22.0, 24.0, 21.0, 27.0, 28.0, 30.0, 38.0, 33.0, 36.0, 33.0, 36.0, 42.0, 32.0, 36.0, 31.0, 30.0, 32.0, 43.0, 33.0, 36.0, 27.0, 22.0, 32.0, 18.0, 23.0, 15.0, 19.0, 18.0, 16.0, 15.0, 7.0, 9.0, 5.0, 0.0, 5.0, 7.0, 5.0, 5.0, 1.0, 4.0, 1.0, 2.0, 3.0], "bins": [-13.078125, -12.689453125, -12.30078125, -11.912109375, -11.5234375, -11.134765625, -10.74609375, -10.357421875, -9.96875, -9.580078125, -9.19140625, -8.802734375, -8.4140625, -8.025390625, -7.63671875, -7.248046875, -6.859375, -6.470703125, -6.08203125, -5.693359375, -5.3046875, -4.916015625, -4.52734375, -4.138671875, -3.75, -3.361328125, -2.97265625, -2.583984375, -2.1953125, -1.806640625, -1.41796875, -1.029296875, -0.640625, -0.251953125, 0.13671875, 0.525390625, 0.9140625, 1.302734375, 1.69140625, 2.080078125, 2.46875, 2.857421875, 3.24609375, 3.634765625, 4.0234375, 4.412109375, 4.80078125, 5.189453125, 5.578125, 5.966796875, 6.35546875, 6.744140625, 7.1328125, 7.521484375, 7.91015625, 8.298828125, 8.6875, 9.076171875, 9.46484375, 9.853515625, 10.2421875, 10.630859375, 11.01953125, 11.408203125, 11.796875]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 9.0, 10.0, 9.0, 14.0, 16.0, 24.0, 43.0, 53.0, 88.0, 125.0, 189.0, 315.0, 417.0, 710.0, 1081.0, 1753.0, 3012.0, 4774.0, 8088.0, 14016.0, 24863.0, 44343.0, 79219.0, 136989.0, 208511.0, 206602.0, 133737.0, 77602.0, 43713.0, 24213.0, 13710.0, 7956.0, 4612.0, 2811.0, 1736.0, 1082.0, 755.0, 467.0, 296.0, 211.0, 140.0, 90.0, 59.0, 49.0, 15.0, 9.0, 11.0, 4.0, 5.0, 5.0, 2.0, 1.0, 0.0, 3.0], "bins": [-22.375, -21.7353515625, -21.095703125, -20.4560546875, -19.81640625, -19.1767578125, -18.537109375, -17.8974609375, -17.2578125, -16.6181640625, -15.978515625, -15.3388671875, -14.69921875, -14.0595703125, -13.419921875, -12.7802734375, -12.140625, -11.5009765625, -10.861328125, -10.2216796875, -9.58203125, -8.9423828125, -8.302734375, -7.6630859375, -7.0234375, -6.3837890625, -5.744140625, -5.1044921875, -4.46484375, -3.8251953125, -3.185546875, -2.5458984375, -1.90625, -1.2666015625, -0.626953125, 0.0126953125, 0.65234375, 1.2919921875, 1.931640625, 2.5712890625, 3.2109375, 3.8505859375, 4.490234375, 5.1298828125, 5.76953125, 6.4091796875, 7.048828125, 7.6884765625, 8.328125, 8.9677734375, 9.607421875, 10.2470703125, 10.88671875, 11.5263671875, 12.166015625, 12.8056640625, 13.4453125, 14.0849609375, 14.724609375, 15.3642578125, 16.00390625, 16.6435546875, 17.283203125, 17.9228515625, 18.5625]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 7.0, 3.0, 8.0, 9.0, 10.0, 17.0, 12.0, 22.0, 30.0, 37.0, 45.0, 73.0, 78.0, 77.0, 89.0, 79.0, 67.0, 63.0, 58.0, 44.0, 40.0, 38.0, 15.0, 21.0, 13.0, 6.0, 6.0, 12.0, 4.0, 6.0, 4.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0023136138916015625, -0.0022360682487487793, -0.002158522605895996, -0.002080976963043213, -0.0020034313201904297, -0.0019258856773376465, -0.0018483400344848633, -0.00177079439163208, -0.0016932487487792969, -0.0016157031059265137, -0.0015381574630737305, -0.0014606118202209473, -0.001383066177368164, -0.0013055205345153809, -0.0012279748916625977, -0.0011504292488098145, -0.0010728836059570312, -0.000995337963104248, -0.0009177923202514648, -0.0008402466773986816, -0.0007627010345458984, -0.0006851553916931152, -0.000607609748840332, -0.0005300641059875488, -0.0004525184631347656, -0.0003749728202819824, -0.0002974271774291992, -0.00021988153457641602, -0.0001423358917236328, -6.479024887084961e-05, 1.2755393981933594e-05, 9.03010368347168e-05, 0.0001678466796875, 0.0002453923225402832, 0.0003229379653930664, 0.0004004836082458496, 0.0004780292510986328, 0.000555574893951416, 0.0006331205368041992, 0.0007106661796569824, 0.0007882118225097656, 0.0008657574653625488, 0.000943303108215332, 0.0010208487510681152, 0.0010983943939208984, 0.0011759400367736816, 0.0012534856796264648, 0.001331031322479248, 0.0014085769653320312, 0.0014861226081848145, 0.0015636682510375977, 0.0016412138938903809, 0.001718759536743164, 0.0017963051795959473, 0.0018738508224487305, 0.0019513964653015137, 0.002028942108154297, 0.00210648775100708, 0.0021840333938598633, 0.0022615790367126465, 0.0023391246795654297, 0.002416670322418213, 0.002494215965270996, 0.0025717616081237793, 0.0026493072509765625]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 5.0, 11.0, 7.0, 14.0, 11.0, 22.0, 36.0, 47.0, 81.0, 104.0, 150.0, 216.0, 305.0, 491.0, 767.0, 1189.0, 1848.0, 2858.0, 4484.0, 7288.0, 11952.0, 19677.0, 33278.0, 56142.0, 95757.0, 152513.0, 198836.0, 174488.0, 114616.0, 68687.0, 40791.0, 23729.0, 14259.0, 8698.0, 5473.0, 3451.0, 2135.0, 1388.0, 924.0, 591.0, 428.0, 261.0, 189.0, 118.0, 74.0, 54.0, 35.0, 32.0, 19.0, 8.0, 10.0, 2.0, 7.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-19.171875, -18.547119140625, -17.92236328125, -17.297607421875, -16.6728515625, -16.048095703125, -15.42333984375, -14.798583984375, -14.173828125, -13.549072265625, -12.92431640625, -12.299560546875, -11.6748046875, -11.050048828125, -10.42529296875, -9.800537109375, -9.17578125, -8.551025390625, -7.92626953125, -7.301513671875, -6.6767578125, -6.052001953125, -5.42724609375, -4.802490234375, -4.177734375, -3.552978515625, -2.92822265625, -2.303466796875, -1.6787109375, -1.053955078125, -0.42919921875, 0.195556640625, 0.8203125, 1.445068359375, 2.06982421875, 2.694580078125, 3.3193359375, 3.944091796875, 4.56884765625, 5.193603515625, 5.818359375, 6.443115234375, 7.06787109375, 7.692626953125, 8.3173828125, 8.942138671875, 9.56689453125, 10.191650390625, 10.81640625, 11.441162109375, 12.06591796875, 12.690673828125, 13.3154296875, 13.940185546875, 14.56494140625, 15.189697265625, 15.814453125, 16.439208984375, 17.06396484375, 17.688720703125, 18.3134765625, 18.938232421875, 19.56298828125, 20.187744140625, 20.8125]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 5.0, 5.0, 13.0, 8.0, 8.0, 10.0, 17.0, 18.0, 23.0, 28.0, 35.0, 38.0, 41.0, 55.0, 55.0, 55.0, 48.0, 51.0, 56.0, 52.0, 54.0, 52.0, 52.0, 34.0, 35.0, 19.0, 23.0, 27.0, 14.0, 15.0, 12.0, 7.0, 16.0, 8.0, 3.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.25, -5.059326171875, -4.86865234375, -4.677978515625, -4.4873046875, -4.296630859375, -4.10595703125, -3.915283203125, -3.724609375, -3.533935546875, -3.34326171875, -3.152587890625, -2.9619140625, -2.771240234375, -2.58056640625, -2.389892578125, -2.19921875, -2.008544921875, -1.81787109375, -1.627197265625, -1.4365234375, -1.245849609375, -1.05517578125, -0.864501953125, -0.673828125, -0.483154296875, -0.29248046875, -0.101806640625, 0.0888671875, 0.279541015625, 0.47021484375, 0.660888671875, 0.8515625, 1.042236328125, 1.23291015625, 1.423583984375, 1.6142578125, 1.804931640625, 1.99560546875, 2.186279296875, 2.376953125, 2.567626953125, 2.75830078125, 2.948974609375, 3.1396484375, 3.330322265625, 3.52099609375, 3.711669921875, 3.90234375, 4.093017578125, 4.28369140625, 4.474365234375, 4.6650390625, 4.855712890625, 5.04638671875, 5.237060546875, 5.427734375, 5.618408203125, 5.80908203125, 5.999755859375, 6.1904296875, 6.381103515625, 6.57177734375, 6.762451171875, 6.953125]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 1.0, 4.0, 3.0, 4.0, 7.0, 5.0, 13.0, 9.0, 22.0, 15.0, 27.0, 32.0, 45.0, 41.0, 39.0, 46.0, 65.0, 66.0, 64.0, 50.0, 68.0, 58.0, 39.0, 49.0, 50.0, 30.0, 22.0, 25.0, 22.0, 19.0, 19.0, 10.0, 7.0, 3.0, 4.0, 5.0, 5.0, 1.0, 4.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-43.08380126953125, -41.820255279541016, -40.55670928955078, -39.29316329956055, -38.02961730957031, -36.76606750488281, -35.50252151489258, -34.238975524902344, -32.97542953491211, -31.711883544921875, -30.44833755493164, -29.184789657592773, -27.92124366760254, -26.657697677612305, -25.394149780273438, -24.130603790283203, -22.86705780029297, -21.603511810302734, -20.3399658203125, -19.076417922973633, -17.8128719329834, -16.549325942993164, -15.285778999328613, -14.022232055664062, -12.758686065673828, -11.495140075683594, -10.231593132019043, -8.968046188354492, -7.704500198364258, -6.440953731536865, -5.177407264709473, -3.913860321044922, -2.650310516357422, -1.3867640495300293, -0.12321758270263672, 1.1403288841247559, 2.4038753509521484, 3.667421817779541, 4.930968284606934, 6.194515228271484, 7.458061218261719, 8.721607208251953, 9.985154151916504, 11.248701095581055, 12.512247085571289, 13.775793075561523, 15.039340019226074, 16.302886962890625, 17.56643295288086, 18.829978942871094, 20.093524932861328, 21.357072830200195, 22.62061882019043, 23.884164810180664, 25.14771270751953, 26.411258697509766, 27.6748046875, 28.938350677490234, 30.20189666748047, 31.465444564819336, 32.72898864746094, 33.99253845214844, 35.25608444213867, 36.519630432128906, 37.78317642211914]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 7.0, 3.0, 5.0, 10.0, 9.0, 17.0, 9.0, 12.0, 23.0, 21.0, 20.0, 22.0, 31.0, 26.0, 28.0, 30.0, 28.0, 35.0, 31.0, 42.0, 30.0, 38.0, 48.0, 42.0, 34.0, 43.0, 40.0, 28.0, 36.0, 28.0, 29.0, 27.0, 23.0, 23.0, 17.0, 12.0, 20.0, 11.0, 15.0, 11.0, 12.0, 7.0, 6.0, 5.0, 4.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.468355178833008, -17.85744285583496, -17.246530532836914, -16.635618209838867, -16.02470588684082, -15.413792610168457, -14.80288028717041, -14.191967010498047, -13.5810546875, -12.970142364501953, -12.359230041503906, -11.74831771850586, -11.137404441833496, -10.52649211883545, -9.915579795837402, -9.304666519165039, -8.693755149841309, -8.082842826843262, -7.471930027008057, -6.86101770401001, -6.250104904174805, -5.639192581176758, -5.028280258178711, -4.417367458343506, -3.806455135345459, -3.195542573928833, -2.584630012512207, -1.9737176895141602, -1.3628051280975342, -0.7518925666809082, -0.14098024368286133, 0.46993255615234375, 1.0808448791503906, 1.6917574405670166, 2.3026700019836426, 2.9135823249816895, 3.5244948863983154, 4.135407447814941, 4.746319770812988, 5.357232570648193, 5.96814489364624, 6.579057216644287, 7.189970016479492, 7.800882339477539, 8.411794662475586, 9.022706985473633, 9.63361930847168, 10.244532585144043, 10.85544490814209, 11.466357231140137, 12.077269554138184, 12.688182830810547, 13.299095153808594, 13.91000747680664, 14.520919799804688, 15.131832122802734, 15.742744445800781, 16.353656768798828, 16.964569091796875, 17.575481414794922, 18.18639373779297, 18.797306060791016, 19.408218383789062, 20.019132614135742, 20.63004493713379]}, "gradients/decoder.bert.encoder.layer.1.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 7.0, 8.0, 6.0, 8.0, 12.0, 21.0, 32.0, 54.0, 75.0, 93.0, 172.0, 235.0, 333.0, 488.0, 763.0, 1169.0, 1918.0, 2862.0, 4614.0, 7404.0, 12280.0, 21128.0, 37721.0, 69967.0, 136537.0, 282396.0, 590653.0, 1001840.0, 950315.0, 532218.0, 256779.0, 127270.0, 66374.0, 35957.0, 20584.0, 11912.0, 7260.0, 4539.0, 2979.0, 1829.0, 1184.0, 760.0, 518.0, 354.0, 236.0, 155.0, 98.0, 55.0, 39.0, 34.0, 13.0, 19.0, 7.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-41.90625, -40.59375, -39.28125, -37.96875, -36.65625, -35.34375, -34.03125, -32.71875, -31.40625, -30.09375, -28.78125, -27.46875, -26.15625, -24.84375, -23.53125, -22.21875, -20.90625, -19.59375, -18.28125, -16.96875, -15.65625, -14.34375, -13.03125, -11.71875, -10.40625, -9.09375, -7.78125, -6.46875, -5.15625, -3.84375, -2.53125, -1.21875, 0.09375, 1.40625, 2.71875, 4.03125, 5.34375, 6.65625, 7.96875, 9.28125, 10.59375, 11.90625, 13.21875, 14.53125, 15.84375, 17.15625, 18.46875, 19.78125, 21.09375, 22.40625, 23.71875, 25.03125, 26.34375, 27.65625, 28.96875, 30.28125, 31.59375, 32.90625, 34.21875, 35.53125, 36.84375, 38.15625, 39.46875, 40.78125, 42.09375]}, "gradients/decoder.bert.encoder.layer.1.output.dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 3.0, 1.0, 6.0, 6.0, 4.0, 8.0, 7.0, 8.0, 14.0, 8.0, 15.0, 23.0, 16.0, 14.0, 34.0, 31.0, 19.0, 37.0, 26.0, 40.0, 36.0, 24.0, 26.0, 45.0, 35.0, 41.0, 36.0, 31.0, 52.0, 47.0, 31.0, 33.0, 38.0, 26.0, 26.0, 20.0, 20.0, 21.0, 12.0, 12.0, 14.0, 17.0, 14.0, 5.0, 7.0, 3.0, 2.0, 3.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-18.28125, -17.7041015625, -17.126953125, -16.5498046875, -15.97265625, -15.3955078125, -14.818359375, -14.2412109375, -13.6640625, -13.0869140625, -12.509765625, -11.9326171875, -11.35546875, -10.7783203125, -10.201171875, -9.6240234375, -9.046875, -8.4697265625, -7.892578125, -7.3154296875, -6.73828125, -6.1611328125, -5.583984375, -5.0068359375, -4.4296875, -3.8525390625, -3.275390625, -2.6982421875, -2.12109375, -1.5439453125, -0.966796875, -0.3896484375, 0.1875, 0.7646484375, 1.341796875, 1.9189453125, 2.49609375, 3.0732421875, 3.650390625, 4.2275390625, 4.8046875, 5.3818359375, 5.958984375, 6.5361328125, 7.11328125, 7.6904296875, 8.267578125, 8.8447265625, 9.421875, 9.9990234375, 10.576171875, 11.1533203125, 11.73046875, 12.3076171875, 12.884765625, 13.4619140625, 14.0390625, 14.6162109375, 15.193359375, 15.7705078125, 16.34765625, 16.9248046875, 17.501953125, 18.0791015625, 18.65625]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 5.0, 10.0, 11.0, 9.0, 25.0, 26.0, 35.0, 59.0, 77.0, 102.0, 163.0, 242.0, 302.0, 520.0, 673.0, 995.0, 1495.0, 2145.0, 3416.0, 5336.0, 8252.0, 13418.0, 22692.0, 38614.0, 68958.0, 127282.0, 244231.0, 480860.0, 853872.0, 982046.0, 631984.0, 326818.0, 166949.0, 89392.0, 49252.0, 28424.0, 16527.0, 10248.0, 6538.0, 4090.0, 2737.0, 1771.0, 1147.0, 744.0, 565.0, 374.0, 244.0, 193.0, 128.0, 80.0, 71.0, 52.0, 29.0, 17.0, 18.0, 15.0, 8.0, 6.0, 3.0, 3.0, 1.0], "bins": [-53.96875, -52.29345703125, -50.6181640625, -48.94287109375, -47.267578125, -45.59228515625, -43.9169921875, -42.24169921875, -40.56640625, -38.89111328125, -37.2158203125, -35.54052734375, -33.865234375, -32.18994140625, -30.5146484375, -28.83935546875, -27.1640625, -25.48876953125, -23.8134765625, -22.13818359375, -20.462890625, -18.78759765625, -17.1123046875, -15.43701171875, -13.76171875, -12.08642578125, -10.4111328125, -8.73583984375, -7.060546875, -5.38525390625, -3.7099609375, -2.03466796875, -0.359375, 1.31591796875, 2.9912109375, 4.66650390625, 6.341796875, 8.01708984375, 9.6923828125, 11.36767578125, 13.04296875, 14.71826171875, 16.3935546875, 18.06884765625, 19.744140625, 21.41943359375, 23.0947265625, 24.77001953125, 26.4453125, 28.12060546875, 29.7958984375, 31.47119140625, 33.146484375, 34.82177734375, 36.4970703125, 38.17236328125, 39.84765625, 41.52294921875, 43.1982421875, 44.87353515625, 46.548828125, 48.22412109375, 49.8994140625, 51.57470703125, 53.25]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 7.0, 6.0, 9.0, 12.0, 18.0, 20.0, 25.0, 59.0, 51.0, 91.0, 102.0, 132.0, 146.0, 192.0, 286.0, 311.0, 309.0, 321.0, 328.0, 288.0, 233.0, 250.0, 182.0, 149.0, 124.0, 98.0, 78.0, 55.0, 45.0, 37.0, 21.0, 17.0, 15.0, 14.0, 12.0, 13.0, 3.0, 6.0, 1.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-17.625, -17.07275390625, -16.5205078125, -15.96826171875, -15.416015625, -14.86376953125, -14.3115234375, -13.75927734375, -13.20703125, -12.65478515625, -12.1025390625, -11.55029296875, -10.998046875, -10.44580078125, -9.8935546875, -9.34130859375, -8.7890625, -8.23681640625, -7.6845703125, -7.13232421875, -6.580078125, -6.02783203125, -5.4755859375, -4.92333984375, -4.37109375, -3.81884765625, -3.2666015625, -2.71435546875, -2.162109375, -1.60986328125, -1.0576171875, -0.50537109375, 0.046875, 0.59912109375, 1.1513671875, 1.70361328125, 2.255859375, 2.80810546875, 3.3603515625, 3.91259765625, 4.46484375, 5.01708984375, 5.5693359375, 6.12158203125, 6.673828125, 7.22607421875, 7.7783203125, 8.33056640625, 8.8828125, 9.43505859375, 9.9873046875, 10.53955078125, 11.091796875, 11.64404296875, 12.1962890625, 12.74853515625, 13.30078125, 13.85302734375, 14.4052734375, 14.95751953125, 15.509765625, 16.06201171875, 16.6142578125, 17.16650390625, 17.71875]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 2.0, 8.0, 6.0, 5.0, 11.0, 15.0, 9.0, 17.0, 18.0, 29.0, 25.0, 41.0, 61.0, 50.0, 47.0, 64.0, 69.0, 77.0, 58.0, 78.0, 55.0, 54.0, 35.0, 33.0, 27.0, 21.0, 20.0, 18.0, 14.0, 9.0, 5.0, 7.0, 2.0, 1.0, 1.0, 6.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-57.71512985229492, -55.800018310546875, -53.88490676879883, -51.96979522705078, -50.0546875, -48.13957214355469, -46.224464416503906, -44.30935287475586, -42.39424133300781, -40.479129791259766, -38.56401824951172, -36.64890670776367, -34.733795166015625, -32.818687438964844, -30.903575897216797, -28.98846435546875, -27.073352813720703, -25.158241271972656, -23.24312973022461, -21.328020095825195, -19.41290855407715, -17.4977970123291, -15.582686424255371, -13.66757583618164, -11.752464294433594, -9.837352752685547, -7.922242164611816, -6.007131099700928, -4.092020034790039, -2.176908493041992, -0.2617979049682617, 1.6533126831054688, 3.5684280395507812, 5.48353910446167, 7.398650169372559, 9.313760757446289, 11.228872299194336, 13.143983840942383, 15.059094429016113, 16.974205017089844, 18.88931655883789, 20.804428100585938, 22.719539642333984, 24.6346492767334, 26.549760818481445, 28.464872360229492, 30.379981994628906, 32.29509353637695, 34.210205078125, 36.12531661987305, 38.040428161621094, 39.95553970336914, 41.87065124511719, 43.78575897216797, 45.700870513916016, 47.61598205566406, 49.53109359741211, 51.446205139160156, 53.3613166809082, 55.27642822265625, 57.19153594970703, 59.106651306152344, 61.021759033203125, 62.93687057495117, 64.85198211669922]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 7.0, 5.0, 5.0, 15.0, 10.0, 19.0, 22.0, 26.0, 14.0, 22.0, 33.0, 41.0, 26.0, 41.0, 41.0, 48.0, 45.0, 47.0, 39.0, 46.0, 53.0, 27.0, 39.0, 43.0, 35.0, 38.0, 33.0, 22.0, 26.0, 25.0, 25.0, 15.0, 8.0, 9.0, 11.0, 8.0, 10.0, 6.0, 3.0, 4.0, 2.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.67736053466797, -28.741315841674805, -27.80527114868164, -26.869226455688477, -25.933181762695312, -24.997135162353516, -24.06109046936035, -23.125045776367188, -22.189001083374023, -21.25295639038086, -20.316911697387695, -19.38086700439453, -18.444820404052734, -17.508777618408203, -16.572731018066406, -15.636686325073242, -14.700641632080078, -13.764596939086914, -12.82855224609375, -11.89250659942627, -10.956461906433105, -10.020417213439941, -9.084371566772461, -8.148326873779297, -7.212282180786133, -6.276237487792969, -5.3401923179626465, -4.404147148132324, -3.46810245513916, -2.532057762145996, -1.5960125923156738, -0.6599674224853516, 0.2760772705078125, 1.2121222019195557, 2.148167133331299, 3.084212064743042, 4.020256996154785, 4.956301689147949, 5.8923468589782715, 6.828392028808594, 7.764436721801758, 8.700481414794922, 9.636526107788086, 10.572571754455566, 11.50861644744873, 12.444661140441895, 13.380706787109375, 14.316751480102539, 15.252796173095703, 16.188840866088867, 17.12488555908203, 18.060930252075195, 18.99697494506836, 19.933021545410156, 20.86906623840332, 21.805110931396484, 22.74115562438965, 23.677200317382812, 24.613245010375977, 25.54928970336914, 26.485336303710938, 27.42137908935547, 28.357425689697266, 29.29347038269043, 30.229515075683594]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 2.0, 7.0, 7.0, 9.0, 10.0, 10.0, 23.0, 46.0, 37.0, 60.0, 79.0, 115.0, 200.0, 317.0, 462.0, 747.0, 1275.0, 2083.0, 3596.0, 6684.0, 12752.0, 24701.0, 51566.0, 107161.0, 201498.0, 259158.0, 185653.0, 96170.0, 46027.0, 22412.0, 11288.0, 6020.0, 3291.0, 1992.0, 1114.0, 682.0, 410.0, 283.0, 162.0, 139.0, 90.0, 52.0, 45.0, 26.0, 34.0, 18.0, 19.0, 4.0, 11.0, 6.0, 2.0, 2.0, 3.0, 4.0], "bins": [-38.5625, -37.473876953125, -36.38525390625, -35.296630859375, -34.2080078125, -33.119384765625, -32.03076171875, -30.942138671875, -29.853515625, -28.764892578125, -27.67626953125, -26.587646484375, -25.4990234375, -24.410400390625, -23.32177734375, -22.233154296875, -21.14453125, -20.055908203125, -18.96728515625, -17.878662109375, -16.7900390625, -15.701416015625, -14.61279296875, -13.524169921875, -12.435546875, -11.346923828125, -10.25830078125, -9.169677734375, -8.0810546875, -6.992431640625, -5.90380859375, -4.815185546875, -3.7265625, -2.637939453125, -1.54931640625, -0.460693359375, 0.6279296875, 1.716552734375, 2.80517578125, 3.893798828125, 4.982421875, 6.071044921875, 7.15966796875, 8.248291015625, 9.3369140625, 10.425537109375, 11.51416015625, 12.602783203125, 13.69140625, 14.780029296875, 15.86865234375, 16.957275390625, 18.0458984375, 19.134521484375, 20.22314453125, 21.311767578125, 22.400390625, 23.489013671875, 24.57763671875, 25.666259765625, 26.7548828125, 27.843505859375, 28.93212890625, 30.020751953125, 31.109375]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 5.0, 3.0, 8.0, 6.0, 9.0, 15.0, 15.0, 13.0, 26.0, 32.0, 28.0, 35.0, 26.0, 40.0, 53.0, 63.0, 51.0, 64.0, 56.0, 49.0, 48.0, 56.0, 52.0, 36.0, 33.0, 44.0, 25.0, 18.0, 18.0, 20.0, 13.0, 13.0, 9.0, 7.0, 2.0, 6.0, 3.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.46875, -39.20703125, -37.9453125, -36.68359375, -35.421875, -34.16015625, -32.8984375, -31.63671875, -30.375, -29.11328125, -27.8515625, -26.58984375, -25.328125, -24.06640625, -22.8046875, -21.54296875, -20.28125, -19.01953125, -17.7578125, -16.49609375, -15.234375, -13.97265625, -12.7109375, -11.44921875, -10.1875, -8.92578125, -7.6640625, -6.40234375, -5.140625, -3.87890625, -2.6171875, -1.35546875, -0.09375, 1.16796875, 2.4296875, 3.69140625, 4.953125, 6.21484375, 7.4765625, 8.73828125, 10.0, 11.26171875, 12.5234375, 13.78515625, 15.046875, 16.30859375, 17.5703125, 18.83203125, 20.09375, 21.35546875, 22.6171875, 23.87890625, 25.140625, 26.40234375, 27.6640625, 28.92578125, 30.1875, 31.44921875, 32.7109375, 33.97265625, 35.234375, 36.49609375, 37.7578125, 39.01953125, 40.28125]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 0.0, 6.0, 5.0, 8.0, 9.0, 23.0, 39.0, 39.0, 71.0, 80.0, 112.0, 186.0, 258.0, 378.0, 536.0, 827.0, 1233.0, 1871.0, 3018.0, 5083.0, 9185.0, 17091.0, 35353.0, 76162.0, 166436.0, 284794.0, 228921.0, 111931.0, 50897.0, 24129.0, 12272.0, 6581.0, 3947.0, 2362.0, 1541.0, 999.0, 680.0, 475.0, 307.0, 203.0, 174.0, 107.0, 82.0, 39.0, 39.0, 30.0, 14.0, 13.0, 7.0, 6.0, 2.0, 1.0, 0.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.34375, -35.0791015625, -33.814453125, -32.5498046875, -31.28515625, -30.0205078125, -28.755859375, -27.4912109375, -26.2265625, -24.9619140625, -23.697265625, -22.4326171875, -21.16796875, -19.9033203125, -18.638671875, -17.3740234375, -16.109375, -14.8447265625, -13.580078125, -12.3154296875, -11.05078125, -9.7861328125, -8.521484375, -7.2568359375, -5.9921875, -4.7275390625, -3.462890625, -2.1982421875, -0.93359375, 0.3310546875, 1.595703125, 2.8603515625, 4.125, 5.3896484375, 6.654296875, 7.9189453125, 9.18359375, 10.4482421875, 11.712890625, 12.9775390625, 14.2421875, 15.5068359375, 16.771484375, 18.0361328125, 19.30078125, 20.5654296875, 21.830078125, 23.0947265625, 24.359375, 25.6240234375, 26.888671875, 28.1533203125, 29.41796875, 30.6826171875, 31.947265625, 33.2119140625, 34.4765625, 35.7412109375, 37.005859375, 38.2705078125, 39.53515625, 40.7998046875, 42.064453125, 43.3291015625, 44.59375]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 2.0, 7.0, 4.0, 10.0, 10.0, 11.0, 9.0, 19.0, 12.0, 18.0, 23.0, 25.0, 29.0, 28.0, 35.0, 32.0, 53.0, 44.0, 37.0, 42.0, 31.0, 39.0, 43.0, 49.0, 39.0, 43.0, 49.0, 39.0, 31.0, 26.0, 32.0, 28.0, 24.0, 16.0, 6.0, 11.0, 11.0, 12.0, 7.0, 7.0, 4.0, 1.0, 6.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.328125, -16.72265625, -16.1171875, -15.51171875, -14.90625, -14.30078125, -13.6953125, -13.08984375, -12.484375, -11.87890625, -11.2734375, -10.66796875, -10.0625, -9.45703125, -8.8515625, -8.24609375, -7.640625, -7.03515625, -6.4296875, -5.82421875, -5.21875, -4.61328125, -4.0078125, -3.40234375, -2.796875, -2.19140625, -1.5859375, -0.98046875, -0.375, 0.23046875, 0.8359375, 1.44140625, 2.046875, 2.65234375, 3.2578125, 3.86328125, 4.46875, 5.07421875, 5.6796875, 6.28515625, 6.890625, 7.49609375, 8.1015625, 8.70703125, 9.3125, 9.91796875, 10.5234375, 11.12890625, 11.734375, 12.33984375, 12.9453125, 13.55078125, 14.15625, 14.76171875, 15.3671875, 15.97265625, 16.578125, 17.18359375, 17.7890625, 18.39453125, 19.0, 19.60546875, 20.2109375, 20.81640625, 21.421875]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 5.0, 4.0, 2.0, 10.0, 11.0, 15.0, 29.0, 42.0, 56.0, 85.0, 135.0, 242.0, 356.0, 546.0, 902.0, 1585.0, 2711.0, 4909.0, 8827.0, 16014.0, 30717.0, 59821.0, 120098.0, 233612.0, 266382.0, 148419.0, 73170.0, 36775.0, 19175.0, 10417.0, 5702.0, 3086.0, 1821.0, 1102.0, 694.0, 349.0, 257.0, 166.0, 123.0, 53.0, 46.0, 36.0, 22.0, 13.0, 5.0, 5.0, 7.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.4609375, -14.0111083984375, -13.561279296875, -13.1114501953125, -12.66162109375, -12.2117919921875, -11.761962890625, -11.3121337890625, -10.8623046875, -10.4124755859375, -9.962646484375, -9.5128173828125, -9.06298828125, -8.6131591796875, -8.163330078125, -7.7135009765625, -7.263671875, -6.8138427734375, -6.364013671875, -5.9141845703125, -5.46435546875, -5.0145263671875, -4.564697265625, -4.1148681640625, -3.6650390625, -3.2152099609375, -2.765380859375, -2.3155517578125, -1.86572265625, -1.4158935546875, -0.966064453125, -0.5162353515625, -0.06640625, 0.3834228515625, 0.833251953125, 1.2830810546875, 1.73291015625, 2.1827392578125, 2.632568359375, 3.0823974609375, 3.5322265625, 3.9820556640625, 4.431884765625, 4.8817138671875, 5.33154296875, 5.7813720703125, 6.231201171875, 6.6810302734375, 7.130859375, 7.5806884765625, 8.030517578125, 8.4803466796875, 8.93017578125, 9.3800048828125, 9.829833984375, 10.2796630859375, 10.7294921875, 11.1793212890625, 11.629150390625, 12.0789794921875, 12.52880859375, 12.9786376953125, 13.428466796875, 13.8782958984375, 14.328125]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 5.0, 5.0, 4.0, 6.0, 6.0, 10.0, 13.0, 11.0, 17.0, 25.0, 33.0, 31.0, 43.0, 53.0, 63.0, 60.0, 68.0, 84.0, 74.0, 57.0, 81.0, 54.0, 37.0, 32.0, 30.0, 25.0, 17.0, 15.0, 15.0, 9.0, 3.0, 5.0, 4.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0010166168212890625, -0.0009861737489700317, -0.000955730676651001, -0.0009252876043319702, -0.0008948445320129395, -0.0008644014596939087, -0.0008339583873748779, -0.0008035153150558472, -0.0007730722427368164, -0.0007426291704177856, -0.0007121860980987549, -0.0006817430257797241, -0.0006512999534606934, -0.0006208568811416626, -0.0005904138088226318, -0.0005599707365036011, -0.0005295276641845703, -0.0004990845918655396, -0.0004686415195465088, -0.00043819844722747803, -0.00040775537490844727, -0.0003773123025894165, -0.00034686923027038574, -0.000316426157951355, -0.0002859830856323242, -0.00025554001331329346, -0.0002250969409942627, -0.00019465386867523193, -0.00016421079635620117, -0.0001337677240371704, -0.00010332465171813965, -7.288157939910889e-05, -4.2438507080078125e-05, -1.1995434761047363e-05, 1.84476375579834e-05, 4.889070987701416e-05, 7.933378219604492e-05, 0.00010977685451507568, 0.00014021992683410645, 0.0001706629991531372, 0.00020110607147216797, 0.00023154914379119873, 0.0002619922161102295, 0.00029243528842926025, 0.000322878360748291, 0.0003533214330673218, 0.00038376450538635254, 0.0004142075777053833, 0.00044465065002441406, 0.0004750937223434448, 0.0005055367946624756, 0.0005359798669815063, 0.0005664229393005371, 0.0005968660116195679, 0.0006273090839385986, 0.0006577521562576294, 0.0006881952285766602, 0.0007186383008956909, 0.0007490813732147217, 0.0007795244455337524, 0.0008099675178527832, 0.000840410590171814, 0.0008708536624908447, 0.0009012967348098755, 0.0009317398071289062]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 11.0, 12.0, 25.0, 20.0, 41.0, 51.0, 84.0, 112.0, 146.0, 232.0, 316.0, 447.0, 664.0, 1024.0, 1530.0, 2390.0, 3697.0, 6113.0, 10086.0, 16336.0, 28105.0, 48284.0, 81123.0, 129324.0, 177759.0, 182732.0, 138100.0, 88541.0, 53574.0, 30779.0, 17887.0, 10627.0, 6548.0, 4098.0, 2626.0, 1751.0, 1055.0, 745.0, 479.0, 328.0, 237.0, 151.0, 115.0, 80.0, 57.0, 43.0, 26.0, 16.0, 10.0, 5.0, 6.0, 4.0, 4.0, 4.0, 2.0, 0.0, 1.0], "bins": [-13.0546875, -12.6478271484375, -12.240966796875, -11.8341064453125, -11.42724609375, -11.0203857421875, -10.613525390625, -10.2066650390625, -9.7998046875, -9.3929443359375, -8.986083984375, -8.5792236328125, -8.17236328125, -7.7655029296875, -7.358642578125, -6.9517822265625, -6.544921875, -6.1380615234375, -5.731201171875, -5.3243408203125, -4.91748046875, -4.5106201171875, -4.103759765625, -3.6968994140625, -3.2900390625, -2.8831787109375, -2.476318359375, -2.0694580078125, -1.66259765625, -1.2557373046875, -0.848876953125, -0.4420166015625, -0.03515625, 0.3717041015625, 0.778564453125, 1.1854248046875, 1.59228515625, 1.9991455078125, 2.406005859375, 2.8128662109375, 3.2197265625, 3.6265869140625, 4.033447265625, 4.4403076171875, 4.84716796875, 5.2540283203125, 5.660888671875, 6.0677490234375, 6.474609375, 6.8814697265625, 7.288330078125, 7.6951904296875, 8.10205078125, 8.5089111328125, 8.915771484375, 9.3226318359375, 9.7294921875, 10.1363525390625, 10.543212890625, 10.9500732421875, 11.35693359375, 11.7637939453125, 12.170654296875, 12.5775146484375, 12.984375]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 6.0, 4.0, 8.0, 5.0, 12.0, 17.0, 20.0, 23.0, 23.0, 32.0, 46.0, 52.0, 56.0, 50.0, 58.0, 63.0, 77.0, 73.0, 74.0, 55.0, 58.0, 32.0, 42.0, 20.0, 25.0, 20.0, 12.0, 9.0, 11.0, 8.0, 6.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.17578125, -4.03692626953125, -3.8980712890625, -3.75921630859375, -3.620361328125, -3.48150634765625, -3.3426513671875, -3.20379638671875, -3.06494140625, -2.92608642578125, -2.7872314453125, -2.64837646484375, -2.509521484375, -2.37066650390625, -2.2318115234375, -2.09295654296875, -1.9541015625, -1.81524658203125, -1.6763916015625, -1.53753662109375, -1.398681640625, -1.25982666015625, -1.1209716796875, -0.98211669921875, -0.84326171875, -0.70440673828125, -0.5655517578125, -0.42669677734375, -0.287841796875, -0.14898681640625, -0.0101318359375, 0.12872314453125, 0.267578125, 0.40643310546875, 0.5452880859375, 0.68414306640625, 0.822998046875, 0.96185302734375, 1.1007080078125, 1.23956298828125, 1.37841796875, 1.51727294921875, 1.6561279296875, 1.79498291015625, 1.933837890625, 2.07269287109375, 2.2115478515625, 2.35040283203125, 2.4892578125, 2.62811279296875, 2.7669677734375, 2.90582275390625, 3.044677734375, 3.18353271484375, 3.3223876953125, 3.46124267578125, 3.60009765625, 3.73895263671875, 3.8778076171875, 4.01666259765625, 4.155517578125, 4.29437255859375, 4.4332275390625, 4.57208251953125, 4.7109375]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 5.0, 1.0, 4.0, 4.0, 5.0, 9.0, 9.0, 12.0, 11.0, 18.0, 18.0, 27.0, 27.0, 47.0, 50.0, 53.0, 56.0, 72.0, 62.0, 72.0, 71.0, 63.0, 62.0, 38.0, 46.0, 31.0, 31.0, 19.0, 21.0, 12.0, 13.0, 13.0, 5.0, 5.0, 2.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-57.996620178222656, -56.07065963745117, -54.14469909667969, -52.21874237060547, -50.292781829833984, -48.3668212890625, -46.440860748291016, -44.51490020751953, -42.58894348144531, -40.66298294067383, -38.737022399902344, -36.811065673828125, -34.88510513305664, -32.959144592285156, -31.033184051513672, -29.10722541809082, -27.181264877319336, -25.25530433654785, -23.329345703125, -21.403385162353516, -19.477426528930664, -17.55146598815918, -15.625506401062012, -13.699546813964844, -11.773587226867676, -9.847627639770508, -7.92166805267334, -5.995707988739014, -4.069748401641846, -2.1437883377075195, -0.21782875061035156, 1.7081308364868164, 3.6340904235839844, 5.560050010681152, 7.48600959777832, 9.411970138549805, 11.337928771972656, 13.26388931274414, 15.189848899841309, 17.115808486938477, 19.041767120361328, 20.967727661132812, 22.893686294555664, 24.81964683532715, 26.74560546875, 28.671566009521484, 30.59752655029297, 32.52348327636719, 34.44944763183594, 36.37540817260742, 38.301368713378906, 40.227325439453125, 42.15328598022461, 44.079246520996094, 46.00520706176758, 47.93116760253906, 49.85712432861328, 51.783084869384766, 53.70904541015625, 55.63500213623047, 57.56096267700195, 59.48692321777344, 61.41288375854492, 63.338844299316406, 65.26480102539062]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 5.0, 5.0, 10.0, 2.0, 13.0, 8.0, 22.0, 17.0, 20.0, 26.0, 24.0, 29.0, 33.0, 31.0, 35.0, 41.0, 57.0, 43.0, 48.0, 43.0, 44.0, 48.0, 40.0, 40.0, 36.0, 40.0, 40.0, 22.0, 33.0, 21.0, 27.0, 26.0, 15.0, 8.0, 11.0, 9.0, 7.0, 8.0, 8.0, 1.0, 1.0, 6.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.31357765197754, -29.365747451782227, -28.41791534423828, -27.47008514404297, -26.522254943847656, -25.574424743652344, -24.6265926361084, -23.678762435913086, -22.73093032836914, -21.783100128173828, -20.835268020629883, -19.88743782043457, -18.939607620239258, -17.991775512695312, -17.0439453125, -16.096115112304688, -15.148284912109375, -14.200453758239746, -13.252623558044434, -12.304792404174805, -11.356962203979492, -10.409131050109863, -9.461299896240234, -8.513469696044922, -7.565638542175293, -6.617807865142822, -5.669977188110352, -4.722146034240723, -3.774315357208252, -2.8264846801757812, -1.8786535263061523, -0.9308228492736816, 0.017009735107421875, 0.9648405313491821, 1.9126713275909424, 2.860502243041992, 3.808332920074463, 4.756163597106934, 5.7039947509765625, 6.651825428009033, 7.599656105041504, 8.547487258911133, 9.495317459106445, 10.443148612976074, 11.390979766845703, 12.338809967041016, 13.286641120910645, 14.234472274780273, 15.182302474975586, 16.1301326751709, 17.077964782714844, 18.025794982910156, 18.97362518310547, 19.92145538330078, 20.869287490844727, 21.81711769104004, 22.764949798583984, 23.712779998779297, 24.660612106323242, 25.608442306518555, 26.556272506713867, 27.504104614257812, 28.451934814453125, 29.399765014648438, 30.34759521484375]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 5.0, 6.0, 10.0, 17.0, 27.0, 35.0, 55.0, 85.0, 105.0, 193.0, 241.0, 338.0, 556.0, 852.0, 1323.0, 2004.0, 3397.0, 5505.0, 9227.0, 15639.0, 26672.0, 45988.0, 77027.0, 118631.0, 159962.0, 173651.0, 147509.0, 103010.0, 63736.0, 37880.0, 21802.0, 12720.0, 7514.0, 4577.0, 2934.0, 1847.0, 1163.0, 779.0, 479.0, 344.0, 220.0, 157.0, 104.0, 75.0, 52.0, 37.0, 23.0, 22.0, 4.0, 5.0, 4.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0], "bins": [-40.375, -39.1259765625, -37.876953125, -36.6279296875, -35.37890625, -34.1298828125, -32.880859375, -31.6318359375, -30.3828125, -29.1337890625, -27.884765625, -26.6357421875, -25.38671875, -24.1376953125, -22.888671875, -21.6396484375, -20.390625, -19.1416015625, -17.892578125, -16.6435546875, -15.39453125, -14.1455078125, -12.896484375, -11.6474609375, -10.3984375, -9.1494140625, -7.900390625, -6.6513671875, -5.40234375, -4.1533203125, -2.904296875, -1.6552734375, -0.40625, 0.8427734375, 2.091796875, 3.3408203125, 4.58984375, 5.8388671875, 7.087890625, 8.3369140625, 9.5859375, 10.8349609375, 12.083984375, 13.3330078125, 14.58203125, 15.8310546875, 17.080078125, 18.3291015625, 19.578125, 20.8271484375, 22.076171875, 23.3251953125, 24.57421875, 25.8232421875, 27.072265625, 28.3212890625, 29.5703125, 30.8193359375, 32.068359375, 33.3173828125, 34.56640625, 35.8154296875, 37.064453125, 38.3134765625, 39.5625]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.bias": {"_type": "histogram", "values": [3.0, 2.0, 5.0, 2.0, 2.0, 1.0, 2.0, 7.0, 7.0, 5.0, 14.0, 7.0, 8.0, 12.0, 18.0, 16.0, 21.0, 22.0, 26.0, 40.0, 39.0, 44.0, 35.0, 33.0, 43.0, 44.0, 49.0, 44.0, 42.0, 48.0, 39.0, 38.0, 29.0, 47.0, 33.0, 21.0, 33.0, 20.0, 19.0, 19.0, 15.0, 10.0, 9.0, 8.0, 8.0, 4.0, 6.0, 2.0, 4.0, 4.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.34375, -27.32470703125, -26.3056640625, -25.28662109375, -24.267578125, -23.24853515625, -22.2294921875, -21.21044921875, -20.19140625, -19.17236328125, -18.1533203125, -17.13427734375, -16.115234375, -15.09619140625, -14.0771484375, -13.05810546875, -12.0390625, -11.02001953125, -10.0009765625, -8.98193359375, -7.962890625, -6.94384765625, -5.9248046875, -4.90576171875, -3.88671875, -2.86767578125, -1.8486328125, -0.82958984375, 0.189453125, 1.20849609375, 2.2275390625, 3.24658203125, 4.265625, 5.28466796875, 6.3037109375, 7.32275390625, 8.341796875, 9.36083984375, 10.3798828125, 11.39892578125, 12.41796875, 13.43701171875, 14.4560546875, 15.47509765625, 16.494140625, 17.51318359375, 18.5322265625, 19.55126953125, 20.5703125, 21.58935546875, 22.6083984375, 23.62744140625, 24.646484375, 25.66552734375, 26.6845703125, 27.70361328125, 28.72265625, 29.74169921875, 30.7607421875, 31.77978515625, 32.798828125, 33.81787109375, 34.8369140625, 35.85595703125, 36.875]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 8.0, 4.0, 6.0, 13.0, 16.0, 26.0, 32.0, 67.0, 100.0, 135.0, 181.0, 317.0, 493.0, 743.0, 1230.0, 2017.0, 3449.0, 6011.0, 11253.0, 21073.0, 39988.0, 73380.0, 124816.0, 181345.0, 199355.0, 158602.0, 100442.0, 56771.0, 30289.0, 15979.0, 8510.0, 4797.0, 2714.0, 1624.0, 989.0, 633.0, 414.0, 264.0, 153.0, 122.0, 65.0, 55.0, 31.0, 22.0, 12.0, 6.0, 5.0, 3.0, 2.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-47.15625, -45.5458984375, -43.935546875, -42.3251953125, -40.71484375, -39.1044921875, -37.494140625, -35.8837890625, -34.2734375, -32.6630859375, -31.052734375, -29.4423828125, -27.83203125, -26.2216796875, -24.611328125, -23.0009765625, -21.390625, -19.7802734375, -18.169921875, -16.5595703125, -14.94921875, -13.3388671875, -11.728515625, -10.1181640625, -8.5078125, -6.8974609375, -5.287109375, -3.6767578125, -2.06640625, -0.4560546875, 1.154296875, 2.7646484375, 4.375, 5.9853515625, 7.595703125, 9.2060546875, 10.81640625, 12.4267578125, 14.037109375, 15.6474609375, 17.2578125, 18.8681640625, 20.478515625, 22.0888671875, 23.69921875, 25.3095703125, 26.919921875, 28.5302734375, 30.140625, 31.7509765625, 33.361328125, 34.9716796875, 36.58203125, 38.1923828125, 39.802734375, 41.4130859375, 43.0234375, 44.6337890625, 46.244140625, 47.8544921875, 49.46484375, 51.0751953125, 52.685546875, 54.2958984375, 55.90625]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 3.0, 4.0, 5.0, 7.0, 15.0, 14.0, 13.0, 22.0, 18.0, 20.0, 20.0, 22.0, 35.0, 28.0, 27.0, 23.0, 44.0, 28.0, 53.0, 43.0, 50.0, 56.0, 41.0, 27.0, 32.0, 34.0, 30.0, 30.0, 30.0, 24.0, 21.0, 27.0, 21.0, 29.0, 24.0, 10.0, 20.0, 11.0, 6.0, 8.0, 9.0, 1.0, 4.0, 5.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 4.0], "bins": [-21.09375, -20.48193359375, -19.8701171875, -19.25830078125, -18.646484375, -18.03466796875, -17.4228515625, -16.81103515625, -16.19921875, -15.58740234375, -14.9755859375, -14.36376953125, -13.751953125, -13.14013671875, -12.5283203125, -11.91650390625, -11.3046875, -10.69287109375, -10.0810546875, -9.46923828125, -8.857421875, -8.24560546875, -7.6337890625, -7.02197265625, -6.41015625, -5.79833984375, -5.1865234375, -4.57470703125, -3.962890625, -3.35107421875, -2.7392578125, -2.12744140625, -1.515625, -0.90380859375, -0.2919921875, 0.31982421875, 0.931640625, 1.54345703125, 2.1552734375, 2.76708984375, 3.37890625, 3.99072265625, 4.6025390625, 5.21435546875, 5.826171875, 6.43798828125, 7.0498046875, 7.66162109375, 8.2734375, 8.88525390625, 9.4970703125, 10.10888671875, 10.720703125, 11.33251953125, 11.9443359375, 12.55615234375, 13.16796875, 13.77978515625, 14.3916015625, 15.00341796875, 15.615234375, 16.22705078125, 16.8388671875, 17.45068359375, 18.0625]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 7.0, 7.0, 3.0, 11.0, 14.0, 28.0, 34.0, 46.0, 60.0, 97.0, 143.0, 196.0, 276.0, 348.0, 539.0, 820.0, 1205.0, 1825.0, 2801.0, 4175.0, 6763.0, 10610.0, 17537.0, 29451.0, 50977.0, 90048.0, 153786.0, 207712.0, 185050.0, 118512.0, 67086.0, 38318.0, 22421.0, 13555.0, 8440.0, 5261.0, 3488.0, 2214.0, 1483.0, 1051.0, 680.0, 464.0, 288.0, 216.0, 163.0, 104.0, 77.0, 51.0, 47.0, 23.0, 17.0, 13.0, 3.0, 9.0, 5.0, 3.0, 4.0, 4.0], "bins": [-31.90625, -30.960693359375, -30.01513671875, -29.069580078125, -28.1240234375, -27.178466796875, -26.23291015625, -25.287353515625, -24.341796875, -23.396240234375, -22.45068359375, -21.505126953125, -20.5595703125, -19.614013671875, -18.66845703125, -17.722900390625, -16.77734375, -15.831787109375, -14.88623046875, -13.940673828125, -12.9951171875, -12.049560546875, -11.10400390625, -10.158447265625, -9.212890625, -8.267333984375, -7.32177734375, -6.376220703125, -5.4306640625, -4.485107421875, -3.53955078125, -2.593994140625, -1.6484375, -0.702880859375, 0.24267578125, 1.188232421875, 2.1337890625, 3.079345703125, 4.02490234375, 4.970458984375, 5.916015625, 6.861572265625, 7.80712890625, 8.752685546875, 9.6982421875, 10.643798828125, 11.58935546875, 12.534912109375, 13.48046875, 14.426025390625, 15.37158203125, 16.317138671875, 17.2626953125, 18.208251953125, 19.15380859375, 20.099365234375, 21.044921875, 21.990478515625, 22.93603515625, 23.881591796875, 24.8271484375, 25.772705078125, 26.71826171875, 27.663818359375, 28.609375]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 1.0, 2.0, 3.0, 8.0, 10.0, 11.0, 5.0, 14.0, 15.0, 23.0, 18.0, 28.0, 27.0, 34.0, 46.0, 68.0, 75.0, 67.0, 65.0, 79.0, 70.0, 58.0, 54.0, 42.0, 40.0, 28.0, 22.0, 11.0, 20.0, 15.0, 7.0, 9.0, 5.0, 3.0, 7.0, 5.0, 4.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00377655029296875, -0.003665328025817871, -0.003554105758666992, -0.0034428834915161133, -0.0033316612243652344, -0.0032204389572143555, -0.0031092166900634766, -0.0029979944229125977, -0.0028867721557617188, -0.00277554988861084, -0.002664327621459961, -0.002553105354309082, -0.002441883087158203, -0.0023306608200073242, -0.0022194385528564453, -0.0021082162857055664, -0.0019969940185546875, -0.0018857717514038086, -0.0017745494842529297, -0.0016633272171020508, -0.0015521049499511719, -0.001440882682800293, -0.001329660415649414, -0.0012184381484985352, -0.0011072158813476562, -0.0009959936141967773, -0.0008847713470458984, -0.0007735490798950195, -0.0006623268127441406, -0.0005511045455932617, -0.0004398822784423828, -0.0003286600112915039, -0.000217437744140625, -0.0001062154769897461, 5.0067901611328125e-06, 0.00011622905731201172, 0.00022745132446289062, 0.00033867359161376953, 0.00044989585876464844, 0.0005611181259155273, 0.0006723403930664062, 0.0007835626602172852, 0.0008947849273681641, 0.001006007194519043, 0.0011172294616699219, 0.0012284517288208008, 0.0013396739959716797, 0.0014508962631225586, 0.0015621185302734375, 0.0016733407974243164, 0.0017845630645751953, 0.0018957853317260742, 0.002007007598876953, 0.002118229866027832, 0.002229452133178711, 0.00234067440032959, 0.0024518966674804688, 0.0025631189346313477, 0.0026743412017822266, 0.0027855634689331055, 0.0028967857360839844, 0.0030080080032348633, 0.003119230270385742, 0.003230452537536621, 0.0033416748046875]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 9.0, 10.0, 10.0, 16.0, 17.0, 34.0, 46.0, 82.0, 139.0, 190.0, 244.0, 392.0, 676.0, 1056.0, 1613.0, 2706.0, 4370.0, 7440.0, 13185.0, 23801.0, 44707.0, 88091.0, 167820.0, 248088.0, 203895.0, 112920.0, 57675.0, 30009.0, 16175.0, 9166.0, 5186.0, 3324.0, 2029.0, 1224.0, 746.0, 537.0, 306.0, 220.0, 147.0, 89.0, 56.0, 38.0, 29.0, 14.0, 9.0, 7.0, 9.0, 2.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-37.21875, -36.080078125, -34.94140625, -33.802734375, -32.6640625, -31.525390625, -30.38671875, -29.248046875, -28.109375, -26.970703125, -25.83203125, -24.693359375, -23.5546875, -22.416015625, -21.27734375, -20.138671875, -19.0, -17.861328125, -16.72265625, -15.583984375, -14.4453125, -13.306640625, -12.16796875, -11.029296875, -9.890625, -8.751953125, -7.61328125, -6.474609375, -5.3359375, -4.197265625, -3.05859375, -1.919921875, -0.78125, 0.357421875, 1.49609375, 2.634765625, 3.7734375, 4.912109375, 6.05078125, 7.189453125, 8.328125, 9.466796875, 10.60546875, 11.744140625, 12.8828125, 14.021484375, 15.16015625, 16.298828125, 17.4375, 18.576171875, 19.71484375, 20.853515625, 21.9921875, 23.130859375, 24.26953125, 25.408203125, 26.546875, 27.685546875, 28.82421875, 29.962890625, 31.1015625, 32.240234375, 33.37890625, 34.517578125, 35.65625]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 4.0, 15.0, 8.0, 3.0, 20.0, 17.0, 22.0, 26.0, 34.0, 45.0, 61.0, 62.0, 56.0, 71.0, 67.0, 82.0, 70.0, 58.0, 58.0, 47.0, 42.0, 26.0, 28.0, 19.0, 15.0, 9.0, 6.0, 8.0, 5.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.0859375, -11.7578125, -11.4296875, -11.1015625, -10.7734375, -10.4453125, -10.1171875, -9.7890625, -9.4609375, -9.1328125, -8.8046875, -8.4765625, -8.1484375, -7.8203125, -7.4921875, -7.1640625, -6.8359375, -6.5078125, -6.1796875, -5.8515625, -5.5234375, -5.1953125, -4.8671875, -4.5390625, -4.2109375, -3.8828125, -3.5546875, -3.2265625, -2.8984375, -2.5703125, -2.2421875, -1.9140625, -1.5859375, -1.2578125, -0.9296875, -0.6015625, -0.2734375, 0.0546875, 0.3828125, 0.7109375, 1.0390625, 1.3671875, 1.6953125, 2.0234375, 2.3515625, 2.6796875, 3.0078125, 3.3359375, 3.6640625, 3.9921875, 4.3203125, 4.6484375, 4.9765625, 5.3046875, 5.6328125, 5.9609375, 6.2890625, 6.6171875, 6.9453125, 7.2734375, 7.6015625, 7.9296875, 8.2578125, 8.5859375, 8.9140625]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 3.0, 8.0, 6.0, 6.0, 13.0, 7.0, 13.0, 11.0, 22.0, 17.0, 24.0, 41.0, 39.0, 35.0, 62.0, 52.0, 73.0, 63.0, 58.0, 64.0, 67.0, 63.0, 41.0, 36.0, 30.0, 29.0, 27.0, 16.0, 12.0, 16.0, 10.0, 11.0, 7.0, 5.0, 3.0, 2.0, 4.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.947601318359375, -56.02047348022461, -54.09334945678711, -52.166221618652344, -50.239097595214844, -48.31196975708008, -46.38484191894531, -44.45771789550781, -42.53059005737305, -40.60346221923828, -38.67633819580078, -36.749210357666016, -34.82208251953125, -32.89495849609375, -30.967830657958984, -29.04070472717285, -27.11357879638672, -25.186452865600586, -23.259326934814453, -21.332199096679688, -19.405073165893555, -17.477947235107422, -15.550820350646973, -13.623693466186523, -11.69656753540039, -9.769441604614258, -7.842314720153809, -5.915188312530518, -3.9880619049072266, -2.0609359741210938, -0.13380908966064453, 1.7933177947998047, 3.7204437255859375, 5.6475701332092285, 7.5746965408325195, 9.501823425292969, 11.428949356079102, 13.356075286865234, 15.283202171325684, 17.210329055786133, 19.137454986572266, 21.0645809173584, 22.99170684814453, 24.918834686279297, 26.84596061706543, 28.773086547851562, 30.700214385986328, 32.627342224121094, 34.554466247558594, 36.48159408569336, 38.40871810913086, 40.335845947265625, 42.262969970703125, 44.19009780883789, 46.117225646972656, 48.044349670410156, 49.97147750854492, 51.89860534667969, 53.82572937011719, 55.75285720825195, 57.67998504638672, 59.60710906982422, 61.534236907958984, 63.46136474609375, 65.38848876953125]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 7.0, 13.0, 13.0, 2.0, 13.0, 17.0, 19.0, 19.0, 18.0, 22.0, 23.0, 33.0, 25.0, 24.0, 33.0, 43.0, 38.0, 40.0, 45.0, 40.0, 46.0, 47.0, 28.0, 43.0, 33.0, 34.0, 32.0, 23.0, 41.0, 23.0, 14.0, 24.0, 21.0, 15.0, 22.0, 9.0, 6.0, 12.0, 14.0, 8.0, 3.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-30.10472297668457, -29.111766815185547, -28.118812561035156, -27.125856399536133, -26.13290023803711, -25.13994598388672, -24.146989822387695, -23.154033660888672, -22.16107940673828, -21.168123245239258, -20.175168991088867, -19.182212829589844, -18.18925666809082, -17.196300506591797, -16.203346252441406, -15.210390090942383, -14.21743392944336, -13.224478721618652, -12.231522560119629, -11.238567352294922, -10.245611190795898, -9.252655982971191, -8.259700775146484, -7.266745090484619, -6.273789405822754, -5.280833721160889, -4.287878036499023, -3.2949228286743164, -2.301967144012451, -1.309011459350586, -0.3160562515258789, 0.6768994331359863, 1.6698532104492188, 2.662808895111084, 3.65576434135437, 4.648719787597656, 5.6416754722595215, 6.634631156921387, 7.627586364746094, 8.620542526245117, 9.613497734069824, 10.606452941894531, 11.599409103393555, 12.592364311218262, 13.585319519042969, 14.578275680541992, 15.5712308883667, 16.564186096191406, 17.55714225769043, 18.550098419189453, 19.543052673339844, 20.536008834838867, 21.52896499633789, 22.52191925048828, 23.514875411987305, 24.507831573486328, 25.50078582763672, 26.493741989135742, 27.486696243286133, 28.479652404785156, 29.47260856628418, 30.465564727783203, 31.458518981933594, 32.451473236083984, 33.44443130493164]}, "gradients/decoder.bert.encoder.layer.0.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 6.0, 4.0, 3.0, 20.0, 23.0, 27.0, 58.0, 85.0, 129.0, 191.0, 329.0, 503.0, 869.0, 1321.0, 2151.0, 3515.0, 5962.0, 10276.0, 18720.0, 36664.0, 77148.0, 180342.0, 468196.0, 1141569.0, 1271929.0, 580505.0, 218598.0, 89358.0, 40266.0, 19853.0, 10785.0, 5999.0, 3454.0, 2050.0, 1242.0, 803.0, 510.0, 302.0, 189.0, 123.0, 69.0, 56.0, 25.0, 20.0, 19.0, 12.0, 7.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-78.75, -76.1337890625, -73.517578125, -70.9013671875, -68.28515625, -65.6689453125, -63.052734375, -60.4365234375, -57.8203125, -55.2041015625, -52.587890625, -49.9716796875, -47.35546875, -44.7392578125, -42.123046875, -39.5068359375, -36.890625, -34.2744140625, -31.658203125, -29.0419921875, -26.42578125, -23.8095703125, -21.193359375, -18.5771484375, -15.9609375, -13.3447265625, -10.728515625, -8.1123046875, -5.49609375, -2.8798828125, -0.263671875, 2.3525390625, 4.96875, 7.5849609375, 10.201171875, 12.8173828125, 15.43359375, 18.0498046875, 20.666015625, 23.2822265625, 25.8984375, 28.5146484375, 31.130859375, 33.7470703125, 36.36328125, 38.9794921875, 41.595703125, 44.2119140625, 46.828125, 49.4443359375, 52.060546875, 54.6767578125, 57.29296875, 59.9091796875, 62.525390625, 65.1416015625, 67.7578125, 70.3740234375, 72.990234375, 75.6064453125, 78.22265625, 80.8388671875, 83.455078125, 86.0712890625, 88.6875]}, "gradients/decoder.bert.encoder.layer.0.output.dense.bias": {"_type": "histogram", "values": [5.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 8.0, 3.0, 13.0, 8.0, 10.0, 20.0, 26.0, 17.0, 17.0, 12.0, 25.0, 18.0, 24.0, 26.0, 40.0, 48.0, 30.0, 47.0, 53.0, 39.0, 53.0, 38.0, 42.0, 36.0, 42.0, 33.0, 31.0, 24.0, 30.0, 25.0, 27.0, 22.0, 26.0, 14.0, 13.0, 20.0, 8.0, 4.0, 10.0, 4.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-32.0625, -30.9677734375, -29.873046875, -28.7783203125, -27.68359375, -26.5888671875, -25.494140625, -24.3994140625, -23.3046875, -22.2099609375, -21.115234375, -20.0205078125, -18.92578125, -17.8310546875, -16.736328125, -15.6416015625, -14.546875, -13.4521484375, -12.357421875, -11.2626953125, -10.16796875, -9.0732421875, -7.978515625, -6.8837890625, -5.7890625, -4.6943359375, -3.599609375, -2.5048828125, -1.41015625, -0.3154296875, 0.779296875, 1.8740234375, 2.96875, 4.0634765625, 5.158203125, 6.2529296875, 7.34765625, 8.4423828125, 9.537109375, 10.6318359375, 11.7265625, 12.8212890625, 13.916015625, 15.0107421875, 16.10546875, 17.2001953125, 18.294921875, 19.3896484375, 20.484375, 21.5791015625, 22.673828125, 23.7685546875, 24.86328125, 25.9580078125, 27.052734375, 28.1474609375, 29.2421875, 30.3369140625, 31.431640625, 32.5263671875, 33.62109375, 34.7158203125, 35.810546875, 36.9052734375, 38.0]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 6.0, 7.0, 13.0, 10.0, 17.0, 38.0, 46.0, 69.0, 101.0, 171.0, 237.0, 393.0, 510.0, 798.0, 1245.0, 1994.0, 3066.0, 5001.0, 8009.0, 13565.0, 22844.0, 40154.0, 73579.0, 142946.0, 295891.0, 642609.0, 1159845.0, 914642.0, 432861.0, 203383.0, 101333.0, 54046.0, 29846.0, 17434.0, 10139.0, 6481.0, 3918.0, 2494.0, 1590.0, 964.0, 647.0, 454.0, 306.0, 190.0, 117.0, 86.0, 73.0, 42.0, 32.0, 18.0, 15.0, 11.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-101.8125, -98.60546875, -95.3984375, -92.19140625, -88.984375, -85.77734375, -82.5703125, -79.36328125, -76.15625, -72.94921875, -69.7421875, -66.53515625, -63.328125, -60.12109375, -56.9140625, -53.70703125, -50.5, -47.29296875, -44.0859375, -40.87890625, -37.671875, -34.46484375, -31.2578125, -28.05078125, -24.84375, -21.63671875, -18.4296875, -15.22265625, -12.015625, -8.80859375, -5.6015625, -2.39453125, 0.8125, 4.01953125, 7.2265625, 10.43359375, 13.640625, 16.84765625, 20.0546875, 23.26171875, 26.46875, 29.67578125, 32.8828125, 36.08984375, 39.296875, 42.50390625, 45.7109375, 48.91796875, 52.125, 55.33203125, 58.5390625, 61.74609375, 64.953125, 68.16015625, 71.3671875, 74.57421875, 77.78125, 80.98828125, 84.1953125, 87.40234375, 90.609375, 93.81640625, 97.0234375, 100.23046875, 103.4375]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 3.0, 5.0, 3.0, 3.0, 10.0, 16.0, 16.0, 13.0, 18.0, 32.0, 34.0, 36.0, 60.0, 66.0, 86.0, 105.0, 115.0, 164.0, 164.0, 205.0, 240.0, 284.0, 261.0, 286.0, 292.0, 246.0, 211.0, 192.0, 165.0, 138.0, 111.0, 98.0, 87.0, 59.0, 46.0, 47.0, 35.0, 23.0, 21.0, 19.0, 14.0, 4.0, 9.0, 4.0, 8.0, 4.0, 2.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0], "bins": [-25.84375, -25.043701171875, -24.24365234375, -23.443603515625, -22.6435546875, -21.843505859375, -21.04345703125, -20.243408203125, -19.443359375, -18.643310546875, -17.84326171875, -17.043212890625, -16.2431640625, -15.443115234375, -14.64306640625, -13.843017578125, -13.04296875, -12.242919921875, -11.44287109375, -10.642822265625, -9.8427734375, -9.042724609375, -8.24267578125, -7.442626953125, -6.642578125, -5.842529296875, -5.04248046875, -4.242431640625, -3.4423828125, -2.642333984375, -1.84228515625, -1.042236328125, -0.2421875, 0.557861328125, 1.35791015625, 2.157958984375, 2.9580078125, 3.758056640625, 4.55810546875, 5.358154296875, 6.158203125, 6.958251953125, 7.75830078125, 8.558349609375, 9.3583984375, 10.158447265625, 10.95849609375, 11.758544921875, 12.55859375, 13.358642578125, 14.15869140625, 14.958740234375, 15.7587890625, 16.558837890625, 17.35888671875, 18.158935546875, 18.958984375, 19.759033203125, 20.55908203125, 21.359130859375, 22.1591796875, 22.959228515625, 23.75927734375, 24.559326171875, 25.359375]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 5.0, 7.0, 5.0, 11.0, 13.0, 9.0, 14.0, 15.0, 24.0, 32.0, 39.0, 36.0, 50.0, 69.0, 72.0, 90.0, 69.0, 75.0, 64.0, 50.0, 61.0, 42.0, 38.0, 21.0, 24.0, 15.0, 8.0, 12.0, 7.0, 6.0, 3.0, 8.0, 2.0, 2.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-124.36991882324219, -120.25525665283203, -116.14058685302734, -112.02592468261719, -107.91126251220703, -103.79660034179688, -99.68193054199219, -95.56726837158203, -91.45260620117188, -87.33794403076172, -83.22327423095703, -79.10861206054688, -74.99394989013672, -70.87928771972656, -66.76461791992188, -62.64995574951172, -58.53528594970703, -54.42061996459961, -50.30595779418945, -46.19129180908203, -42.076629638671875, -37.96196365356445, -33.84729766845703, -29.732633590698242, -25.617969512939453, -21.503305435180664, -17.388641357421875, -13.273975372314453, -9.159311294555664, -5.044647216796875, -0.9299812316894531, 3.184682846069336, 7.299346923828125, 11.414011001586914, 15.52867603302002, 19.643341064453125, 23.758005142211914, 27.872669219970703, 31.987335205078125, 36.10199737548828, 40.2166633605957, 44.331329345703125, 48.44599151611328, 52.5606575012207, 56.675323486328125, 60.78998565673828, 64.90464782714844, 69.01931762695312, 73.13397979736328, 77.24864196777344, 81.36331176757812, 85.47797393798828, 89.59263610839844, 93.70730590820312, 97.82196807861328, 101.93663024902344, 106.05130004882812, 110.16596221923828, 114.28063201904297, 118.39529418945312, 122.50995635986328, 126.62461853027344, 130.73928833007812, 134.8539581298828, 138.96861267089844]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 6.0, 5.0, 4.0, 4.0, 6.0, 4.0, 9.0, 10.0, 10.0, 19.0, 18.0, 9.0, 17.0, 22.0, 26.0, 26.0, 23.0, 26.0, 32.0, 46.0, 28.0, 41.0, 56.0, 37.0, 46.0, 40.0, 37.0, 57.0, 41.0, 49.0, 41.0, 28.0, 22.0, 32.0, 22.0, 18.0, 19.0, 11.0, 12.0, 10.0, 7.0, 7.0, 4.0, 1.0, 11.0, 4.0, 3.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-58.71641540527344, -56.88956069946289, -55.06270980834961, -53.23585510253906, -51.409000396728516, -49.582149505615234, -47.75529479980469, -45.928443908691406, -44.10158920288086, -42.27473449707031, -40.44788360595703, -38.621028900146484, -36.79417419433594, -34.967323303222656, -33.14046859741211, -31.313615798950195, -29.48676109313965, -27.659908294677734, -25.833053588867188, -24.006200790405273, -22.17934799194336, -20.352493286132812, -18.5256404876709, -16.698787689208984, -14.871933937072754, -13.045080184936523, -11.21822738647461, -9.391373634338379, -7.564520359039307, -5.737667083740234, -3.910813331604004, -2.08396053314209, -0.2571067810058594, 1.5697466135025024, 3.3966000080108643, 5.223453521728516, 7.050306797027588, 8.87716007232666, 10.70401382446289, 12.530866622924805, 14.357720375061035, 16.184574127197266, 18.01142692565918, 19.838279724121094, 21.66513442993164, 23.491987228393555, 25.31884002685547, 27.145694732666016, 28.97254753112793, 30.799400329589844, 32.62625503540039, 34.45310974121094, 36.27996063232422, 38.106815338134766, 39.93367004394531, 41.760520935058594, 43.58737564086914, 45.41423034667969, 47.24108123779297, 49.067935943603516, 50.89479064941406, 52.721641540527344, 54.54849624633789, 56.37535095214844, 58.20220184326172]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 7.0, 5.0, 6.0, 14.0, 19.0, 25.0, 50.0, 58.0, 80.0, 109.0, 178.0, 296.0, 432.0, 691.0, 1128.0, 1809.0, 3131.0, 5604.0, 10275.0, 20127.0, 41831.0, 90331.0, 186709.0, 282818.0, 205411.0, 101782.0, 47041.0, 22471.0, 11306.0, 6078.0, 3434.0, 1991.0, 1214.0, 736.0, 436.0, 304.0, 189.0, 134.0, 103.0, 58.0, 38.0, 35.0, 21.0, 11.0, 12.0, 8.0, 6.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-65.125, -62.9951171875, -60.865234375, -58.7353515625, -56.60546875, -54.4755859375, -52.345703125, -50.2158203125, -48.0859375, -45.9560546875, -43.826171875, -41.6962890625, -39.56640625, -37.4365234375, -35.306640625, -33.1767578125, -31.046875, -28.9169921875, -26.787109375, -24.6572265625, -22.52734375, -20.3974609375, -18.267578125, -16.1376953125, -14.0078125, -11.8779296875, -9.748046875, -7.6181640625, -5.48828125, -3.3583984375, -1.228515625, 0.9013671875, 3.03125, 5.1611328125, 7.291015625, 9.4208984375, 11.55078125, 13.6806640625, 15.810546875, 17.9404296875, 20.0703125, 22.2001953125, 24.330078125, 26.4599609375, 28.58984375, 30.7197265625, 32.849609375, 34.9794921875, 37.109375, 39.2392578125, 41.369140625, 43.4990234375, 45.62890625, 47.7587890625, 49.888671875, 52.0185546875, 54.1484375, 56.2783203125, 58.408203125, 60.5380859375, 62.66796875, 64.7978515625, 66.927734375, 69.0576171875, 71.1875]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 6.0, 4.0, 1.0, 2.0, 9.0, 7.0, 10.0, 8.0, 17.0, 28.0, 24.0, 26.0, 30.0, 38.0, 34.0, 45.0, 51.0, 47.0, 66.0, 57.0, 63.0, 68.0, 59.0, 48.0, 45.0, 45.0, 26.0, 33.0, 24.0, 20.0, 14.0, 8.0, 10.0, 9.0, 10.0, 1.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-98.5, -95.8134765625, -93.126953125, -90.4404296875, -87.75390625, -85.0673828125, -82.380859375, -79.6943359375, -77.0078125, -74.3212890625, -71.634765625, -68.9482421875, -66.26171875, -63.5751953125, -60.888671875, -58.2021484375, -55.515625, -52.8291015625, -50.142578125, -47.4560546875, -44.76953125, -42.0830078125, -39.396484375, -36.7099609375, -34.0234375, -31.3369140625, -28.650390625, -25.9638671875, -23.27734375, -20.5908203125, -17.904296875, -15.2177734375, -12.53125, -9.8447265625, -7.158203125, -4.4716796875, -1.78515625, 0.9013671875, 3.587890625, 6.2744140625, 8.9609375, 11.6474609375, 14.333984375, 17.0205078125, 19.70703125, 22.3935546875, 25.080078125, 27.7666015625, 30.453125, 33.1396484375, 35.826171875, 38.5126953125, 41.19921875, 43.8857421875, 46.572265625, 49.2587890625, 51.9453125, 54.6318359375, 57.318359375, 60.0048828125, 62.69140625, 65.3779296875, 68.064453125, 70.7509765625, 73.4375]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 7.0, 5.0, 5.0, 12.0, 15.0, 24.0, 31.0, 39.0, 52.0, 77.0, 107.0, 138.0, 233.0, 312.0, 454.0, 770.0, 1180.0, 1971.0, 3343.0, 6218.0, 12603.0, 26088.0, 58466.0, 138174.0, 281084.0, 275252.0, 133256.0, 56860.0, 25154.0, 11828.0, 6141.0, 3378.0, 1924.0, 1179.0, 698.0, 473.0, 318.0, 208.0, 135.0, 98.0, 79.0, 44.0, 26.0, 31.0, 17.0, 16.0, 10.0, 11.0, 5.0, 5.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-75.75, -73.3046875, -70.859375, -68.4140625, -65.96875, -63.5234375, -61.078125, -58.6328125, -56.1875, -53.7421875, -51.296875, -48.8515625, -46.40625, -43.9609375, -41.515625, -39.0703125, -36.625, -34.1796875, -31.734375, -29.2890625, -26.84375, -24.3984375, -21.953125, -19.5078125, -17.0625, -14.6171875, -12.171875, -9.7265625, -7.28125, -4.8359375, -2.390625, 0.0546875, 2.5, 4.9453125, 7.390625, 9.8359375, 12.28125, 14.7265625, 17.171875, 19.6171875, 22.0625, 24.5078125, 26.953125, 29.3984375, 31.84375, 34.2890625, 36.734375, 39.1796875, 41.625, 44.0703125, 46.515625, 48.9609375, 51.40625, 53.8515625, 56.296875, 58.7421875, 61.1875, 63.6328125, 66.078125, 68.5234375, 70.96875, 73.4140625, 75.859375, 78.3046875, 80.75]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 2.0, 5.0, 10.0, 6.0, 4.0, 11.0, 14.0, 9.0, 14.0, 16.0, 22.0, 15.0, 23.0, 36.0, 25.0, 52.0, 38.0, 24.0, 33.0, 51.0, 34.0, 40.0, 32.0, 45.0, 33.0, 41.0, 54.0, 29.0, 33.0, 31.0, 31.0, 31.0, 23.0, 24.0, 17.0, 15.0, 8.0, 17.0, 9.0, 10.0, 12.0, 9.0, 5.0, 4.0, 2.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-34.4375, -33.30029296875, -32.1630859375, -31.02587890625, -29.888671875, -28.75146484375, -27.6142578125, -26.47705078125, -25.33984375, -24.20263671875, -23.0654296875, -21.92822265625, -20.791015625, -19.65380859375, -18.5166015625, -17.37939453125, -16.2421875, -15.10498046875, -13.9677734375, -12.83056640625, -11.693359375, -10.55615234375, -9.4189453125, -8.28173828125, -7.14453125, -6.00732421875, -4.8701171875, -3.73291015625, -2.595703125, -1.45849609375, -0.3212890625, 0.81591796875, 1.953125, 3.09033203125, 4.2275390625, 5.36474609375, 6.501953125, 7.63916015625, 8.7763671875, 9.91357421875, 11.05078125, 12.18798828125, 13.3251953125, 14.46240234375, 15.599609375, 16.73681640625, 17.8740234375, 19.01123046875, 20.1484375, 21.28564453125, 22.4228515625, 23.56005859375, 24.697265625, 25.83447265625, 26.9716796875, 28.10888671875, 29.24609375, 30.38330078125, 31.5205078125, 32.65771484375, 33.794921875, 34.93212890625, 36.0693359375, 37.20654296875, 38.34375]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 12.0, 12.0, 20.0, 25.0, 32.0, 43.0, 77.0, 101.0, 149.0, 211.0, 323.0, 452.0, 656.0, 1016.0, 1620.0, 2651.0, 4230.0, 7071.0, 12397.0, 21790.0, 40528.0, 76765.0, 148799.0, 252792.0, 220259.0, 118589.0, 61340.0, 32617.0, 17874.0, 10146.0, 5919.0, 3599.0, 2246.0, 1446.0, 848.0, 601.0, 401.0, 294.0, 196.0, 125.0, 84.0, 63.0, 50.0, 29.0, 25.0, 10.0, 8.0, 11.0, 7.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-23.15625, -22.4287109375, -21.701171875, -20.9736328125, -20.24609375, -19.5185546875, -18.791015625, -18.0634765625, -17.3359375, -16.6083984375, -15.880859375, -15.1533203125, -14.42578125, -13.6982421875, -12.970703125, -12.2431640625, -11.515625, -10.7880859375, -10.060546875, -9.3330078125, -8.60546875, -7.8779296875, -7.150390625, -6.4228515625, -5.6953125, -4.9677734375, -4.240234375, -3.5126953125, -2.78515625, -2.0576171875, -1.330078125, -0.6025390625, 0.125, 0.8525390625, 1.580078125, 2.3076171875, 3.03515625, 3.7626953125, 4.490234375, 5.2177734375, 5.9453125, 6.6728515625, 7.400390625, 8.1279296875, 8.85546875, 9.5830078125, 10.310546875, 11.0380859375, 11.765625, 12.4931640625, 13.220703125, 13.9482421875, 14.67578125, 15.4033203125, 16.130859375, 16.8583984375, 17.5859375, 18.3134765625, 19.041015625, 19.7685546875, 20.49609375, 21.2236328125, 21.951171875, 22.6787109375, 23.40625]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 1.0, 4.0, 3.0, 3.0, 8.0, 4.0, 13.0, 16.0, 21.0, 24.0, 25.0, 27.0, 46.0, 65.0, 68.0, 86.0, 92.0, 69.0, 74.0, 67.0, 46.0, 53.0, 30.0, 30.0, 25.0, 17.0, 18.0, 15.0, 10.0, 9.0, 7.0, 5.0, 7.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0020923614501953125, -0.002036452293395996, -0.0019805431365966797, -0.0019246339797973633, -0.0018687248229980469, -0.0018128156661987305, -0.001756906509399414, -0.0017009973526000977, -0.0016450881958007812, -0.0015891790390014648, -0.0015332698822021484, -0.001477360725402832, -0.0014214515686035156, -0.0013655424118041992, -0.0013096332550048828, -0.0012537240982055664, -0.00119781494140625, -0.0011419057846069336, -0.0010859966278076172, -0.0010300874710083008, -0.0009741783142089844, -0.000918269157409668, -0.0008623600006103516, -0.0008064508438110352, -0.0007505416870117188, -0.0006946325302124023, -0.0006387233734130859, -0.0005828142166137695, -0.0005269050598144531, -0.0004709959030151367, -0.0004150867462158203, -0.0003591775894165039, -0.0003032684326171875, -0.0002473592758178711, -0.0001914501190185547, -0.00013554096221923828, -7.963180541992188e-05, -2.372264862060547e-05, 3.218650817871094e-05, 8.809566497802734e-05, 0.00014400482177734375, 0.00019991397857666016, 0.00025582313537597656, 0.00031173229217529297, 0.0003676414489746094, 0.0004235506057739258, 0.0004794597625732422, 0.0005353689193725586, 0.000591278076171875, 0.0006471872329711914, 0.0007030963897705078, 0.0007590055465698242, 0.0008149147033691406, 0.000870823860168457, 0.0009267330169677734, 0.0009826421737670898, 0.0010385513305664062, 0.0010944604873657227, 0.001150369644165039, 0.0012062788009643555, 0.0012621879577636719, 0.0013180971145629883, 0.0013740062713623047, 0.001429915428161621, 0.0014858245849609375]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 5.0, 9.0, 11.0, 12.0, 13.0, 34.0, 30.0, 36.0, 58.0, 106.0, 112.0, 175.0, 252.0, 353.0, 488.0, 773.0, 1274.0, 2077.0, 3975.0, 7958.0, 18097.0, 44108.0, 108161.0, 244979.0, 316514.0, 172923.0, 71125.0, 29065.0, 12563.0, 5604.0, 2888.0, 1686.0, 981.0, 647.0, 430.0, 320.0, 194.0, 151.0, 105.0, 79.0, 55.0, 38.0, 29.0, 17.0, 20.0, 6.0, 9.0, 4.0, 2.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-37.46875, -36.2705078125, -35.072265625, -33.8740234375, -32.67578125, -31.4775390625, -30.279296875, -29.0810546875, -27.8828125, -26.6845703125, -25.486328125, -24.2880859375, -23.08984375, -21.8916015625, -20.693359375, -19.4951171875, -18.296875, -17.0986328125, -15.900390625, -14.7021484375, -13.50390625, -12.3056640625, -11.107421875, -9.9091796875, -8.7109375, -7.5126953125, -6.314453125, -5.1162109375, -3.91796875, -2.7197265625, -1.521484375, -0.3232421875, 0.875, 2.0732421875, 3.271484375, 4.4697265625, 5.66796875, 6.8662109375, 8.064453125, 9.2626953125, 10.4609375, 11.6591796875, 12.857421875, 14.0556640625, 15.25390625, 16.4521484375, 17.650390625, 18.8486328125, 20.046875, 21.2451171875, 22.443359375, 23.6416015625, 24.83984375, 26.0380859375, 27.236328125, 28.4345703125, 29.6328125, 30.8310546875, 32.029296875, 33.2275390625, 34.42578125, 35.6240234375, 36.822265625, 38.0205078125, 39.21875]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 4.0, 2.0, 3.0, 2.0, 4.0, 6.0, 6.0, 14.0, 12.0, 18.0, 18.0, 22.0, 15.0, 48.0, 36.0, 39.0, 51.0, 52.0, 53.0, 55.0, 59.0, 76.0, 56.0, 52.0, 56.0, 45.0, 37.0, 36.0, 26.0, 20.0, 8.0, 14.0, 12.0, 8.0, 6.0, 9.0, 9.0, 5.0, 6.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-7.12109375, -6.9097900390625, -6.698486328125, -6.4871826171875, -6.27587890625, -6.0645751953125, -5.853271484375, -5.6419677734375, -5.4306640625, -5.2193603515625, -5.008056640625, -4.7967529296875, -4.58544921875, -4.3741455078125, -4.162841796875, -3.9515380859375, -3.740234375, -3.5289306640625, -3.317626953125, -3.1063232421875, -2.89501953125, -2.6837158203125, -2.472412109375, -2.2611083984375, -2.0498046875, -1.8385009765625, -1.627197265625, -1.4158935546875, -1.20458984375, -0.9932861328125, -0.781982421875, -0.5706787109375, -0.359375, -0.1480712890625, 0.063232421875, 0.2745361328125, 0.48583984375, 0.6971435546875, 0.908447265625, 1.1197509765625, 1.3310546875, 1.5423583984375, 1.753662109375, 1.9649658203125, 2.17626953125, 2.3875732421875, 2.598876953125, 2.8101806640625, 3.021484375, 3.2327880859375, 3.444091796875, 3.6553955078125, 3.86669921875, 4.0780029296875, 4.289306640625, 4.5006103515625, 4.7119140625, 4.9232177734375, 5.134521484375, 5.3458251953125, 5.55712890625, 5.7684326171875, 5.979736328125, 6.1910400390625, 6.40234375]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 6.0, 1.0, 0.0, 3.0, 3.0, 6.0, 6.0, 12.0, 8.0, 10.0, 12.0, 20.0, 18.0, 34.0, 34.0, 46.0, 51.0, 53.0, 83.0, 82.0, 73.0, 78.0, 66.0, 59.0, 51.0, 40.0, 38.0, 21.0, 26.0, 15.0, 10.0, 9.0, 9.0, 6.0, 7.0, 4.0, 2.0, 6.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-134.5395050048828, -130.36776733398438, -126.1960220336914, -122.02428436279297, -117.85254669189453, -113.68080139160156, -109.50906372070312, -105.33732604980469, -101.16558837890625, -96.99385070800781, -92.82210540771484, -88.6503677368164, -84.47863006591797, -80.306884765625, -76.13514709472656, -71.96340942382812, -67.79166412353516, -63.61992263793945, -59.448184967041016, -55.27644348144531, -51.104705810546875, -46.93296432495117, -42.76122283935547, -38.58948516845703, -34.41774368286133, -30.246004104614258, -26.074264526367188, -21.902523040771484, -17.730783462524414, -13.559043884277344, -9.38730239868164, -5.21556282043457, -1.0438232421875, 3.1279168128967285, 7.299656867980957, 11.471397399902344, 15.643136978149414, 19.814876556396484, 23.986618041992188, 28.158357620239258, 32.33009719848633, 36.50183868408203, 40.67357635498047, 44.84531784057617, 49.017059326171875, 53.18879699707031, 57.360538482666016, 61.53227996826172, 65.70401763916016, 69.8757553100586, 74.04750061035156, 78.21923828125, 82.39097595214844, 86.56271362304688, 90.73445892333984, 94.90619659423828, 99.07794189453125, 103.24967956542969, 107.42142486572266, 111.5931625366211, 115.76490020751953, 119.9366455078125, 124.10838317871094, 128.28012084960938, 132.4518585205078]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 6.0, 3.0, 7.0, 4.0, 6.0, 8.0, 8.0, 8.0, 9.0, 23.0, 15.0, 13.0, 16.0, 21.0, 28.0, 23.0, 22.0, 31.0, 35.0, 41.0, 37.0, 48.0, 41.0, 43.0, 41.0, 44.0, 48.0, 48.0, 45.0, 39.0, 41.0, 24.0, 33.0, 29.0, 14.0, 20.0, 19.0, 10.0, 10.0, 10.0, 7.0, 5.0, 4.0, 6.0, 6.0, 6.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-59.4119987487793, -57.544837951660156, -55.677677154541016, -53.810516357421875, -51.943355560302734, -50.076194763183594, -48.20903396606445, -46.34187316894531, -44.47471237182617, -42.60755157470703, -40.74039077758789, -38.87322998046875, -37.00606918334961, -35.13890838623047, -33.27174758911133, -31.404586791992188, -29.537424087524414, -27.670263290405273, -25.803102493286133, -23.935941696166992, -22.06878089904785, -20.201618194580078, -18.334457397460938, -16.467296600341797, -14.600136756896973, -12.732975959777832, -10.865815162658691, -8.998653411865234, -7.131493091583252, -5.264331817626953, -3.3971710205078125, -1.5300102233886719, 0.33715057373046875, 2.2043113708496094, 4.07147216796875, 5.938633441925049, 7.8057942390441895, 9.672955513000488, 11.540116310119629, 13.40727710723877, 15.27443790435791, 17.141599655151367, 19.008760452270508, 20.87592124938965, 22.74308204650879, 24.61024284362793, 26.47740364074707, 28.34456443786621, 30.21172523498535, 32.078887939453125, 33.946048736572266, 35.813209533691406, 37.68037033081055, 39.54753112792969, 41.41469192504883, 43.28185272216797, 45.14901351928711, 47.01617431640625, 48.88333511352539, 50.75049591064453, 52.61765670776367, 54.48481750488281, 56.35197830200195, 58.219139099121094, 60.086299896240234]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 4.0, 5.0, 8.0, 14.0, 18.0, 38.0, 51.0, 64.0, 90.0, 129.0, 191.0, 254.0, 381.0, 548.0, 873.0, 1263.0, 1878.0, 2792.0, 4518.0, 7025.0, 11092.0, 18232.0, 30394.0, 50629.0, 84402.0, 133408.0, 178032.0, 177311.0, 132835.0, 83947.0, 49866.0, 29517.0, 17854.0, 11105.0, 6736.0, 4478.0, 2852.0, 1885.0, 1231.0, 811.0, 580.0, 354.0, 277.0, 185.0, 119.0, 87.0, 67.0, 46.0, 25.0, 26.0, 15.0, 10.0, 7.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-81.4375, -78.96875, -76.5, -74.03125, -71.5625, -69.09375, -66.625, -64.15625, -61.6875, -59.21875, -56.75, -54.28125, -51.8125, -49.34375, -46.875, -44.40625, -41.9375, -39.46875, -37.0, -34.53125, -32.0625, -29.59375, -27.125, -24.65625, -22.1875, -19.71875, -17.25, -14.78125, -12.3125, -9.84375, -7.375, -4.90625, -2.4375, 0.03125, 2.5, 4.96875, 7.4375, 9.90625, 12.375, 14.84375, 17.3125, 19.78125, 22.25, 24.71875, 27.1875, 29.65625, 32.125, 34.59375, 37.0625, 39.53125, 42.0, 44.46875, 46.9375, 49.40625, 51.875, 54.34375, 56.8125, 59.28125, 61.75, 64.21875, 66.6875, 69.15625, 71.625, 74.09375, 76.5625]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 7.0, 8.0, 4.0, 11.0, 9.0, 11.0, 12.0, 16.0, 23.0, 26.0, 27.0, 31.0, 38.0, 44.0, 45.0, 63.0, 54.0, 60.0, 49.0, 53.0, 55.0, 62.0, 45.0, 47.0, 35.0, 32.0, 29.0, 29.0, 20.0, 12.0, 8.0, 11.0, 7.0, 5.0, 7.0, 5.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.1875, -69.5283203125, -66.869140625, -64.2099609375, -61.55078125, -58.8916015625, -56.232421875, -53.5732421875, -50.9140625, -48.2548828125, -45.595703125, -42.9365234375, -40.27734375, -37.6181640625, -34.958984375, -32.2998046875, -29.640625, -26.9814453125, -24.322265625, -21.6630859375, -19.00390625, -16.3447265625, -13.685546875, -11.0263671875, -8.3671875, -5.7080078125, -3.048828125, -0.3896484375, 2.26953125, 4.9287109375, 7.587890625, 10.2470703125, 12.90625, 15.5654296875, 18.224609375, 20.8837890625, 23.54296875, 26.2021484375, 28.861328125, 31.5205078125, 34.1796875, 36.8388671875, 39.498046875, 42.1572265625, 44.81640625, 47.4755859375, 50.134765625, 52.7939453125, 55.453125, 58.1123046875, 60.771484375, 63.4306640625, 66.08984375, 68.7490234375, 71.408203125, 74.0673828125, 76.7265625, 79.3857421875, 82.044921875, 84.7041015625, 87.36328125, 90.0224609375, 92.681640625, 95.3408203125, 98.0]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 2.0, 8.0, 10.0, 15.0, 17.0, 22.0, 38.0, 50.0, 64.0, 112.0, 136.0, 204.0, 325.0, 420.0, 667.0, 921.0, 1453.0, 2214.0, 3249.0, 5256.0, 8604.0, 14059.0, 24345.0, 43534.0, 77663.0, 137055.0, 204478.0, 204183.0, 136396.0, 77702.0, 43464.0, 24044.0, 14167.0, 8399.0, 5175.0, 3401.0, 2143.0, 1449.0, 1013.0, 669.0, 451.0, 282.0, 207.0, 149.0, 102.0, 89.0, 48.0, 25.0, 28.0, 17.0, 8.0, 9.0, 3.0, 4.0, 4.0, 5.0, 1.0, 2.0], "bins": [-138.5, -134.302734375, -130.10546875, -125.908203125, -121.7109375, -117.513671875, -113.31640625, -109.119140625, -104.921875, -100.724609375, -96.52734375, -92.330078125, -88.1328125, -83.935546875, -79.73828125, -75.541015625, -71.34375, -67.146484375, -62.94921875, -58.751953125, -54.5546875, -50.357421875, -46.16015625, -41.962890625, -37.765625, -33.568359375, -29.37109375, -25.173828125, -20.9765625, -16.779296875, -12.58203125, -8.384765625, -4.1875, 0.009765625, 4.20703125, 8.404296875, 12.6015625, 16.798828125, 20.99609375, 25.193359375, 29.390625, 33.587890625, 37.78515625, 41.982421875, 46.1796875, 50.376953125, 54.57421875, 58.771484375, 62.96875, 67.166015625, 71.36328125, 75.560546875, 79.7578125, 83.955078125, 88.15234375, 92.349609375, 96.546875, 100.744140625, 104.94140625, 109.138671875, 113.3359375, 117.533203125, 121.73046875, 125.927734375, 130.125]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 8.0, 5.0, 7.0, 7.0, 15.0, 6.0, 13.0, 12.0, 25.0, 27.0, 32.0, 29.0, 40.0, 30.0, 36.0, 49.0, 43.0, 43.0, 43.0, 53.0, 60.0, 46.0, 53.0, 39.0, 36.0, 39.0, 26.0, 35.0, 32.0, 20.0, 16.0, 18.0, 7.0, 11.0, 17.0, 4.0, 6.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 1.0, 3.0], "bins": [-65.4375, -63.68408203125, -61.9306640625, -60.17724609375, -58.423828125, -56.67041015625, -54.9169921875, -53.16357421875, -51.41015625, -49.65673828125, -47.9033203125, -46.14990234375, -44.396484375, -42.64306640625, -40.8896484375, -39.13623046875, -37.3828125, -35.62939453125, -33.8759765625, -32.12255859375, -30.369140625, -28.61572265625, -26.8623046875, -25.10888671875, -23.35546875, -21.60205078125, -19.8486328125, -18.09521484375, -16.341796875, -14.58837890625, -12.8349609375, -11.08154296875, -9.328125, -7.57470703125, -5.8212890625, -4.06787109375, -2.314453125, -0.56103515625, 1.1923828125, 2.94580078125, 4.69921875, 6.45263671875, 8.2060546875, 9.95947265625, 11.712890625, 13.46630859375, 15.2197265625, 16.97314453125, 18.7265625, 20.47998046875, 22.2333984375, 23.98681640625, 25.740234375, 27.49365234375, 29.2470703125, 31.00048828125, 32.75390625, 34.50732421875, 36.2607421875, 38.01416015625, 39.767578125, 41.52099609375, 43.2744140625, 45.02783203125, 46.78125]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 3.0, 6.0, 12.0, 13.0, 9.0, 21.0, 51.0, 69.0, 87.0, 114.0, 182.0, 305.0, 488.0, 805.0, 1312.0, 2319.0, 3946.0, 7525.0, 14907.0, 30823.0, 65650.0, 141645.0, 260504.0, 255841.0, 137073.0, 63956.0, 29603.0, 14488.0, 7399.0, 3898.0, 2165.0, 1227.0, 755.0, 497.0, 269.0, 199.0, 117.0, 87.0, 68.0, 39.0, 23.0, 18.0, 14.0, 13.0, 5.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-102.0, -98.998046875, -95.99609375, -92.994140625, -89.9921875, -86.990234375, -83.98828125, -80.986328125, -77.984375, -74.982421875, -71.98046875, -68.978515625, -65.9765625, -62.974609375, -59.97265625, -56.970703125, -53.96875, -50.966796875, -47.96484375, -44.962890625, -41.9609375, -38.958984375, -35.95703125, -32.955078125, -29.953125, -26.951171875, -23.94921875, -20.947265625, -17.9453125, -14.943359375, -11.94140625, -8.939453125, -5.9375, -2.935546875, 0.06640625, 3.068359375, 6.0703125, 9.072265625, 12.07421875, 15.076171875, 18.078125, 21.080078125, 24.08203125, 27.083984375, 30.0859375, 33.087890625, 36.08984375, 39.091796875, 42.09375, 45.095703125, 48.09765625, 51.099609375, 54.1015625, 57.103515625, 60.10546875, 63.107421875, 66.109375, 69.111328125, 72.11328125, 75.115234375, 78.1171875, 81.119140625, 84.12109375, 87.123046875, 90.125]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 11.0, 8.0, 8.0, 15.0, 17.0, 22.0, 30.0, 42.0, 61.0, 102.0, 113.0, 123.0, 104.0, 97.0, 67.0, 64.0, 36.0, 24.0, 17.0, 13.0, 7.0, 6.0, 3.0, 1.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01335906982421875, -0.01296079158782959, -0.01256251335144043, -0.01216423511505127, -0.01176595687866211, -0.01136767864227295, -0.010969400405883789, -0.010571122169494629, -0.010172843933105469, -0.009774565696716309, -0.009376287460327148, -0.008978009223937988, -0.008579730987548828, -0.008181452751159668, -0.007783174514770508, -0.007384896278381348, -0.0069866180419921875, -0.006588339805603027, -0.006190061569213867, -0.005791783332824707, -0.005393505096435547, -0.004995226860046387, -0.0045969486236572266, -0.004198670387268066, -0.0038003921508789062, -0.003402113914489746, -0.003003835678100586, -0.0026055574417114258, -0.0022072792053222656, -0.0018090009689331055, -0.0014107227325439453, -0.0010124444961547852, -0.000614166259765625, -0.00021588802337646484, 0.0001823902130126953, 0.0005806684494018555, 0.0009789466857910156, 0.0013772249221801758, 0.001775503158569336, 0.002173781394958496, 0.0025720596313476562, 0.0029703378677368164, 0.0033686161041259766, 0.0037668943405151367, 0.004165172576904297, 0.004563450813293457, 0.004961729049682617, 0.005360007286071777, 0.0057582855224609375, 0.006156563758850098, 0.006554841995239258, 0.006953120231628418, 0.007351398468017578, 0.007749676704406738, 0.008147954940795898, 0.008546233177185059, 0.008944511413574219, 0.009342789649963379, 0.009741067886352539, 0.0101393461227417, 0.01053762435913086, 0.01093590259552002, 0.01133418083190918, 0.01173245906829834, 0.0121307373046875]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 9.0, 14.0, 18.0, 38.0, 50.0, 82.0, 106.0, 165.0, 236.0, 330.0, 525.0, 757.0, 1108.0, 1655.0, 2384.0, 3560.0, 5314.0, 8347.0, 12739.0, 20757.0, 33003.0, 54842.0, 91852.0, 147850.0, 196867.0, 173021.0, 112977.0, 68700.0, 41366.0, 25094.0, 15666.0, 9798.0, 6403.0, 4247.0, 2723.0, 1866.0, 1294.0, 867.0, 603.0, 409.0, 284.0, 193.0, 143.0, 95.0, 66.0, 56.0, 30.0, 28.0, 9.0, 5.0, 6.0, 4.0, 1.0, 3.0], "bins": [-64.1875, -62.33837890625, -60.4892578125, -58.64013671875, -56.791015625, -54.94189453125, -53.0927734375, -51.24365234375, -49.39453125, -47.54541015625, -45.6962890625, -43.84716796875, -41.998046875, -40.14892578125, -38.2998046875, -36.45068359375, -34.6015625, -32.75244140625, -30.9033203125, -29.05419921875, -27.205078125, -25.35595703125, -23.5068359375, -21.65771484375, -19.80859375, -17.95947265625, -16.1103515625, -14.26123046875, -12.412109375, -10.56298828125, -8.7138671875, -6.86474609375, -5.015625, -3.16650390625, -1.3173828125, 0.53173828125, 2.380859375, 4.22998046875, 6.0791015625, 7.92822265625, 9.77734375, 11.62646484375, 13.4755859375, 15.32470703125, 17.173828125, 19.02294921875, 20.8720703125, 22.72119140625, 24.5703125, 26.41943359375, 28.2685546875, 30.11767578125, 31.966796875, 33.81591796875, 35.6650390625, 37.51416015625, 39.36328125, 41.21240234375, 43.0615234375, 44.91064453125, 46.759765625, 48.60888671875, 50.4580078125, 52.30712890625, 54.15625]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 4.0, 7.0, 7.0, 8.0, 11.0, 9.0, 20.0, 22.0, 22.0, 18.0, 22.0, 29.0, 30.0, 29.0, 38.0, 45.0, 35.0, 52.0, 49.0, 38.0, 47.0, 49.0, 42.0, 31.0, 38.0, 29.0, 42.0, 33.0, 29.0, 21.0, 20.0, 21.0, 16.0, 13.0, 8.0, 10.0, 8.0, 6.0, 8.0, 6.0, 6.0, 7.0, 3.0, 6.0, 2.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-13.875, -13.407470703125, -12.93994140625, -12.472412109375, -12.0048828125, -11.537353515625, -11.06982421875, -10.602294921875, -10.134765625, -9.667236328125, -9.19970703125, -8.732177734375, -8.2646484375, -7.797119140625, -7.32958984375, -6.862060546875, -6.39453125, -5.927001953125, -5.45947265625, -4.991943359375, -4.5244140625, -4.056884765625, -3.58935546875, -3.121826171875, -2.654296875, -2.186767578125, -1.71923828125, -1.251708984375, -0.7841796875, -0.316650390625, 0.15087890625, 0.618408203125, 1.0859375, 1.553466796875, 2.02099609375, 2.488525390625, 2.9560546875, 3.423583984375, 3.89111328125, 4.358642578125, 4.826171875, 5.293701171875, 5.76123046875, 6.228759765625, 6.6962890625, 7.163818359375, 7.63134765625, 8.098876953125, 8.56640625, 9.033935546875, 9.50146484375, 9.968994140625, 10.4365234375, 10.904052734375, 11.37158203125, 11.839111328125, 12.306640625, 12.774169921875, 13.24169921875, 13.709228515625, 14.1767578125, 14.644287109375, 15.11181640625, 15.579345703125, 16.046875]}, "gradients/decoder.bert.embeddings.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 5.0, 2.0, 2.0, 4.0, 6.0, 8.0, 7.0, 7.0, 20.0, 14.0, 24.0, 19.0, 32.0, 31.0, 48.0, 59.0, 59.0, 67.0, 69.0, 79.0, 75.0, 63.0, 58.0, 54.0, 35.0, 44.0, 24.0, 25.0, 11.0, 16.0, 7.0, 9.0, 10.0, 5.0, 3.0, 7.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-179.46360778808594, -174.63201904296875, -169.8004150390625, -164.96881103515625, -160.13722229003906, -155.30563354492188, -150.47402954101562, -145.64242553710938, -140.8108367919922, -135.979248046875, -131.14764404296875, -126.31604766845703, -121.48445129394531, -116.6528549194336, -111.82125854492188, -106.98966217041016, -102.15806579589844, -97.32646942138672, -92.494873046875, -87.66327667236328, -82.83168029785156, -78.00008392333984, -73.16848754882812, -68.3368911743164, -63.50529479980469, -58.67369842529297, -53.84210205078125, -49.01050567626953, -44.17890930175781, -39.347312927246094, -34.515716552734375, -29.684120178222656, -24.8525390625, -20.02094268798828, -15.189346313476562, -10.357749938964844, -5.526153564453125, -0.6945571899414062, 4.1370391845703125, 8.968635559082031, 13.80023193359375, 18.63182830810547, 23.463424682617188, 28.295021057128906, 33.126617431640625, 37.958213806152344, 42.78981018066406, 47.62140655517578, 52.4530029296875, 57.28459930419922, 62.11619567871094, 66.94779205322266, 71.77938842773438, 76.6109848022461, 81.44258117675781, 86.27417755126953, 91.10577392578125, 95.93737030029297, 100.76896667480469, 105.6005630493164, 110.43215942382812, 115.26375579833984, 120.09535217285156, 124.92694854736328, 129.758544921875]}, "gradients/decoder.bert.embeddings.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 8.0, 4.0, 7.0, 9.0, 8.0, 10.0, 6.0, 16.0, 22.0, 24.0, 30.0, 22.0, 33.0, 46.0, 56.0, 46.0, 45.0, 59.0, 52.0, 62.0, 63.0, 56.0, 49.0, 44.0, 33.0, 37.0, 38.0, 18.0, 13.0, 22.0, 15.0, 13.0, 11.0, 4.0, 5.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-125.78013610839844, -121.90802001953125, -118.0359115600586, -114.16380310058594, -110.29168701171875, -106.41957092285156, -102.5474624633789, -98.67535400390625, -94.80323791503906, -90.93112182617188, -87.05901336669922, -83.18690490722656, -79.31478881835938, -75.44267272949219, -71.57056427001953, -67.69845581054688, -63.82633972167969, -59.954227447509766, -56.082115173339844, -52.21000289916992, -48.337890625, -44.46577835083008, -40.593666076660156, -36.721553802490234, -32.84944152832031, -28.97732925415039, -25.10521697998047, -21.233104705810547, -17.360992431640625, -13.488880157470703, -9.616767883300781, -5.744655609130859, -1.8725433349609375, 1.9995689392089844, 5.871681213378906, 9.743793487548828, 13.61590576171875, 17.488018035888672, 21.360130310058594, 25.232242584228516, 29.104354858398438, 32.97646713256836, 36.84857940673828, 40.7206916809082, 44.592803955078125, 48.46491622924805, 52.33702850341797, 56.20914077758789, 60.08125305175781, 63.953365325927734, 67.82547760009766, 71.69758605957031, 75.5697021484375, 79.44181823730469, 83.31392669677734, 87.18603515625, 91.05815124511719, 94.93026733398438, 98.80237579345703, 102.67448425292969, 106.54660034179688, 110.41871643066406, 114.29082489013672, 118.16293334960938, 122.03504943847656]}, "gradients/decoder.bert.embeddings.position_embeddings.weight": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 9.0, 2.0, 11.0, 8.0, 11.0, 13.0, 18.0, 27.0, 23.0, 39.0, 30.0, 46.0, 62.0, 94.0, 146.0, 198.0, 294.0, 456.0, 806.0, 1468.0, 4237.0, 512340.0, 1600.0, 797.0, 460.0, 304.0, 191.0, 148.0, 96.0, 70.0, 59.0, 40.0, 24.0, 33.0, 14.0, 14.0, 13.0, 11.0, 10.0, 9.0, 8.0, 3.0, 4.0, 4.0, 4.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0], "bins": [-2329.248291015625, -2258.72705078125, -2188.2060546875, -2117.684814453125, -2047.163818359375, -1976.642578125, -1906.1214599609375, -1835.600341796875, -1765.0792236328125, -1694.55810546875, -1624.0369873046875, -1553.515869140625, -1482.99462890625, -1412.4736328125, -1341.952392578125, -1271.4312744140625, -1200.91015625, -1130.3890380859375, -1059.867919921875, -989.3467407226562, -918.8256225585938, -848.3045043945312, -777.7833251953125, -707.26220703125, -636.7410888671875, -566.219970703125, -495.6988220214844, -425.17767333984375, -354.65655517578125, -284.13543701171875, -213.61428833007812, -143.0931396484375, -72.572265625, -2.0511322021484375, 68.47000122070312, 138.9911346435547, 209.51226806640625, 280.03338623046875, 350.5545349121094, 421.07568359375, 491.5968017578125, 562.117919921875, 632.6390380859375, 703.1602172851562, 773.6813354492188, 844.2024536132812, 914.7236328125, 985.2447509765625, 1055.765869140625, 1126.2869873046875, 1196.80810546875, 1267.3292236328125, 1337.850341796875, 1408.37158203125, 1478.8927001953125, 1549.413818359375, 1619.9349365234375, 1690.4560546875, 1760.9771728515625, 1831.498291015625, 1902.01953125, 1972.54052734375, 2043.061767578125, 2113.5830078125, 2184.10400390625]}, "gradients/decoder.bert.embeddings.token_type_embeddings.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 7.0, 7.0, 2.0, 8.0, 9.0, 11.0, 7.0, 8.0, 25.0, 17.0, 34.0, 25.0, 26.0, 36.0, 62.0, 42.0, 41.0, 60.0, 1075.0, 68.0, 56.0, 64.0, 46.0, 51.0, 34.0, 37.0, 32.0, 31.0, 14.0, 20.0, 16.0, 12.0, 15.0, 6.0, 4.0, 7.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4107.04736328125, -3982.537353515625, -3858.02734375, -3733.517333984375, -3609.00732421875, -3484.497314453125, -3359.9873046875, -3235.477294921875, -3110.96728515625, -2986.457275390625, -2861.947265625, -2737.437255859375, -2612.92724609375, -2488.417236328125, -2363.9072265625, -2239.397216796875, -2114.88720703125, -1990.377197265625, -1865.8671875, -1741.357177734375, -1616.84716796875, -1492.337158203125, -1367.8271484375, -1243.317138671875, -1118.80712890625, -994.297119140625, -869.787109375, -745.277099609375, -620.76708984375, -496.257080078125, -371.7470703125, -247.237060546875, -122.727294921875, 1.78271484375, 126.292724609375, 250.802734375, 375.312744140625, 499.82275390625, 624.332763671875, 748.8427734375, 873.352783203125, 997.86279296875, 1122.372802734375, 1246.8828125, 1371.392822265625, 1495.90283203125, 1620.412841796875, 1744.9228515625, 1869.432861328125, 1993.94287109375, 2118.452880859375, 2242.962890625, 2367.472900390625, 2491.98291015625, 2616.492919921875, 2741.0029296875, 2865.512939453125, 2990.02294921875, 3114.532958984375, 3239.04296875, 3363.552978515625, 3488.06298828125, 3612.572998046875, 3737.0830078125, 3861.593017578125]}, "gradients/decoder.bert.embeddings.word_embeddings.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 6.0, 7.0, 11.0, 15.0, 15.0, 21.0, 23.0, 39.0, 36.0, 46.0, 58.0, 84.0, 97.0, 120.0, 209.0, 383.0, 690.0, 1377.0, 2404.0, 4011.0, 8809.0, 31203860.0, 18826.0, 9726.0, 1608.0, 739.0, 379.0, 227.0, 140.0, 106.0, 81.0, 63.0, 49.0, 45.0, 40.0, 32.0, 23.0, 25.0, 14.0, 11.0, 14.0, 14.0, 7.0, 5.0, 4.0, 2.0, 4.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2727.01513671875, -2643.531982421875, -2560.048828125, -2476.5654296875, -2393.082275390625, -2309.59912109375, -2226.115966796875, -2142.6328125, -2059.1494140625, -1975.666259765625, -1892.1829833984375, -1808.6998291015625, -1725.216552734375, -1641.7333984375, -1558.250244140625, -1474.76708984375, -1391.283935546875, -1307.80078125, -1224.3175048828125, -1140.8343505859375, -1057.35107421875, -973.867919921875, -890.384765625, -806.9015502929688, -723.4183349609375, -639.9351196289062, -556.451904296875, -472.96875, -389.48553466796875, -306.0023193359375, -222.51913452148438, -139.03594970703125, -55.552490234375, 27.930709838867188, 111.41390991210938, 194.89710998535156, 278.38031005859375, 361.863525390625, 445.3467102050781, 528.8298950195312, 612.3131103515625, 695.7963256835938, 779.279541015625, 862.7626953125, 946.2459106445312, 1029.7291259765625, 1113.2122802734375, 1196.695556640625, 1280.1787109375, 1363.661865234375, 1447.1451416015625, 1530.6282958984375, 1614.111572265625, 1697.5947265625, 1781.077880859375, 1864.56103515625, 1948.0443115234375, 2031.5274658203125, 2115.0107421875, 2198.493896484375, 2281.97705078125, 2365.46044921875, 2448.943603515625, 2532.4267578125, 2615.909912109375]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 5.0, 5.0, 3.0, 8.0, 13.0, 22.0, 32.0, 52.0, 54.0, 93.0, 134.0, 206.0, 299.0, 396.0, 602.0, 839.0, 1394.0, 2276.0, 3450.0, 5744.0, 9429.0, 16818.0, 30531.0, 57884.0, 117381.0, 258450.0, 656203.0, 2029128.0, 1967592.0, 640271.0, 251579.0, 114232.0, 56230.0, 29890.0, 16332.0, 9135.0, 5499.0, 3307.0, 2048.0, 1279.0, 887.0, 533.0, 400.0, 259.0, 147.0, 110.0, 88.0, 52.0, 41.0, 34.0, 14.0, 11.0, 8.0, 4.0, 8.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0], "bins": [-141.0, -136.44921875, -131.8984375, -127.34765625, -122.796875, -118.24609375, -113.6953125, -109.14453125, -104.59375, -100.04296875, -95.4921875, -90.94140625, -86.390625, -81.83984375, -77.2890625, -72.73828125, -68.1875, -63.63671875, -59.0859375, -54.53515625, -49.984375, -45.43359375, -40.8828125, -36.33203125, -31.78125, -27.23046875, -22.6796875, -18.12890625, -13.578125, -9.02734375, -4.4765625, 0.07421875, 4.625, 9.17578125, 13.7265625, 18.27734375, 22.828125, 27.37890625, 31.9296875, 36.48046875, 41.03125, 45.58203125, 50.1328125, 54.68359375, 59.234375, 63.78515625, 68.3359375, 72.88671875, 77.4375, 81.98828125, 86.5390625, 91.08984375, 95.640625, 100.19140625, 104.7421875, 109.29296875, 113.84375, 118.39453125, 122.9453125, 127.49609375, 132.046875, 136.59765625, 141.1484375, 145.69921875, 150.25]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 7.0, 3.0, 13.0, 4.0, 7.0, 11.0, 9.0, 19.0, 17.0, 17.0, 16.0, 25.0, 39.0, 45.0, 39.0, 46.0, 67.0, 112.0, 83.0, 128.0, 131.0, 158.0, 132.0, 157.0, 105.0, 106.0, 98.0, 84.0, 57.0, 44.0, 39.0, 34.0, 31.0, 32.0, 21.0, 17.0, 6.0, 13.0, 17.0, 10.0, 3.0, 3.0, 3.0, 6.0, 6.0, 4.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-41.625, -40.3349609375, -39.044921875, -37.7548828125, -36.46484375, -35.1748046875, -33.884765625, -32.5947265625, -31.3046875, -30.0146484375, -28.724609375, -27.4345703125, -26.14453125, -24.8544921875, -23.564453125, -22.2744140625, -20.984375, -19.6943359375, -18.404296875, -17.1142578125, -15.82421875, -14.5341796875, -13.244140625, -11.9541015625, -10.6640625, -9.3740234375, -8.083984375, -6.7939453125, -5.50390625, -4.2138671875, -2.923828125, -1.6337890625, -0.34375, 0.9462890625, 2.236328125, 3.5263671875, 4.81640625, 6.1064453125, 7.396484375, 8.6865234375, 9.9765625, 11.2666015625, 12.556640625, 13.8466796875, 15.13671875, 16.4267578125, 17.716796875, 19.0068359375, 20.296875, 21.5869140625, 22.876953125, 24.1669921875, 25.45703125, 26.7470703125, 28.037109375, 29.3271484375, 30.6171875, 31.9072265625, 33.197265625, 34.4873046875, 35.77734375, 37.0673828125, 38.357421875, 39.6474609375, 40.9375]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 3.0, 3.0, 3.0, 8.0, 12.0, 17.0, 23.0, 36.0, 54.0, 97.0, 143.0, 215.0, 364.0, 524.0, 850.0, 1390.0, 2248.0, 3790.0, 6477.0, 11841.0, 21297.0, 39941.0, 76933.0, 147869.0, 287164.0, 583111.0, 1411813.0, 2042298.0, 844703.0, 391660.0, 197579.0, 102019.0, 52883.0, 28191.0, 15332.0, 8290.0, 4897.0, 2804.0, 1685.0, 1056.0, 623.0, 397.0, 274.0, 180.0, 112.0, 75.0, 55.0, 41.0, 19.0, 14.0, 7.0, 14.0, 6.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-78.8125, -76.205078125, -73.59765625, -70.990234375, -68.3828125, -65.775390625, -63.16796875, -60.560546875, -57.953125, -55.345703125, -52.73828125, -50.130859375, -47.5234375, -44.916015625, -42.30859375, -39.701171875, -37.09375, -34.486328125, -31.87890625, -29.271484375, -26.6640625, -24.056640625, -21.44921875, -18.841796875, -16.234375, -13.626953125, -11.01953125, -8.412109375, -5.8046875, -3.197265625, -0.58984375, 2.017578125, 4.625, 7.232421875, 9.83984375, 12.447265625, 15.0546875, 17.662109375, 20.26953125, 22.876953125, 25.484375, 28.091796875, 30.69921875, 33.306640625, 35.9140625, 38.521484375, 41.12890625, 43.736328125, 46.34375, 48.951171875, 51.55859375, 54.166015625, 56.7734375, 59.380859375, 61.98828125, 64.595703125, 67.203125, 69.810546875, 72.41796875, 75.025390625, 77.6328125, 80.240234375, 82.84765625, 85.455078125, 88.0625]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 3.0, 4.0, 8.0, 5.0, 12.0, 15.0, 27.0, 29.0, 26.0, 48.0, 43.0, 61.0, 59.0, 76.0, 89.0, 81.0, 143.0, 142.0, 169.0, 163.0, 125.0, 127.0, 103.0, 102.0, 74.0, 38.0, 44.0, 44.0, 38.0, 25.0, 17.0, 19.0, 17.0, 14.0, 6.0, 5.0, 6.0, 6.0, 3.0, 4.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-64.1875, -62.294921875, -60.40234375, -58.509765625, -56.6171875, -54.724609375, -52.83203125, -50.939453125, -49.046875, -47.154296875, -45.26171875, -43.369140625, -41.4765625, -39.583984375, -37.69140625, -35.798828125, -33.90625, -32.013671875, -30.12109375, -28.228515625, -26.3359375, -24.443359375, -22.55078125, -20.658203125, -18.765625, -16.873046875, -14.98046875, -13.087890625, -11.1953125, -9.302734375, -7.41015625, -5.517578125, -3.625, -1.732421875, 0.16015625, 2.052734375, 3.9453125, 5.837890625, 7.73046875, 9.623046875, 11.515625, 13.408203125, 15.30078125, 17.193359375, 19.0859375, 20.978515625, 22.87109375, 24.763671875, 26.65625, 28.548828125, 30.44140625, 32.333984375, 34.2265625, 36.119140625, 38.01171875, 39.904296875, 41.796875, 43.689453125, 45.58203125, 47.474609375, 49.3671875, 51.259765625, 53.15234375, 55.044921875, 56.9375]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 13.0, 8.0, 9.0, 11.0, 39.0, 52.0, 63.0, 75.0, 107.0, 166.0, 232.0, 422.0, 547.0, 874.0, 1307.0, 2269.0, 3511.0, 5424.0, 9240.0, 16062.0, 28370.0, 56795.0, 137509.0, 5461163.0, 374627.0, 94201.0, 42528.0, 22589.0, 12572.0, 7576.0, 4708.0, 2774.0, 1822.0, 1209.0, 838.0, 512.0, 359.0, 250.0, 172.0, 119.0, 80.0, 68.0, 49.0, 29.0, 22.0, 17.0, 14.0, 12.0, 8.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-249.875, -241.767578125, -233.66015625, -225.552734375, -217.4453125, -209.337890625, -201.23046875, -193.123046875, -185.015625, -176.908203125, -168.80078125, -160.693359375, -152.5859375, -144.478515625, -136.37109375, -128.263671875, -120.15625, -112.048828125, -103.94140625, -95.833984375, -87.7265625, -79.619140625, -71.51171875, -63.404296875, -55.296875, -47.189453125, -39.08203125, -30.974609375, -22.8671875, -14.759765625, -6.65234375, 1.455078125, 9.5625, 17.669921875, 25.77734375, 33.884765625, 41.9921875, 50.099609375, 58.20703125, 66.314453125, 74.421875, 82.529296875, 90.63671875, 98.744140625, 106.8515625, 114.958984375, 123.06640625, 131.173828125, 139.28125, 147.388671875, 155.49609375, 163.603515625, 171.7109375, 179.818359375, 187.92578125, 196.033203125, 204.140625, 212.248046875, 220.35546875, 228.462890625, 236.5703125, 244.677734375, 252.78515625, 260.892578125, 269.0]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 4.0, 8.0, 7.0, 14.0, 11.0, 16.0, 17.0, 17.0, 24.0, 28.0, 24.0, 38.0, 48.0, 55.0, 46.0, 74.0, 106.0, 139.0, 186.0, 212.0, 228.0, 154.0, 132.0, 84.0, 72.0, 60.0, 43.0, 34.0, 25.0, 24.0, 23.0, 12.0, 16.0, 9.0, 9.0, 9.0, 5.0, 8.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0], "bins": [-115.125, -112.06640625, -109.0078125, -105.94921875, -102.890625, -99.83203125, -96.7734375, -93.71484375, -90.65625, -87.59765625, -84.5390625, -81.48046875, -78.421875, -75.36328125, -72.3046875, -69.24609375, -66.1875, -63.12890625, -60.0703125, -57.01171875, -53.953125, -50.89453125, -47.8359375, -44.77734375, -41.71875, -38.66015625, -35.6015625, -32.54296875, -29.484375, -26.42578125, -23.3671875, -20.30859375, -17.25, -14.19140625, -11.1328125, -8.07421875, -5.015625, -1.95703125, 1.1015625, 4.16015625, 7.21875, 10.27734375, 13.3359375, 16.39453125, 19.453125, 22.51171875, 25.5703125, 28.62890625, 31.6875, 34.74609375, 37.8046875, 40.86328125, 43.921875, 46.98046875, 50.0390625, 53.09765625, 56.15625, 59.21484375, 62.2734375, 65.33203125, 68.390625, 71.44921875, 74.5078125, 77.56640625, 80.625]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 0.0, 0.0, 6.0, 10.0, 19.0, 41.0, 65.0, 118.0, 481.0, 146.0, 48.0, 30.0, 11.0, 12.0, 5.0, 6.0, 5.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-29289.205078125, -28697.8671875, -28106.53125, -27515.193359375, -26923.85546875, -26332.517578125, -25741.1796875, -25149.84375, -24558.505859375, -23967.16796875, -23375.83203125, -22784.494140625, -22193.15625, -21601.818359375, -21010.48046875, -20419.14453125, -19827.806640625, -19236.46875, -18645.1328125, -18053.794921875, -17462.45703125, -16871.119140625, -16279.7822265625, -15688.4453125, -15097.107421875, -14505.76953125, -13914.4326171875, -13323.095703125, -12731.7578125, -12140.419921875, -11549.0830078125, -10957.74609375, -10366.40625, -9775.068359375, -9183.7314453125, -8592.39453125, -8001.056640625, -7409.71923828125, -6818.3818359375, -6227.04443359375, -5635.70703125, -5044.36962890625, -4453.0322265625, -3861.69482421875, -3270.357421875, -2679.02001953125, -2087.6826171875, -1496.34521484375, -905.0078125, -313.67041015625, 277.6669921875, 869.00439453125, 1460.341796875, 2051.67919921875, 2643.0166015625, 3234.35400390625, 3825.69140625, 4417.02880859375, 5008.3662109375, 5599.70361328125, 6191.041015625, 6782.37841796875, 7373.7158203125, 7965.05322265625, 8556.390625]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 4.0, 7.0, 2.0, 7.0, 1.0, 10.0, 1.0, 8.0, 7.0, 8.0, 10.0, 18.0, 10.0, 17.0, 21.0, 18.0, 19.0, 17.0, 22.0, 46.0, 76.0, 126.0, 165.0, 92.0, 54.0, 41.0, 23.0, 29.0, 24.0, 19.0, 10.0, 7.0, 12.0, 10.0, 12.0, 13.0, 10.0, 5.0, 4.0, 1.0, 7.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2373.5947265625, -2302.244873046875, -2230.895263671875, -2159.54541015625, -2088.195556640625, -2016.845947265625, -1945.49609375, -1874.1463623046875, -1802.796630859375, -1731.4468994140625, -1660.0970458984375, -1588.747314453125, -1517.3975830078125, -1446.0478515625, -1374.697998046875, -1303.3482666015625, -1231.9984130859375, -1160.648681640625, -1089.298828125, -1017.9490966796875, -946.599365234375, -875.2495727539062, -803.8997802734375, -732.550048828125, -661.2002563476562, -589.8504638671875, -518.500732421875, -447.15093994140625, -375.8011779785156, -304.451416015625, -233.10162353515625, -161.75186157226562, -90.402099609375, -19.052330017089844, 52.29743957519531, 123.647216796875, 194.99697875976562, 266.34674072265625, 337.696533203125, 409.0462951660156, 480.39605712890625, 551.745849609375, 623.0955810546875, 694.4453735351562, 765.795166015625, 837.1448974609375, 908.4946899414062, 979.844482421875, 1051.1942138671875, 1122.5439453125, 1193.893798828125, 1265.2435302734375, 1336.59326171875, 1407.943115234375, 1479.2928466796875, 1550.642578125, 1621.992431640625, 1693.3421630859375, 1764.6920166015625, 1836.041748046875, 1907.3914794921875, 1978.7412109375, 2050.091064453125, 2121.44091796875, 2192.79052734375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 6.0, 1.0, 5.0, 6.0, 8.0, 14.0, 14.0, 17.0, 28.0, 46.0, 50.0, 82.0, 127.0, 152.0, 240.0, 405.0, 589.0, 968.0, 1453.0, 2354.0, 3848.0, 6569.0, 11784.0, 22641.0, 47996.0, 137289.0, 843552.0, 2771360.0, 221554.0, 63832.0, 26600.0, 13072.0, 7207.0, 4245.0, 2476.0, 1452.0, 845.0, 523.0, 318.0, 214.0, 125.0, 76.0, 52.0, 31.0, 17.0, 12.0, 9.0, 5.0, 7.0, 9.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-64.625, -62.78662109375, -60.9482421875, -59.10986328125, -57.271484375, -55.43310546875, -53.5947265625, -51.75634765625, -49.91796875, -48.07958984375, -46.2412109375, -44.40283203125, -42.564453125, -40.72607421875, -38.8876953125, -37.04931640625, -35.2109375, -33.37255859375, -31.5341796875, -29.69580078125, -27.857421875, -26.01904296875, -24.1806640625, -22.34228515625, -20.50390625, -18.66552734375, -16.8271484375, -14.98876953125, -13.150390625, -11.31201171875, -9.4736328125, -7.63525390625, -5.796875, -3.95849609375, -2.1201171875, -0.28173828125, 1.556640625, 3.39501953125, 5.2333984375, 7.07177734375, 8.91015625, 10.74853515625, 12.5869140625, 14.42529296875, 16.263671875, 18.10205078125, 19.9404296875, 21.77880859375, 23.6171875, 25.45556640625, 27.2939453125, 29.13232421875, 30.970703125, 32.80908203125, 34.6474609375, 36.48583984375, 38.32421875, 40.16259765625, 42.0009765625, 43.83935546875, 45.677734375, 47.51611328125, 49.3544921875, 51.19287109375, 53.03125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 10.0, 2.0, 7.0, 11.0, 13.0, 29.0, 30.0, 40.0, 59.0, 62.0, 98.0, 110.0, 116.0, 99.0, 90.0, 56.0, 50.0, 30.0, 17.0, 20.0, 10.0, 7.0, 5.0, 3.0, 6.0, 2.0, 1.0, 4.0, 3.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.494140625, -3.39459228515625, -3.2950439453125, -3.19549560546875, -3.095947265625, -2.99639892578125, -2.8968505859375, -2.79730224609375, -2.69775390625, -2.59820556640625, -2.4986572265625, -2.39910888671875, -2.299560546875, -2.20001220703125, -2.1004638671875, -2.00091552734375, -1.9013671875, -1.80181884765625, -1.7022705078125, -1.60272216796875, -1.503173828125, -1.40362548828125, -1.3040771484375, -1.20452880859375, -1.10498046875, -1.00543212890625, -0.9058837890625, -0.80633544921875, -0.706787109375, -0.60723876953125, -0.5076904296875, -0.40814208984375, -0.30859375, -0.20904541015625, -0.1094970703125, -0.00994873046875, 0.089599609375, 0.18914794921875, 0.2886962890625, 0.38824462890625, 0.48779296875, 0.58734130859375, 0.6868896484375, 0.78643798828125, 0.885986328125, 0.98553466796875, 1.0850830078125, 1.18463134765625, 1.2841796875, 1.38372802734375, 1.4832763671875, 1.58282470703125, 1.682373046875, 1.78192138671875, 1.8814697265625, 1.98101806640625, 2.08056640625, 2.18011474609375, 2.2796630859375, 2.37921142578125, 2.478759765625, 2.57830810546875, 2.6778564453125, 2.77740478515625, 2.876953125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 4.0, 4.0, 4.0, 5.0, 12.0, 14.0, 21.0, 39.0, 41.0, 94.0, 106.0, 160.0, 238.0, 400.0, 629.0, 1066.0, 1823.0, 3646.0, 7537.0, 18319.0, 48716.0, 148731.0, 570236.0, 2405466.0, 708703.0, 179679.0, 58367.0, 21610.0, 9199.0, 4211.0, 2116.0, 1225.0, 696.0, 405.0, 259.0, 167.0, 113.0, 78.0, 46.0, 35.0, 30.0, 12.0, 11.0, 10.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-54.3125, -52.6943359375, -51.076171875, -49.4580078125, -47.83984375, -46.2216796875, -44.603515625, -42.9853515625, -41.3671875, -39.7490234375, -38.130859375, -36.5126953125, -34.89453125, -33.2763671875, -31.658203125, -30.0400390625, -28.421875, -26.8037109375, -25.185546875, -23.5673828125, -21.94921875, -20.3310546875, -18.712890625, -17.0947265625, -15.4765625, -13.8583984375, -12.240234375, -10.6220703125, -9.00390625, -7.3857421875, -5.767578125, -4.1494140625, -2.53125, -0.9130859375, 0.705078125, 2.3232421875, 3.94140625, 5.5595703125, 7.177734375, 8.7958984375, 10.4140625, 12.0322265625, 13.650390625, 15.2685546875, 16.88671875, 18.5048828125, 20.123046875, 21.7412109375, 23.359375, 24.9775390625, 26.595703125, 28.2138671875, 29.83203125, 31.4501953125, 33.068359375, 34.6865234375, 36.3046875, 37.9228515625, 39.541015625, 41.1591796875, 42.77734375, 44.3955078125, 46.013671875, 47.6318359375, 49.25]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 6.0, 9.0, 0.0, 10.0, 10.0, 17.0, 16.0, 32.0, 53.0, 68.0, 92.0, 118.0, 149.0, 251.0, 297.0, 424.0, 713.0, 436.0, 318.0, 262.0, 181.0, 158.0, 127.0, 92.0, 53.0, 51.0, 37.0, 21.0, 21.0, 14.0, 10.0, 11.0, 4.0, 3.0, 7.0, 4.0, 3.0, 5.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.4453125, -14.013671875, -13.58203125, -13.150390625, -12.71875, -12.287109375, -11.85546875, -11.423828125, -10.9921875, -10.560546875, -10.12890625, -9.697265625, -9.265625, -8.833984375, -8.40234375, -7.970703125, -7.5390625, -7.107421875, -6.67578125, -6.244140625, -5.8125, -5.380859375, -4.94921875, -4.517578125, -4.0859375, -3.654296875, -3.22265625, -2.791015625, -2.359375, -1.927734375, -1.49609375, -1.064453125, -0.6328125, -0.201171875, 0.23046875, 0.662109375, 1.09375, 1.525390625, 1.95703125, 2.388671875, 2.8203125, 3.251953125, 3.68359375, 4.115234375, 4.546875, 4.978515625, 5.41015625, 5.841796875, 6.2734375, 6.705078125, 7.13671875, 7.568359375, 8.0, 8.431640625, 8.86328125, 9.294921875, 9.7265625, 10.158203125, 10.58984375, 11.021484375, 11.453125, 11.884765625, 12.31640625, 12.748046875, 13.1796875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 16.0, 47.0, 124.0, 280.0, 285.0, 138.0, 63.0, 22.0, 17.0, 6.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-395.7984619140625, -379.9058837890625, -364.0133361816406, -348.1207580566406, -332.2281799316406, -316.33563232421875, -300.44305419921875, -284.55047607421875, -268.65789794921875, -252.7653350830078, -236.8727569580078, -220.98019409179688, -205.08761596679688, -189.19505310058594, -173.302490234375, -157.409912109375, -141.51734924316406, -125.6247787475586, -109.73220825195312, -93.83964538574219, -77.94706726074219, -62.05450439453125, -46.16193389892578, -30.269363403320312, -14.376792907714844, 1.5157766342163086, 17.40834617614746, 33.3009147644043, 49.193485260009766, 65.08605194091797, 80.97862243652344, 96.8711929321289, 112.76376342773438, 128.6563262939453, 144.5489044189453, 160.44146728515625, 176.33404541015625, 192.2266082763672, 208.11917114257812, 224.01174926757812, 239.90432739257812, 255.79689025878906, 271.689453125, 287.58203125, 303.474609375, 319.3671875, 335.2597351074219, 351.1523132324219, 367.04486083984375, 382.93743896484375, 398.8299865722656, 414.7225646972656, 430.6151428222656, 446.5076904296875, 462.4002685546875, 478.2928466796875, 494.1854248046875, 510.0780029296875, 525.9705810546875, 541.8631591796875, 557.7556762695312, 573.6482543945312, 589.5408325195312, 605.4334106445312, 621.3259887695312]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 2.0, 7.0, 7.0, 11.0, 13.0, 13.0, 27.0, 23.0, 39.0, 50.0, 39.0, 60.0, 59.0, 52.0, 56.0, 59.0, 59.0, 57.0, 58.0, 64.0, 52.0, 30.0, 44.0, 30.0, 19.0, 20.0, 12.0, 14.0, 5.0, 6.0, 7.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-125.65234375, -121.87139892578125, -118.0904541015625, -114.30950164794922, -110.52855682373047, -106.74761199951172, -102.96665954589844, -99.18571472167969, -95.40476989746094, -91.62382507324219, -87.84288024902344, -84.06192779541016, -80.2809829711914, -76.50003814697266, -72.71908569335938, -68.93814086914062, -65.15719604492188, -61.376251220703125, -57.59530258178711, -53.814353942871094, -50.033409118652344, -46.252464294433594, -42.47151565551758, -38.69056701660156, -34.90962219238281, -31.12867546081543, -27.347728729248047, -23.566781997680664, -19.78583526611328, -16.0048885345459, -12.223941802978516, -8.442995071411133, -4.662055969238281, -0.8811092376708984, 2.8998374938964844, 6.680784225463867, 10.46173095703125, 14.242677688598633, 18.023624420166016, 21.8045711517334, 25.58551788330078, 29.366464614868164, 33.14741134643555, 36.92835998535156, 40.70930480957031, 44.49024963378906, 48.27119827270508, 52.052146911621094, 55.833091735839844, 59.614036560058594, 63.39498519897461, 67.17593383789062, 70.95687866210938, 74.73782348632812, 78.51876831054688, 82.29972076416016, 86.0806655883789, 89.86161041259766, 93.64256286621094, 97.42350769042969, 101.20445251464844, 104.98539733886719, 108.76634216308594, 112.54729461669922, 116.32823944091797]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 6.0, 3.0, 7.0, 5.0, 8.0, 9.0, 17.0, 18.0, 20.0, 22.0, 34.0, 52.0, 98.0, 140.0, 212.0, 394.0, 883.0, 2281.0, 7240.0, 31933.0, 219958.0, 664303.0, 95930.0, 17323.0, 4568.0, 1560.0, 645.0, 301.0, 182.0, 109.0, 79.0, 49.0, 30.0, 33.0, 22.0, 18.0, 16.0, 9.0, 13.0, 10.0, 4.0, 3.0, 2.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-51.5625, -50.10205078125, -48.6416015625, -47.18115234375, -45.720703125, -44.26025390625, -42.7998046875, -41.33935546875, -39.87890625, -38.41845703125, -36.9580078125, -35.49755859375, -34.037109375, -32.57666015625, -31.1162109375, -29.65576171875, -28.1953125, -26.73486328125, -25.2744140625, -23.81396484375, -22.353515625, -20.89306640625, -19.4326171875, -17.97216796875, -16.51171875, -15.05126953125, -13.5908203125, -12.13037109375, -10.669921875, -9.20947265625, -7.7490234375, -6.28857421875, -4.828125, -3.36767578125, -1.9072265625, -0.44677734375, 1.013671875, 2.47412109375, 3.9345703125, 5.39501953125, 6.85546875, 8.31591796875, 9.7763671875, 11.23681640625, 12.697265625, 14.15771484375, 15.6181640625, 17.07861328125, 18.5390625, 19.99951171875, 21.4599609375, 22.92041015625, 24.380859375, 25.84130859375, 27.3017578125, 28.76220703125, 30.22265625, 31.68310546875, 33.1435546875, 34.60400390625, 36.064453125, 37.52490234375, 38.9853515625, 40.44580078125, 41.90625]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 4.0, 4.0, 14.0, 20.0, 38.0, 62.0, 87.0, 124.0, 131.0, 126.0, 115.0, 104.0, 72.0, 33.0, 31.0, 19.0, 12.0, 7.0, 2.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.890625, -4.649169921875, -4.40771484375, -4.166259765625, -3.9248046875, -3.683349609375, -3.44189453125, -3.200439453125, -2.958984375, -2.717529296875, -2.47607421875, -2.234619140625, -1.9931640625, -1.751708984375, -1.51025390625, -1.268798828125, -1.02734375, -0.785888671875, -0.54443359375, -0.302978515625, -0.0615234375, 0.179931640625, 0.42138671875, 0.662841796875, 0.904296875, 1.145751953125, 1.38720703125, 1.628662109375, 1.8701171875, 2.111572265625, 2.35302734375, 2.594482421875, 2.8359375, 3.077392578125, 3.31884765625, 3.560302734375, 3.8017578125, 4.043212890625, 4.28466796875, 4.526123046875, 4.767578125, 5.009033203125, 5.25048828125, 5.491943359375, 5.7333984375, 5.974853515625, 6.21630859375, 6.457763671875, 6.69921875, 6.940673828125, 7.18212890625, 7.423583984375, 7.6650390625, 7.906494140625, 8.14794921875, 8.389404296875, 8.630859375, 8.872314453125, 9.11376953125, 9.355224609375, 9.5966796875, 9.838134765625, 10.07958984375, 10.321044921875, 10.5625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 11.0, 9.0, 11.0, 9.0, 13.0, 36.0, 50.0, 54.0, 85.0, 135.0, 213.0, 328.0, 568.0, 961.0, 1502.0, 2986.0, 5711.0, 11842.0, 27104.0, 72878.0, 246813.0, 451202.0, 142374.0, 46946.0, 18568.0, 8672.0, 4167.0, 2223.0, 1282.0, 705.0, 393.0, 251.0, 166.0, 92.0, 71.0, 43.0, 30.0, 18.0, 13.0, 4.0, 6.0, 5.0, 7.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-27.890625, -27.0771484375, -26.263671875, -25.4501953125, -24.63671875, -23.8232421875, -23.009765625, -22.1962890625, -21.3828125, -20.5693359375, -19.755859375, -18.9423828125, -18.12890625, -17.3154296875, -16.501953125, -15.6884765625, -14.875, -14.0615234375, -13.248046875, -12.4345703125, -11.62109375, -10.8076171875, -9.994140625, -9.1806640625, -8.3671875, -7.5537109375, -6.740234375, -5.9267578125, -5.11328125, -4.2998046875, -3.486328125, -2.6728515625, -1.859375, -1.0458984375, -0.232421875, 0.5810546875, 1.39453125, 2.2080078125, 3.021484375, 3.8349609375, 4.6484375, 5.4619140625, 6.275390625, 7.0888671875, 7.90234375, 8.7158203125, 9.529296875, 10.3427734375, 11.15625, 11.9697265625, 12.783203125, 13.5966796875, 14.41015625, 15.2236328125, 16.037109375, 16.8505859375, 17.6640625, 18.4775390625, 19.291015625, 20.1044921875, 20.91796875, 21.7314453125, 22.544921875, 23.3583984375, 24.171875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 7.0, 8.0, 8.0, 12.0, 12.0, 19.0, 22.0, 33.0, 42.0, 48.0, 34.0, 52.0, 49.0, 55.0, 55.0, 59.0, 46.0, 58.0, 66.0, 42.0, 60.0, 30.0, 29.0, 35.0, 18.0, 28.0, 20.0, 15.0, 12.0, 9.0, 7.0, 5.0, 4.0, 6.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.25, -22.402587890625, -21.55517578125, -20.707763671875, -19.8603515625, -19.012939453125, -18.16552734375, -17.318115234375, -16.470703125, -15.623291015625, -14.77587890625, -13.928466796875, -13.0810546875, -12.233642578125, -11.38623046875, -10.538818359375, -9.69140625, -8.843994140625, -7.99658203125, -7.149169921875, -6.3017578125, -5.454345703125, -4.60693359375, -3.759521484375, -2.912109375, -2.064697265625, -1.21728515625, -0.369873046875, 0.4775390625, 1.324951171875, 2.17236328125, 3.019775390625, 3.8671875, 4.714599609375, 5.56201171875, 6.409423828125, 7.2568359375, 8.104248046875, 8.95166015625, 9.799072265625, 10.646484375, 11.493896484375, 12.34130859375, 13.188720703125, 14.0361328125, 14.883544921875, 15.73095703125, 16.578369140625, 17.42578125, 18.273193359375, 19.12060546875, 19.968017578125, 20.8154296875, 21.662841796875, 22.51025390625, 23.357666015625, 24.205078125, 25.052490234375, 25.89990234375, 26.747314453125, 27.5947265625, 28.442138671875, 29.28955078125, 30.136962890625, 30.984375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0, 4.0, 5.0, 13.0, 4.0, 16.0, 21.0, 14.0, 30.0, 36.0, 66.0, 73.0, 118.0, 168.0, 364.0, 583.0, 1083.0, 2217.0, 4904.0, 12541.0, 40369.0, 183660.0, 563533.0, 177964.0, 39024.0, 12239.0, 4822.0, 2059.0, 1077.0, 587.0, 320.0, 219.0, 151.0, 96.0, 43.0, 33.0, 27.0, 13.0, 15.0, 8.0, 8.0, 7.0, 7.0, 5.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-25.109375, -24.359619140625, -23.60986328125, -22.860107421875, -22.1103515625, -21.360595703125, -20.61083984375, -19.861083984375, -19.111328125, -18.361572265625, -17.61181640625, -16.862060546875, -16.1123046875, -15.362548828125, -14.61279296875, -13.863037109375, -13.11328125, -12.363525390625, -11.61376953125, -10.864013671875, -10.1142578125, -9.364501953125, -8.61474609375, -7.864990234375, -7.115234375, -6.365478515625, -5.61572265625, -4.865966796875, -4.1162109375, -3.366455078125, -2.61669921875, -1.866943359375, -1.1171875, -0.367431640625, 0.38232421875, 1.132080078125, 1.8818359375, 2.631591796875, 3.38134765625, 4.131103515625, 4.880859375, 5.630615234375, 6.38037109375, 7.130126953125, 7.8798828125, 8.629638671875, 9.37939453125, 10.129150390625, 10.87890625, 11.628662109375, 12.37841796875, 13.128173828125, 13.8779296875, 14.627685546875, 15.37744140625, 16.127197265625, 16.876953125, 17.626708984375, 18.37646484375, 19.126220703125, 19.8759765625, 20.625732421875, 21.37548828125, 22.125244140625, 22.875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 5.0, 0.0, 1.0, 0.0, 2.0, 0.0, 6.0, 2.0, 7.0, 7.0, 10.0, 13.0, 10.0, 20.0, 23.0, 47.0, 40.0, 45.0, 63.0, 78.0, 88.0, 78.0, 91.0, 78.0, 73.0, 46.0, 40.0, 24.0, 26.0, 27.0, 12.0, 14.0, 10.0, 7.0, 9.0, 4.0, 5.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010595321655273438, -0.001018241047859192, -0.00097694993019104, -0.0009356588125228882, -0.0008943676948547363, -0.0008530765771865845, -0.0008117854595184326, -0.0007704943418502808, -0.0007292032241821289, -0.000687912106513977, -0.0006466209888458252, -0.0006053298711776733, -0.0005640387535095215, -0.0005227476358413696, -0.0004814565181732178, -0.0004401654005050659, -0.00039887428283691406, -0.0003575831651687622, -0.00031629204750061035, -0.0002750009298324585, -0.00023370981216430664, -0.00019241869449615479, -0.00015112757682800293, -0.00010983645915985107, -6.854534149169922e-05, -2.7254223823547363e-05, 1.4036893844604492e-05, 5.532801151275635e-05, 9.66191291809082e-05, 0.00013791024684906006, 0.00017920136451721191, 0.00022049248218536377, 0.0002617835998535156, 0.0003030747175216675, 0.00034436583518981934, 0.0003856569528579712, 0.00042694807052612305, 0.0004682391881942749, 0.0005095303058624268, 0.0005508214235305786, 0.0005921125411987305, 0.0006334036588668823, 0.0006746947765350342, 0.000715985894203186, 0.0007572770118713379, 0.0007985681295394897, 0.0008398592472076416, 0.0008811503648757935, 0.0009224414825439453, 0.0009637326002120972, 0.001005023717880249, 0.0010463148355484009, 0.0010876059532165527, 0.0011288970708847046, 0.0011701881885528564, 0.0012114793062210083, 0.0012527704238891602, 0.001294061541557312, 0.0013353526592254639, 0.0013766437768936157, 0.0014179348945617676, 0.0014592260122299194, 0.0015005171298980713, 0.0015418082475662231, 0.001583099365234375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 8.0, 9.0, 16.0, 14.0, 26.0, 37.0, 47.0, 82.0, 121.0, 219.0, 402.0, 708.0, 1374.0, 3218.0, 8486.0, 26476.0, 110768.0, 494135.0, 311670.0, 63025.0, 17089.0, 5687.0, 2442.0, 1121.0, 601.0, 304.0, 171.0, 111.0, 65.0, 39.0, 34.0, 22.0, 12.0, 8.0, 3.0, 5.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.03125, -22.307373046875, -21.58349609375, -20.859619140625, -20.1357421875, -19.411865234375, -18.68798828125, -17.964111328125, -17.240234375, -16.516357421875, -15.79248046875, -15.068603515625, -14.3447265625, -13.620849609375, -12.89697265625, -12.173095703125, -11.44921875, -10.725341796875, -10.00146484375, -9.277587890625, -8.5537109375, -7.829833984375, -7.10595703125, -6.382080078125, -5.658203125, -4.934326171875, -4.21044921875, -3.486572265625, -2.7626953125, -2.038818359375, -1.31494140625, -0.591064453125, 0.1328125, 0.856689453125, 1.58056640625, 2.304443359375, 3.0283203125, 3.752197265625, 4.47607421875, 5.199951171875, 5.923828125, 6.647705078125, 7.37158203125, 8.095458984375, 8.8193359375, 9.543212890625, 10.26708984375, 10.990966796875, 11.71484375, 12.438720703125, 13.16259765625, 13.886474609375, 14.6103515625, 15.334228515625, 16.05810546875, 16.781982421875, 17.505859375, 18.229736328125, 18.95361328125, 19.677490234375, 20.4013671875, 21.125244140625, 21.84912109375, 22.572998046875, 23.296875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 6.0, 4.0, 4.0, 8.0, 11.0, 10.0, 12.0, 19.0, 38.0, 33.0, 48.0, 68.0, 64.0, 57.0, 70.0, 65.0, 84.0, 81.0, 64.0, 50.0, 37.0, 39.0, 40.0, 32.0, 18.0, 10.0, 7.0, 5.0, 3.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.5390625, -9.2041015625, -8.869140625, -8.5341796875, -8.19921875, -7.8642578125, -7.529296875, -7.1943359375, -6.859375, -6.5244140625, -6.189453125, -5.8544921875, -5.51953125, -5.1845703125, -4.849609375, -4.5146484375, -4.1796875, -3.8447265625, -3.509765625, -3.1748046875, -2.83984375, -2.5048828125, -2.169921875, -1.8349609375, -1.5, -1.1650390625, -0.830078125, -0.4951171875, -0.16015625, 0.1748046875, 0.509765625, 0.8447265625, 1.1796875, 1.5146484375, 1.849609375, 2.1845703125, 2.51953125, 2.8544921875, 3.189453125, 3.5244140625, 3.859375, 4.1943359375, 4.529296875, 4.8642578125, 5.19921875, 5.5341796875, 5.869140625, 6.2041015625, 6.5390625, 6.8740234375, 7.208984375, 7.5439453125, 7.87890625, 8.2138671875, 8.548828125, 8.8837890625, 9.21875, 9.5537109375, 9.888671875, 10.2236328125, 10.55859375, 10.8935546875, 11.228515625, 11.5634765625, 11.8984375]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 8.0, 7.0, 7.0, 18.0, 40.0, 56.0, 141.0, 227.0, 227.0, 115.0, 68.0, 30.0, 20.0, 14.0, 3.0, 8.0, 2.0, 3.0, 5.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-205.4768829345703, -195.0966339111328, -184.71636962890625, -174.33612060546875, -163.9558563232422, -153.5756072998047, -143.19534301757812, -132.81509399414062, -122.4348373413086, -112.05458068847656, -101.67432403564453, -91.2940673828125, -80.913818359375, -70.53355407714844, -60.15330505371094, -49.773048400878906, -39.392791748046875, -29.012535095214844, -18.632280349731445, -8.252025604248047, 2.1282310485839844, 12.508487701416016, 22.88874053955078, 33.26899719238281, 43.649253845214844, 54.029510498046875, 64.4097671508789, 74.79002380371094, 85.17027282714844, 95.550537109375, 105.9307861328125, 116.31104278564453, 126.69131469726562, 137.07156372070312, 147.4518280029297, 157.8320770263672, 168.21234130859375, 178.59259033203125, 188.97283935546875, 199.3531036376953, 209.73336791992188, 220.11361694335938, 230.49388122558594, 240.87413024902344, 251.25439453125, 261.6346435546875, 272.014892578125, 282.3951416015625, 292.775390625, 303.1556396484375, 313.535888671875, 323.9161682128906, 334.2964172363281, 344.6766662597656, 355.0569152832031, 365.43719482421875, 375.81744384765625, 386.19769287109375, 396.57794189453125, 406.9582214355469, 417.3384704589844, 427.7187194824219, 438.0989685058594, 448.479248046875, 458.8594970703125]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 8.0, 6.0, 7.0, 8.0, 17.0, 18.0, 56.0, 69.0, 119.0, 139.0, 174.0, 134.0, 97.0, 41.0, 30.0, 23.0, 16.0, 12.0, 5.0, 8.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-405.77960205078125, -393.95550537109375, -382.13140869140625, -370.30731201171875, -358.48321533203125, -346.65911865234375, -334.83502197265625, -323.01092529296875, -311.18682861328125, -299.36273193359375, -287.53863525390625, -275.71453857421875, -263.89044189453125, -252.06634521484375, -240.2422637939453, -228.4181671142578, -216.59408569335938, -204.76998901367188, -192.94589233398438, -181.12179565429688, -169.29769897460938, -157.47360229492188, -145.64952087402344, -133.82542419433594, -122.00132751464844, -110.17723083496094, -98.35313415527344, -86.52904510498047, -74.70494842529297, -62.88085174560547, -51.0567626953125, -39.232666015625, -27.4085693359375, -15.584474563598633, -3.7603797912597656, 8.063713073730469, 19.88780975341797, 31.71190643310547, 43.53599548339844, 55.36009216308594, 67.18418884277344, 79.00828552246094, 90.83238220214844, 102.6564712524414, 114.4805679321289, 126.3046646118164, 138.12875366210938, 149.95285034179688, 161.77694702148438, 173.60104370117188, 185.42514038085938, 197.24923706054688, 209.07333374023438, 220.89743041992188, 232.7215118408203, 244.5456085205078, 256.36968994140625, 268.19378662109375, 280.01788330078125, 291.84197998046875, 303.66607666015625, 315.49017333984375, 327.31427001953125, 339.13836669921875, 350.96246337890625]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 2.0, 9.0, 13.0, 13.0, 21.0, 36.0, 62.0, 94.0, 146.0, 232.0, 452.0, 849.0, 1666.0, 3657.0, 9032.0, 29492.0, 165049.0, 3784712.0, 155120.0, 27674.0, 8902.0, 3492.0, 1623.0, 826.0, 422.0, 261.0, 155.0, 88.0, 70.0, 39.0, 18.0, 11.0, 11.0, 8.0, 10.0, 8.0, 4.0, 1.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-108.5625, -104.4638671875, -100.365234375, -96.2666015625, -92.16796875, -88.0693359375, -83.970703125, -79.8720703125, -75.7734375, -71.6748046875, -67.576171875, -63.4775390625, -59.37890625, -55.2802734375, -51.181640625, -47.0830078125, -42.984375, -38.8857421875, -34.787109375, -30.6884765625, -26.58984375, -22.4912109375, -18.392578125, -14.2939453125, -10.1953125, -6.0966796875, -1.998046875, 2.1005859375, 6.19921875, 10.2978515625, 14.396484375, 18.4951171875, 22.59375, 26.6923828125, 30.791015625, 34.8896484375, 38.98828125, 43.0869140625, 47.185546875, 51.2841796875, 55.3828125, 59.4814453125, 63.580078125, 67.6787109375, 71.77734375, 75.8759765625, 79.974609375, 84.0732421875, 88.171875, 92.2705078125, 96.369140625, 100.4677734375, 104.56640625, 108.6650390625, 112.763671875, 116.8623046875, 120.9609375, 125.0595703125, 129.158203125, 133.2568359375, 137.35546875, 141.4541015625, 145.552734375, 149.6513671875, 153.75]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 6.0, 9.0, 8.0, 12.0, 17.0, 37.0, 24.0, 51.0, 68.0, 63.0, 72.0, 79.0, 82.0, 75.0, 81.0, 75.0, 65.0, 43.0, 38.0, 24.0, 19.0, 17.0, 8.0, 7.0, 7.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.12109375, -4.96856689453125, -4.8160400390625, -4.66351318359375, -4.510986328125, -4.35845947265625, -4.2059326171875, -4.05340576171875, -3.90087890625, -3.74835205078125, -3.5958251953125, -3.44329833984375, -3.290771484375, -3.13824462890625, -2.9857177734375, -2.83319091796875, -2.6806640625, -2.52813720703125, -2.3756103515625, -2.22308349609375, -2.070556640625, -1.91802978515625, -1.7655029296875, -1.61297607421875, -1.46044921875, -1.30792236328125, -1.1553955078125, -1.00286865234375, -0.850341796875, -0.69781494140625, -0.5452880859375, -0.39276123046875, -0.240234375, -0.08770751953125, 0.0648193359375, 0.21734619140625, 0.369873046875, 0.52239990234375, 0.6749267578125, 0.82745361328125, 0.97998046875, 1.13250732421875, 1.2850341796875, 1.43756103515625, 1.590087890625, 1.74261474609375, 1.8951416015625, 2.04766845703125, 2.2001953125, 2.35272216796875, 2.5052490234375, 2.65777587890625, 2.810302734375, 2.96282958984375, 3.1153564453125, 3.26788330078125, 3.42041015625, 3.57293701171875, 3.7254638671875, 3.87799072265625, 4.030517578125, 4.18304443359375, 4.3355712890625, 4.48809814453125, 4.640625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 9.0, 4.0, 9.0, 6.0, 17.0, 21.0, 30.0, 36.0, 70.0, 82.0, 110.0, 161.0, 278.0, 457.0, 683.0, 1169.0, 2094.0, 3751.0, 7322.0, 14622.0, 31833.0, 78664.0, 261681.0, 3023380.0, 557711.0, 123569.0, 45608.0, 19946.0, 9664.0, 5020.0, 2636.0, 1472.0, 868.0, 471.0, 305.0, 183.0, 100.0, 79.0, 52.0, 44.0, 28.0, 15.0, 12.0, 4.0, 7.0, 3.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-79.625, -77.3310546875, -75.037109375, -72.7431640625, -70.44921875, -68.1552734375, -65.861328125, -63.5673828125, -61.2734375, -58.9794921875, -56.685546875, -54.3916015625, -52.09765625, -49.8037109375, -47.509765625, -45.2158203125, -42.921875, -40.6279296875, -38.333984375, -36.0400390625, -33.74609375, -31.4521484375, -29.158203125, -26.8642578125, -24.5703125, -22.2763671875, -19.982421875, -17.6884765625, -15.39453125, -13.1005859375, -10.806640625, -8.5126953125, -6.21875, -3.9248046875, -1.630859375, 0.6630859375, 2.95703125, 5.2509765625, 7.544921875, 9.8388671875, 12.1328125, 14.4267578125, 16.720703125, 19.0146484375, 21.30859375, 23.6025390625, 25.896484375, 28.1904296875, 30.484375, 32.7783203125, 35.072265625, 37.3662109375, 39.66015625, 41.9541015625, 44.248046875, 46.5419921875, 48.8359375, 51.1298828125, 53.423828125, 55.7177734375, 58.01171875, 60.3056640625, 62.599609375, 64.8935546875, 67.1875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 7.0, 9.0, 6.0, 8.0, 4.0, 12.0, 18.0, 24.0, 28.0, 30.0, 38.0, 46.0, 86.0, 104.0, 143.0, 219.0, 506.0, 1686.0, 388.0, 194.0, 144.0, 88.0, 65.0, 59.0, 31.0, 34.0, 27.0, 22.0, 11.0, 13.0, 9.0, 6.0, 1.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.84375, -12.45849609375, -12.0732421875, -11.68798828125, -11.302734375, -10.91748046875, -10.5322265625, -10.14697265625, -9.76171875, -9.37646484375, -8.9912109375, -8.60595703125, -8.220703125, -7.83544921875, -7.4501953125, -7.06494140625, -6.6796875, -6.29443359375, -5.9091796875, -5.52392578125, -5.138671875, -4.75341796875, -4.3681640625, -3.98291015625, -3.59765625, -3.21240234375, -2.8271484375, -2.44189453125, -2.056640625, -1.67138671875, -1.2861328125, -0.90087890625, -0.515625, -0.13037109375, 0.2548828125, 0.64013671875, 1.025390625, 1.41064453125, 1.7958984375, 2.18115234375, 2.56640625, 2.95166015625, 3.3369140625, 3.72216796875, 4.107421875, 4.49267578125, 4.8779296875, 5.26318359375, 5.6484375, 6.03369140625, 6.4189453125, 6.80419921875, 7.189453125, 7.57470703125, 7.9599609375, 8.34521484375, 8.73046875, 9.11572265625, 9.5009765625, 9.88623046875, 10.271484375, 10.65673828125, 11.0419921875, 11.42724609375, 11.8125]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 0.0, 0.0, 2.0, 6.0, 7.0, 15.0, 38.0, 74.0, 153.0, 175.0, 241.0, 161.0, 82.0, 27.0, 14.0, 7.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-146.32127380371094, -141.4709930419922, -136.62069702148438, -131.77041625976562, -126.92013549804688, -122.06985473632812, -117.21956634521484, -112.36927795410156, -107.51899719238281, -102.66871643066406, -97.81842803955078, -92.9681396484375, -88.11785888671875, -83.267578125, -78.41728973388672, -73.56700134277344, -68.71672058105469, -63.86643600463867, -59.016151428222656, -54.16586685180664, -49.315582275390625, -44.46529769897461, -39.615013122558594, -34.76472854614258, -29.914443969726562, -25.064159393310547, -20.21387481689453, -15.363590240478516, -10.5133056640625, -5.663021087646484, -0.8127365112304688, 4.037548065185547, 8.8878173828125, 13.738101959228516, 18.58838653564453, 23.438671112060547, 28.288955688476562, 33.13924026489258, 37.989524841308594, 42.83980941772461, 47.690093994140625, 52.54037857055664, 57.390663146972656, 62.24094772338867, 67.09123229980469, 71.94151306152344, 76.79180145263672, 81.64208984375, 86.49237060546875, 91.3426513671875, 96.19293975830078, 101.04322814941406, 105.89350891113281, 110.74378967285156, 115.59407806396484, 120.44436645507812, 125.29464721679688, 130.14492797851562, 134.99520874023438, 139.8455047607422, 144.69578552246094, 149.5460662841797, 154.3963623046875, 159.24664306640625, 164.096923828125]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 6.0, 6.0, 7.0, 5.0, 11.0, 13.0, 15.0, 26.0, 27.0, 36.0, 47.0, 50.0, 70.0, 49.0, 80.0, 72.0, 79.0, 47.0, 71.0, 44.0, 46.0, 38.0, 38.0, 34.0, 22.0, 16.0, 22.0, 10.0, 9.0, 5.0, 7.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-78.88868713378906, -76.93315887451172, -74.9776382446289, -73.02210998535156, -71.06658172607422, -69.11105346679688, -67.15553283691406, -65.20000457763672, -63.244476318359375, -61.2889518737793, -59.33342361450195, -57.377899169921875, -55.42237091064453, -53.46684646606445, -51.511322021484375, -49.55579376220703, -47.60026931762695, -45.644744873046875, -43.68921661376953, -41.73369216918945, -39.77816390991211, -37.82263946533203, -35.86711120605469, -33.91158676147461, -31.9560604095459, -30.000534057617188, -28.045007705688477, -26.089481353759766, -24.133956909179688, -22.178428649902344, -20.222904205322266, -18.267377853393555, -16.311851501464844, -14.356325149536133, -12.400798797607422, -10.445273399353027, -8.489747047424316, -6.5342206954956055, -4.578695297241211, -2.6231689453125, -0.6676425933837891, 1.2878835201263428, 3.2434096336364746, 5.198935508728027, 7.154461860656738, 9.10998821258545, 11.065513610839844, 13.021039962768555, 14.976566314697266, 16.932092666625977, 18.887619018554688, 20.843143463134766, 22.79867172241211, 24.754196166992188, 26.7097225189209, 28.66524887084961, 30.62077522277832, 32.57630157470703, 34.53182601928711, 36.48735427856445, 38.44287872314453, 40.398406982421875, 42.35393142700195, 44.30945587158203, 46.264984130859375]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 8.0, 4.0, 7.0, 9.0, 12.0, 16.0, 36.0, 24.0, 56.0, 94.0, 147.0, 239.0, 551.0, 1480.0, 4683.0, 21491.0, 229595.0, 719825.0, 57255.0, 8920.0, 2364.0, 867.0, 358.0, 184.0, 101.0, 69.0, 51.0, 31.0, 14.0, 13.0, 14.0, 10.0, 1.0, 8.0, 6.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-100.5625, -97.123046875, -93.68359375, -90.244140625, -86.8046875, -83.365234375, -79.92578125, -76.486328125, -73.046875, -69.607421875, -66.16796875, -62.728515625, -59.2890625, -55.849609375, -52.41015625, -48.970703125, -45.53125, -42.091796875, -38.65234375, -35.212890625, -31.7734375, -28.333984375, -24.89453125, -21.455078125, -18.015625, -14.576171875, -11.13671875, -7.697265625, -4.2578125, -0.818359375, 2.62109375, 6.060546875, 9.5, 12.939453125, 16.37890625, 19.818359375, 23.2578125, 26.697265625, 30.13671875, 33.576171875, 37.015625, 40.455078125, 43.89453125, 47.333984375, 50.7734375, 54.212890625, 57.65234375, 61.091796875, 64.53125, 67.970703125, 71.41015625, 74.849609375, 78.2890625, 81.728515625, 85.16796875, 88.607421875, 92.046875, 95.486328125, 98.92578125, 102.365234375, 105.8046875, 109.244140625, 112.68359375, 116.123046875, 119.5625]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 10.0, 14.0, 20.0, 30.0, 54.0, 96.0, 113.0, 124.0, 121.0, 126.0, 95.0, 81.0, 52.0, 37.0, 14.0, 8.0, 8.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-13.8125, -13.53778076171875, -13.2630615234375, -12.98834228515625, -12.713623046875, -12.43890380859375, -12.1641845703125, -11.88946533203125, -11.61474609375, -11.34002685546875, -11.0653076171875, -10.79058837890625, -10.515869140625, -10.24114990234375, -9.9664306640625, -9.69171142578125, -9.4169921875, -9.14227294921875, -8.8675537109375, -8.59283447265625, -8.318115234375, -8.04339599609375, -7.7686767578125, -7.49395751953125, -7.21923828125, -6.94451904296875, -6.6697998046875, -6.39508056640625, -6.120361328125, -5.84564208984375, -5.5709228515625, -5.29620361328125, -5.021484375, -4.74676513671875, -4.4720458984375, -4.19732666015625, -3.922607421875, -3.64788818359375, -3.3731689453125, -3.09844970703125, -2.82373046875, -2.54901123046875, -2.2742919921875, -1.99957275390625, -1.724853515625, -1.45013427734375, -1.1754150390625, -0.90069580078125, -0.6259765625, -0.35125732421875, -0.0765380859375, 0.19818115234375, 0.472900390625, 0.74761962890625, 1.0223388671875, 1.29705810546875, 1.57177734375, 1.84649658203125, 2.1212158203125, 2.39593505859375, 2.670654296875, 2.94537353515625, 3.2200927734375, 3.49481201171875, 3.76953125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 5.0, 2.0, 14.0, 11.0, 20.0, 27.0, 51.0, 81.0, 133.0, 234.0, 448.0, 792.0, 1547.0, 3252.0, 7497.0, 19305.0, 60427.0, 262051.0, 503816.0, 129967.0, 35976.0, 12751.0, 5194.0, 2460.0, 1160.0, 546.0, 328.0, 176.0, 108.0, 51.0, 41.0, 32.0, 10.0, 11.0, 8.0, 9.0, 2.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-44.4375, -43.0166015625, -41.595703125, -40.1748046875, -38.75390625, -37.3330078125, -35.912109375, -34.4912109375, -33.0703125, -31.6494140625, -30.228515625, -28.8076171875, -27.38671875, -25.9658203125, -24.544921875, -23.1240234375, -21.703125, -20.2822265625, -18.861328125, -17.4404296875, -16.01953125, -14.5986328125, -13.177734375, -11.7568359375, -10.3359375, -8.9150390625, -7.494140625, -6.0732421875, -4.65234375, -3.2314453125, -1.810546875, -0.3896484375, 1.03125, 2.4521484375, 3.873046875, 5.2939453125, 6.71484375, 8.1357421875, 9.556640625, 10.9775390625, 12.3984375, 13.8193359375, 15.240234375, 16.6611328125, 18.08203125, 19.5029296875, 20.923828125, 22.3447265625, 23.765625, 25.1865234375, 26.607421875, 28.0283203125, 29.44921875, 30.8701171875, 32.291015625, 33.7119140625, 35.1328125, 36.5537109375, 37.974609375, 39.3955078125, 40.81640625, 42.2373046875, 43.658203125, 45.0791015625, 46.5]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 5.0, 11.0, 19.0, 9.0, 21.0, 24.0, 38.0, 29.0, 38.0, 47.0, 44.0, 48.0, 52.0, 48.0, 72.0, 53.0, 55.0, 50.0, 45.0, 61.0, 35.0, 32.0, 35.0, 23.0, 22.0, 22.0, 15.0, 8.0, 8.0, 8.0, 7.0, 4.0, 5.0, 4.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.921875, -23.25, -22.578125, -21.90625, -21.234375, -20.5625, -19.890625, -19.21875, -18.546875, -17.875, -17.203125, -16.53125, -15.859375, -15.1875, -14.515625, -13.84375, -13.171875, -12.5, -11.828125, -11.15625, -10.484375, -9.8125, -9.140625, -8.46875, -7.796875, -7.125, -6.453125, -5.78125, -5.109375, -4.4375, -3.765625, -3.09375, -2.421875, -1.75, -1.078125, -0.40625, 0.265625, 0.9375, 1.609375, 2.28125, 2.953125, 3.625, 4.296875, 4.96875, 5.640625, 6.3125, 6.984375, 7.65625, 8.328125, 9.0, 9.671875, 10.34375, 11.015625, 11.6875, 12.359375, 13.03125, 13.703125, 14.375, 15.046875, 15.71875, 16.390625, 17.0625, 17.734375, 18.40625, 19.078125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 7.0, 5.0, 12.0, 16.0, 12.0, 22.0, 37.0, 52.0, 63.0, 106.0, 169.0, 228.0, 409.0, 568.0, 977.0, 1706.0, 3320.0, 6286.0, 12852.0, 28253.0, 67327.0, 166395.0, 327169.0, 247656.0, 104060.0, 42785.0, 18903.0, 8772.0, 4510.0, 2382.0, 1391.0, 787.0, 440.0, 277.0, 195.0, 114.0, 99.0, 48.0, 45.0, 27.0, 19.0, 13.0, 14.0, 14.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-28.296875, -27.482421875, -26.66796875, -25.853515625, -25.0390625, -24.224609375, -23.41015625, -22.595703125, -21.78125, -20.966796875, -20.15234375, -19.337890625, -18.5234375, -17.708984375, -16.89453125, -16.080078125, -15.265625, -14.451171875, -13.63671875, -12.822265625, -12.0078125, -11.193359375, -10.37890625, -9.564453125, -8.75, -7.935546875, -7.12109375, -6.306640625, -5.4921875, -4.677734375, -3.86328125, -3.048828125, -2.234375, -1.419921875, -0.60546875, 0.208984375, 1.0234375, 1.837890625, 2.65234375, 3.466796875, 4.28125, 5.095703125, 5.91015625, 6.724609375, 7.5390625, 8.353515625, 9.16796875, 9.982421875, 10.796875, 11.611328125, 12.42578125, 13.240234375, 14.0546875, 14.869140625, 15.68359375, 16.498046875, 17.3125, 18.126953125, 18.94140625, 19.755859375, 20.5703125, 21.384765625, 22.19921875, 23.013671875, 23.828125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 4.0, 2.0, 2.0, 7.0, 6.0, 13.0, 10.0, 19.0, 18.0, 30.0, 57.0, 62.0, 81.0, 113.0, 101.0, 103.0, 117.0, 62.0, 55.0, 44.0, 21.0, 20.0, 8.0, 4.0, 13.0, 4.0, 3.0, 3.0, 4.0, 2.0, 3.0, 4.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0022125244140625, -0.0021327435970306396, -0.0020529627799987793, -0.001973181962966919, -0.0018934011459350586, -0.0018136203289031982, -0.0017338395118713379, -0.0016540586948394775, -0.0015742778778076172, -0.0014944970607757568, -0.0014147162437438965, -0.0013349354267120361, -0.0012551546096801758, -0.0011753737926483154, -0.001095592975616455, -0.0010158121585845947, -0.0009360313415527344, -0.000856250524520874, -0.0007764697074890137, -0.0006966888904571533, -0.000616908073425293, -0.0005371272563934326, -0.00045734643936157227, -0.0003775656223297119, -0.00029778480529785156, -0.0002180039882659912, -0.00013822317123413086, -5.844235420227051e-05, 2.1338462829589844e-05, 0.0001011192798614502, 0.00018090009689331055, 0.0002606809139251709, 0.00034046173095703125, 0.0004202425479888916, 0.000500023365020752, 0.0005798041820526123, 0.0006595849990844727, 0.000739365816116333, 0.0008191466331481934, 0.0008989274501800537, 0.000978708267211914, 0.0010584890842437744, 0.0011382699012756348, 0.0012180507183074951, 0.0012978315353393555, 0.0013776123523712158, 0.0014573931694030762, 0.0015371739864349365, 0.0016169548034667969, 0.0016967356204986572, 0.0017765164375305176, 0.001856297254562378, 0.0019360780715942383, 0.0020158588886260986, 0.002095639705657959, 0.0021754205226898193, 0.0022552013397216797, 0.00233498215675354, 0.0024147629737854004, 0.0024945437908172607, 0.002574324607849121, 0.0026541054248809814, 0.002733886241912842, 0.002813667058944702, 0.0028934478759765625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 7.0, 4.0, 8.0, 18.0, 18.0, 26.0, 28.0, 32.0, 70.0, 145.0, 188.0, 287.0, 522.0, 984.0, 1990.0, 4013.0, 9315.0, 23482.0, 66652.0, 204381.0, 400655.0, 219737.0, 72051.0, 24893.0, 10016.0, 4440.0, 2083.0, 1018.0, 620.0, 307.0, 189.0, 142.0, 68.0, 47.0, 29.0, 19.0, 18.0, 15.0, 8.0, 6.0, 12.0, 2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-33.21875, -32.19775390625, -31.1767578125, -30.15576171875, -29.134765625, -28.11376953125, -27.0927734375, -26.07177734375, -25.05078125, -24.02978515625, -23.0087890625, -21.98779296875, -20.966796875, -19.94580078125, -18.9248046875, -17.90380859375, -16.8828125, -15.86181640625, -14.8408203125, -13.81982421875, -12.798828125, -11.77783203125, -10.7568359375, -9.73583984375, -8.71484375, -7.69384765625, -6.6728515625, -5.65185546875, -4.630859375, -3.60986328125, -2.5888671875, -1.56787109375, -0.546875, 0.47412109375, 1.4951171875, 2.51611328125, 3.537109375, 4.55810546875, 5.5791015625, 6.60009765625, 7.62109375, 8.64208984375, 9.6630859375, 10.68408203125, 11.705078125, 12.72607421875, 13.7470703125, 14.76806640625, 15.7890625, 16.81005859375, 17.8310546875, 18.85205078125, 19.873046875, 20.89404296875, 21.9150390625, 22.93603515625, 23.95703125, 24.97802734375, 25.9990234375, 27.02001953125, 28.041015625, 29.06201171875, 30.0830078125, 31.10400390625, 32.125]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 3.0, 4.0, 6.0, 2.0, 8.0, 12.0, 9.0, 16.0, 26.0, 34.0, 23.0, 44.0, 46.0, 51.0, 52.0, 56.0, 67.0, 77.0, 72.0, 88.0, 49.0, 52.0, 39.0, 35.0, 26.0, 20.0, 17.0, 13.0, 15.0, 10.0, 4.0, 8.0, 5.0, 2.0, 6.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-13.4765625, -13.0728759765625, -12.669189453125, -12.2655029296875, -11.86181640625, -11.4581298828125, -11.054443359375, -10.6507568359375, -10.2470703125, -9.8433837890625, -9.439697265625, -9.0360107421875, -8.63232421875, -8.2286376953125, -7.824951171875, -7.4212646484375, -7.017578125, -6.6138916015625, -6.210205078125, -5.8065185546875, -5.40283203125, -4.9991455078125, -4.595458984375, -4.1917724609375, -3.7880859375, -3.3843994140625, -2.980712890625, -2.5770263671875, -2.17333984375, -1.7696533203125, -1.365966796875, -0.9622802734375, -0.55859375, -0.1549072265625, 0.248779296875, 0.6524658203125, 1.05615234375, 1.4598388671875, 1.863525390625, 2.2672119140625, 2.6708984375, 3.0745849609375, 3.478271484375, 3.8819580078125, 4.28564453125, 4.6893310546875, 5.093017578125, 5.4967041015625, 5.900390625, 6.3040771484375, 6.707763671875, 7.1114501953125, 7.51513671875, 7.9188232421875, 8.322509765625, 8.7261962890625, 9.1298828125, 9.5335693359375, 9.937255859375, 10.3409423828125, 10.74462890625, 11.1483154296875, 11.552001953125, 11.9556884765625, 12.359375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 1.0, 5.0, 2.0, 6.0, 7.0, 18.0, 23.0, 30.0, 43.0, 67.0, 110.0, 122.0, 126.0, 118.0, 106.0, 80.0, 38.0, 24.0, 21.0, 20.0, 10.0, 8.0, 7.0, 1.0, 1.0, 0.0, 0.0, 5.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-189.30255126953125, -182.3919219970703, -175.48130798339844, -168.5706787109375, -161.66004943847656, -154.74942016601562, -147.83880615234375, -140.9281768798828, -134.01754760742188, -127.10692596435547, -120.19629669189453, -113.28567504882812, -106.37504577636719, -99.46442413330078, -92.55380249023438, -85.64317321777344, -78.73255157470703, -71.82192993164062, -64.91130065917969, -58.00067901611328, -51.090049743652344, -44.17942810058594, -37.268802642822266, -30.358177185058594, -23.447551727294922, -16.53692626953125, -9.626301765441895, -2.715677261352539, 4.194948196411133, 11.105571746826172, 18.016197204589844, 24.926822662353516, 31.837448120117188, 38.74807357788086, 45.65869903564453, 52.56932067871094, 59.479949951171875, 66.39057159423828, 73.30119323730469, 80.21182250976562, 87.12245178222656, 94.03307342529297, 100.9437026977539, 107.85432434082031, 114.76495361328125, 121.67557525634766, 128.58619689941406, 135.496826171875, 142.40744018554688, 149.3180694580078, 156.2286834716797, 163.13931274414062, 170.04994201660156, 176.9605712890625, 183.87118530273438, 190.7818145751953, 197.69244384765625, 204.6030731201172, 211.51368713378906, 218.42431640625, 225.33494567871094, 232.24557495117188, 239.15618896484375, 246.0668182373047, 252.97744750976562]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 7.0, 7.0, 6.0, 12.0, 8.0, 22.0, 21.0, 30.0, 26.0, 45.0, 51.0, 55.0, 61.0, 70.0, 77.0, 85.0, 49.0, 62.0, 58.0, 59.0, 37.0, 37.0, 32.0, 13.0, 21.0, 15.0, 13.0, 6.0, 9.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-164.29312133789062, -159.32205200195312, -154.35098266601562, -149.37991333007812, -144.40882873535156, -139.43775939941406, -134.46669006347656, -129.49562072753906, -124.52455139160156, -119.55348205566406, -114.58240509033203, -109.61133575439453, -104.64026641845703, -99.669189453125, -94.6981201171875, -89.72705078125, -84.75597381591797, -79.78490447998047, -74.81382751464844, -69.84275817871094, -64.87168884277344, -59.90061569213867, -54.929542541503906, -49.958473205566406, -44.98740005493164, -40.016326904296875, -35.045257568359375, -30.07418441772461, -25.103113174438477, -20.132041931152344, -15.160968780517578, -10.189899444580078, -5.2188262939453125, -0.24775457382202148, 4.7233171463012695, 9.694389343261719, 14.665460586547852, 19.636531829833984, 24.60760498046875, 29.57867431640625, 34.549747467041016, 39.52082061767578, 44.49188995361328, 49.46296310424805, 54.43403625488281, 59.40510559082031, 64.37617492675781, 69.34724426269531, 74.31832122802734, 79.28939056396484, 84.26046752929688, 89.23153686523438, 94.20260620117188, 99.17367553710938, 104.1447525024414, 109.1158218383789, 114.08689880371094, 119.05796813964844, 124.02904510498047, 129.0001220703125, 133.97119140625, 138.9422607421875, 143.913330078125, 148.8843994140625, 153.85546875]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 4.0, 6.0, 11.0, 12.0, 18.0, 12.0, 22.0, 25.0, 32.0, 57.0, 90.0, 145.0, 298.0, 476.0, 1134.0, 2666.0, 7890.0, 28807.0, 175520.0, 3787183.0, 151580.0, 26788.0, 7202.0, 2429.0, 979.0, 429.0, 224.0, 93.0, 59.0, 38.0, 21.0, 14.0, 12.0, 8.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-217.875, -211.900390625, -205.92578125, -199.951171875, -193.9765625, -188.001953125, -182.02734375, -176.052734375, -170.078125, -164.103515625, -158.12890625, -152.154296875, -146.1796875, -140.205078125, -134.23046875, -128.255859375, -122.28125, -116.306640625, -110.33203125, -104.357421875, -98.3828125, -92.408203125, -86.43359375, -80.458984375, -74.484375, -68.509765625, -62.53515625, -56.560546875, -50.5859375, -44.611328125, -38.63671875, -32.662109375, -26.6875, -20.712890625, -14.73828125, -8.763671875, -2.7890625, 3.185546875, 9.16015625, 15.134765625, 21.109375, 27.083984375, 33.05859375, 39.033203125, 45.0078125, 50.982421875, 56.95703125, 62.931640625, 68.90625, 74.880859375, 80.85546875, 86.830078125, 92.8046875, 98.779296875, 104.75390625, 110.728515625, 116.703125, 122.677734375, 128.65234375, 134.626953125, 140.6015625, 146.576171875, 152.55078125, 158.525390625, 164.5]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 7.0, 15.0, 10.0, 22.0, 20.0, 36.0, 41.0, 56.0, 71.0, 95.0, 78.0, 80.0, 72.0, 92.0, 66.0, 66.0, 49.0, 40.0, 35.0, 19.0, 23.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.66015625, -7.47119140625, -7.2822265625, -7.09326171875, -6.904296875, -6.71533203125, -6.5263671875, -6.33740234375, -6.1484375, -5.95947265625, -5.7705078125, -5.58154296875, -5.392578125, -5.20361328125, -5.0146484375, -4.82568359375, -4.63671875, -4.44775390625, -4.2587890625, -4.06982421875, -3.880859375, -3.69189453125, -3.5029296875, -3.31396484375, -3.125, -2.93603515625, -2.7470703125, -2.55810546875, -2.369140625, -2.18017578125, -1.9912109375, -1.80224609375, -1.61328125, -1.42431640625, -1.2353515625, -1.04638671875, -0.857421875, -0.66845703125, -0.4794921875, -0.29052734375, -0.1015625, 0.08740234375, 0.2763671875, 0.46533203125, 0.654296875, 0.84326171875, 1.0322265625, 1.22119140625, 1.41015625, 1.59912109375, 1.7880859375, 1.97705078125, 2.166015625, 2.35498046875, 2.5439453125, 2.73291015625, 2.921875, 3.11083984375, 3.2998046875, 3.48876953125, 3.677734375, 3.86669921875, 4.0556640625, 4.24462890625, 4.43359375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 2.0, 3.0, 7.0, 6.0, 17.0, 17.0, 23.0, 31.0, 35.0, 71.0, 113.0, 244.0, 461.0, 1527.0, 8387.0, 85562.0, 3874086.0, 205582.0, 14554.0, 2261.0, 649.0, 255.0, 141.0, 82.0, 54.0, 29.0, 19.0, 18.0, 17.0, 6.0, 6.0, 5.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-382.25, -371.81640625, -361.3828125, -350.94921875, -340.515625, -330.08203125, -319.6484375, -309.21484375, -298.78125, -288.34765625, -277.9140625, -267.48046875, -257.046875, -246.61328125, -236.1796875, -225.74609375, -215.3125, -204.87890625, -194.4453125, -184.01171875, -173.578125, -163.14453125, -152.7109375, -142.27734375, -131.84375, -121.41015625, -110.9765625, -100.54296875, -90.109375, -79.67578125, -69.2421875, -58.80859375, -48.375, -37.94140625, -27.5078125, -17.07421875, -6.640625, 3.79296875, 14.2265625, 24.66015625, 35.09375, 45.52734375, 55.9609375, 66.39453125, 76.828125, 87.26171875, 97.6953125, 108.12890625, 118.5625, 128.99609375, 139.4296875, 149.86328125, 160.296875, 170.73046875, 181.1640625, 191.59765625, 202.03125, 212.46484375, 222.8984375, 233.33203125, 243.765625, 254.19921875, 264.6328125, 275.06640625, 285.5]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 6.0, 8.0, 4.0, 7.0, 12.0, 23.0, 22.0, 43.0, 40.0, 65.0, 82.0, 125.0, 181.0, 389.0, 1777.0, 537.0, 243.0, 132.0, 98.0, 62.0, 66.0, 39.0, 28.0, 20.0, 21.0, 10.0, 12.0, 3.0, 8.0, 3.0, 7.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.75, -13.192626953125, -12.63525390625, -12.077880859375, -11.5205078125, -10.963134765625, -10.40576171875, -9.848388671875, -9.291015625, -8.733642578125, -8.17626953125, -7.618896484375, -7.0615234375, -6.504150390625, -5.94677734375, -5.389404296875, -4.83203125, -4.274658203125, -3.71728515625, -3.159912109375, -2.6025390625, -2.045166015625, -1.48779296875, -0.930419921875, -0.373046875, 0.184326171875, 0.74169921875, 1.299072265625, 1.8564453125, 2.413818359375, 2.97119140625, 3.528564453125, 4.0859375, 4.643310546875, 5.20068359375, 5.758056640625, 6.3154296875, 6.872802734375, 7.43017578125, 7.987548828125, 8.544921875, 9.102294921875, 9.65966796875, 10.217041015625, 10.7744140625, 11.331787109375, 11.88916015625, 12.446533203125, 13.00390625, 13.561279296875, 14.11865234375, 14.676025390625, 15.2333984375, 15.790771484375, 16.34814453125, 16.905517578125, 17.462890625, 18.020263671875, 18.57763671875, 19.135009765625, 19.6923828125, 20.249755859375, 20.80712890625, 21.364501953125, 21.921875]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 6.0, 17.0, 20.0, 43.0, 57.0, 120.0, 209.0, 216.0, 138.0, 86.0, 39.0, 32.0, 13.0, 4.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-316.38458251953125, -308.3214416503906, -300.2582702636719, -292.19512939453125, -284.1319580078125, -276.0688171386719, -268.00567626953125, -259.9425048828125, -251.87936401367188, -243.8162078857422, -235.7530517578125, -227.68991088867188, -219.6267547607422, -211.5635986328125, -203.50045776367188, -195.4373016357422, -187.3741455078125, -179.3109893798828, -171.24783325195312, -163.1846923828125, -155.1215362548828, -147.05838012695312, -138.9952392578125, -130.9320831298828, -122.86892700195312, -114.80577087402344, -106.74262237548828, -98.67947387695312, -90.61631774902344, -82.55316162109375, -74.4900131225586, -66.42686462402344, -58.36372375488281, -50.30057144165039, -42.23741912841797, -34.17426681518555, -26.111114501953125, -18.047962188720703, -9.984809875488281, -1.9216575622558594, 6.1414947509765625, 14.204647064208984, 22.267799377441406, 30.330951690673828, 38.39410400390625, 46.45725631713867, 54.520408630371094, 62.583560943603516, 70.64671325683594, 78.70986938476562, 86.77301788330078, 94.83616638183594, 102.89932250976562, 110.96247863769531, 119.02562713623047, 127.08877563476562, 135.1519317626953, 143.215087890625, 151.27822875976562, 159.3413848876953, 167.404541015625, 175.4676971435547, 183.53085327148438, 191.593994140625, 199.6571502685547]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 7.0, 7.0, 13.0, 10.0, 15.0, 21.0, 20.0, 35.0, 32.0, 36.0, 39.0, 37.0, 50.0, 63.0, 51.0, 62.0, 44.0, 52.0, 60.0, 58.0, 35.0, 52.0, 42.0, 44.0, 30.0, 22.0, 20.0, 10.0, 9.0, 10.0, 8.0, 7.0, 6.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.41670989990234, -61.7652702331543, -59.113826751708984, -56.46238708496094, -53.810943603515625, -51.15950393676758, -48.50806427001953, -45.85662078857422, -43.20518112182617, -40.553741455078125, -37.90229797363281, -35.250858306884766, -32.59941864013672, -29.947975158691406, -27.29653549194336, -24.64509391784668, -21.99365234375, -19.34221076965332, -16.69076919555664, -14.039329528808594, -11.387887954711914, -8.736446380615234, -6.085005760192871, -3.433565139770508, -0.7821235656738281, 1.8693175315856934, 4.520758628845215, 7.172199726104736, 9.823640823364258, 12.475082397460938, 15.1265230178833, 17.777963638305664, 20.429405212402344, 23.080846786499023, 25.732288360595703, 28.38372802734375, 31.03516960144043, 33.68661117553711, 36.338050842285156, 38.98949432373047, 41.640933990478516, 44.29237365722656, 46.943817138671875, 49.59525680541992, 52.24669647216797, 54.89813995361328, 57.54957962036133, 60.201019287109375, 62.85246276855469, 65.50390625, 68.15534210205078, 70.8067855834961, 73.4582290649414, 76.10966491699219, 78.7611083984375, 81.41255187988281, 84.06399536132812, 86.71543884277344, 89.36687469482422, 92.01831817626953, 94.66976165771484, 97.32119750976562, 99.97264099121094, 102.62408447265625, 105.27552032470703]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 7.0, 5.0, 8.0, 12.0, 18.0, 20.0, 25.0, 49.0, 67.0, 114.0, 247.0, 384.0, 831.0, 1915.0, 4795.0, 12682.0, 35827.0, 110398.0, 324619.0, 361004.0, 129366.0, 42233.0, 14370.0, 5396.0, 2165.0, 898.0, 468.0, 242.0, 141.0, 86.0, 57.0, 31.0, 24.0, 15.0, 9.0, 14.0, 9.0, 4.0, 4.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.3125, -78.6083984375, -75.904296875, -73.2001953125, -70.49609375, -67.7919921875, -65.087890625, -62.3837890625, -59.6796875, -56.9755859375, -54.271484375, -51.5673828125, -48.86328125, -46.1591796875, -43.455078125, -40.7509765625, -38.046875, -35.3427734375, -32.638671875, -29.9345703125, -27.23046875, -24.5263671875, -21.822265625, -19.1181640625, -16.4140625, -13.7099609375, -11.005859375, -8.3017578125, -5.59765625, -2.8935546875, -0.189453125, 2.5146484375, 5.21875, 7.9228515625, 10.626953125, 13.3310546875, 16.03515625, 18.7392578125, 21.443359375, 24.1474609375, 26.8515625, 29.5556640625, 32.259765625, 34.9638671875, 37.66796875, 40.3720703125, 43.076171875, 45.7802734375, 48.484375, 51.1884765625, 53.892578125, 56.5966796875, 59.30078125, 62.0048828125, 64.708984375, 67.4130859375, 70.1171875, 72.8212890625, 75.525390625, 78.2294921875, 80.93359375, 83.6376953125, 86.341796875, 89.0458984375, 91.75]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 5.0, 6.0, 2.0, 9.0, 6.0, 12.0, 9.0, 16.0, 18.0, 20.0, 22.0, 23.0, 22.0, 21.0, 25.0, 25.0, 43.0, 35.0, 48.0, 38.0, 44.0, 50.0, 46.0, 34.0, 47.0, 39.0, 30.0, 30.0, 34.0, 34.0, 34.0, 27.0, 26.0, 12.0, 17.0, 23.0, 19.0, 12.0, 7.0, 10.0, 6.0, 1.0, 4.0, 4.0, 2.0, 4.0, 5.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-3.48828125, -3.380340576171875, -3.27239990234375, -3.164459228515625, -3.0565185546875, -2.948577880859375, -2.84063720703125, -2.732696533203125, -2.624755859375, -2.516815185546875, -2.40887451171875, -2.300933837890625, -2.1929931640625, -2.085052490234375, -1.97711181640625, -1.869171142578125, -1.76123046875, -1.653289794921875, -1.54534912109375, -1.437408447265625, -1.3294677734375, -1.221527099609375, -1.11358642578125, -1.005645751953125, -0.897705078125, -0.789764404296875, -0.68182373046875, -0.573883056640625, -0.4659423828125, -0.358001708984375, -0.25006103515625, -0.142120361328125, -0.0341796875, 0.073760986328125, 0.18170166015625, 0.289642333984375, 0.3975830078125, 0.505523681640625, 0.61346435546875, 0.721405029296875, 0.829345703125, 0.937286376953125, 1.04522705078125, 1.153167724609375, 1.2611083984375, 1.369049072265625, 1.47698974609375, 1.584930419921875, 1.69287109375, 1.800811767578125, 1.90875244140625, 2.016693115234375, 2.1246337890625, 2.232574462890625, 2.34051513671875, 2.448455810546875, 2.556396484375, 2.664337158203125, 2.77227783203125, 2.880218505859375, 2.9881591796875, 3.096099853515625, 3.20404052734375, 3.311981201171875, 3.419921875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 3.0, 6.0, 7.0, 12.0, 13.0, 22.0, 21.0, 40.0, 47.0, 53.0, 82.0, 95.0, 155.0, 243.0, 393.0, 580.0, 1030.0, 1868.0, 3735.0, 8054.0, 19713.0, 56165.0, 175335.0, 388269.0, 257308.0, 84984.0, 28473.0, 11223.0, 4815.0, 2418.0, 1288.0, 770.0, 413.0, 279.0, 185.0, 137.0, 78.0, 51.0, 59.0, 25.0, 27.0, 24.0, 17.0, 7.0, 11.0, 4.0, 6.0, 4.0, 1.0, 3.0, 4.0, 3.0, 2.0, 1.0], "bins": [-83.25, -80.7783203125, -78.306640625, -75.8349609375, -73.36328125, -70.8916015625, -68.419921875, -65.9482421875, -63.4765625, -61.0048828125, -58.533203125, -56.0615234375, -53.58984375, -51.1181640625, -48.646484375, -46.1748046875, -43.703125, -41.2314453125, -38.759765625, -36.2880859375, -33.81640625, -31.3447265625, -28.873046875, -26.4013671875, -23.9296875, -21.4580078125, -18.986328125, -16.5146484375, -14.04296875, -11.5712890625, -9.099609375, -6.6279296875, -4.15625, -1.6845703125, 0.787109375, 3.2587890625, 5.73046875, 8.2021484375, 10.673828125, 13.1455078125, 15.6171875, 18.0888671875, 20.560546875, 23.0322265625, 25.50390625, 27.9755859375, 30.447265625, 32.9189453125, 35.390625, 37.8623046875, 40.333984375, 42.8056640625, 45.27734375, 47.7490234375, 50.220703125, 52.6923828125, 55.1640625, 57.6357421875, 60.107421875, 62.5791015625, 65.05078125, 67.5224609375, 69.994140625, 72.4658203125, 74.9375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 2.0, 5.0, 10.0, 8.0, 8.0, 10.0, 12.0, 14.0, 19.0, 22.0, 24.0, 36.0, 43.0, 32.0, 47.0, 38.0, 50.0, 43.0, 45.0, 46.0, 50.0, 51.0, 41.0, 43.0, 55.0, 39.0, 35.0, 28.0, 22.0, 28.0, 17.0, 16.0, 12.0, 11.0, 6.0, 5.0, 7.0, 4.0, 6.0, 4.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-26.203125, -25.39111328125, -24.5791015625, -23.76708984375, -22.955078125, -22.14306640625, -21.3310546875, -20.51904296875, -19.70703125, -18.89501953125, -18.0830078125, -17.27099609375, -16.458984375, -15.64697265625, -14.8349609375, -14.02294921875, -13.2109375, -12.39892578125, -11.5869140625, -10.77490234375, -9.962890625, -9.15087890625, -8.3388671875, -7.52685546875, -6.71484375, -5.90283203125, -5.0908203125, -4.27880859375, -3.466796875, -2.65478515625, -1.8427734375, -1.03076171875, -0.21875, 0.59326171875, 1.4052734375, 2.21728515625, 3.029296875, 3.84130859375, 4.6533203125, 5.46533203125, 6.27734375, 7.08935546875, 7.9013671875, 8.71337890625, 9.525390625, 10.33740234375, 11.1494140625, 11.96142578125, 12.7734375, 13.58544921875, 14.3974609375, 15.20947265625, 16.021484375, 16.83349609375, 17.6455078125, 18.45751953125, 19.26953125, 20.08154296875, 20.8935546875, 21.70556640625, 22.517578125, 23.32958984375, 24.1416015625, 24.95361328125, 25.765625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 3.0, 2.0, 5.0, 2.0, 5.0, 8.0, 7.0, 14.0, 10.0, 14.0, 28.0, 41.0, 48.0, 99.0, 124.0, 168.0, 287.0, 484.0, 743.0, 1253.0, 2360.0, 4509.0, 9927.0, 25080.0, 75969.0, 250952.0, 410753.0, 177121.0, 53602.0, 18700.0, 7724.0, 3742.0, 1963.0, 1100.0, 596.0, 407.0, 232.0, 159.0, 85.0, 84.0, 38.0, 27.0, 27.0, 18.0, 19.0, 2.0, 8.0, 3.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-47.375, -45.81396484375, -44.2529296875, -42.69189453125, -41.130859375, -39.56982421875, -38.0087890625, -36.44775390625, -34.88671875, -33.32568359375, -31.7646484375, -30.20361328125, -28.642578125, -27.08154296875, -25.5205078125, -23.95947265625, -22.3984375, -20.83740234375, -19.2763671875, -17.71533203125, -16.154296875, -14.59326171875, -13.0322265625, -11.47119140625, -9.91015625, -8.34912109375, -6.7880859375, -5.22705078125, -3.666015625, -2.10498046875, -0.5439453125, 1.01708984375, 2.578125, 4.13916015625, 5.7001953125, 7.26123046875, 8.822265625, 10.38330078125, 11.9443359375, 13.50537109375, 15.06640625, 16.62744140625, 18.1884765625, 19.74951171875, 21.310546875, 22.87158203125, 24.4326171875, 25.99365234375, 27.5546875, 29.11572265625, 30.6767578125, 32.23779296875, 33.798828125, 35.35986328125, 36.9208984375, 38.48193359375, 40.04296875, 41.60400390625, 43.1650390625, 44.72607421875, 46.287109375, 47.84814453125, 49.4091796875, 50.97021484375, 52.53125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 5.0, 2.0, 2.0, 4.0, 4.0, 5.0, 10.0, 13.0, 11.0, 21.0, 27.0, 23.0, 24.0, 23.0, 50.0, 58.0, 65.0, 80.0, 79.0, 70.0, 65.0, 80.0, 56.0, 42.0, 53.0, 27.0, 24.0, 14.0, 14.0, 13.0, 8.0, 7.0, 7.0, 4.0, 6.0, 2.0, 1.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004486083984375, -0.004313051700592041, -0.004140019416809082, -0.003966987133026123, -0.003793954849243164, -0.003620922565460205, -0.003447890281677246, -0.003274857997894287, -0.003101825714111328, -0.002928793430328369, -0.00275576114654541, -0.002582728862762451, -0.002409696578979492, -0.002236664295196533, -0.0020636320114135742, -0.0018905997276306152, -0.0017175674438476562, -0.0015445351600646973, -0.0013715028762817383, -0.0011984705924987793, -0.0010254383087158203, -0.0008524060249328613, -0.0006793737411499023, -0.0005063414573669434, -0.0003333091735839844, -0.0001602768898010254, 1.2755393981933594e-05, 0.00018578767776489258, 0.00035881996154785156, 0.0005318522453308105, 0.0007048845291137695, 0.0008779168128967285, 0.0010509490966796875, 0.0012239813804626465, 0.0013970136642456055, 0.0015700459480285645, 0.0017430782318115234, 0.0019161105155944824, 0.0020891427993774414, 0.0022621750831604004, 0.0024352073669433594, 0.0026082396507263184, 0.0027812719345092773, 0.0029543042182922363, 0.0031273365020751953, 0.0033003687858581543, 0.0034734010696411133, 0.0036464333534240723, 0.0038194656372070312, 0.00399249792098999, 0.004165530204772949, 0.004338562488555908, 0.004511594772338867, 0.004684627056121826, 0.004857659339904785, 0.005030691623687744, 0.005203723907470703, 0.005376756191253662, 0.005549788475036621, 0.00572282075881958, 0.005895853042602539, 0.006068885326385498, 0.006241917610168457, 0.006414949893951416, 0.006587982177734375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 4.0, 7.0, 7.0, 7.0, 15.0, 14.0, 25.0, 40.0, 75.0, 88.0, 158.0, 249.0, 427.0, 744.0, 1331.0, 2837.0, 6596.0, 19086.0, 74046.0, 357691.0, 445870.0, 99796.0, 24600.0, 8070.0, 3276.0, 1473.0, 794.0, 444.0, 271.0, 172.0, 107.0, 67.0, 51.0, 31.0, 24.0, 13.0, 9.0, 15.0, 5.0, 8.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-71.9375, -69.6962890625, -67.455078125, -65.2138671875, -62.97265625, -60.7314453125, -58.490234375, -56.2490234375, -54.0078125, -51.7666015625, -49.525390625, -47.2841796875, -45.04296875, -42.8017578125, -40.560546875, -38.3193359375, -36.078125, -33.8369140625, -31.595703125, -29.3544921875, -27.11328125, -24.8720703125, -22.630859375, -20.3896484375, -18.1484375, -15.9072265625, -13.666015625, -11.4248046875, -9.18359375, -6.9423828125, -4.701171875, -2.4599609375, -0.21875, 2.0224609375, 4.263671875, 6.5048828125, 8.74609375, 10.9873046875, 13.228515625, 15.4697265625, 17.7109375, 19.9521484375, 22.193359375, 24.4345703125, 26.67578125, 28.9169921875, 31.158203125, 33.3994140625, 35.640625, 37.8818359375, 40.123046875, 42.3642578125, 44.60546875, 46.8466796875, 49.087890625, 51.3291015625, 53.5703125, 55.8115234375, 58.052734375, 60.2939453125, 62.53515625, 64.7763671875, 67.017578125, 69.2587890625, 71.5]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 3.0, 7.0, 7.0, 12.0, 16.0, 19.0, 16.0, 26.0, 38.0, 38.0, 42.0, 62.0, 77.0, 77.0, 62.0, 70.0, 65.0, 65.0, 48.0, 37.0, 37.0, 43.0, 30.0, 22.0, 16.0, 15.0, 13.0, 8.0, 9.0, 4.0, 5.0, 7.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.328125, -23.494873046875, -22.66162109375, -21.828369140625, -20.9951171875, -20.161865234375, -19.32861328125, -18.495361328125, -17.662109375, -16.828857421875, -15.99560546875, -15.162353515625, -14.3291015625, -13.495849609375, -12.66259765625, -11.829345703125, -10.99609375, -10.162841796875, -9.32958984375, -8.496337890625, -7.6630859375, -6.829833984375, -5.99658203125, -5.163330078125, -4.330078125, -3.496826171875, -2.66357421875, -1.830322265625, -0.9970703125, -0.163818359375, 0.66943359375, 1.502685546875, 2.3359375, 3.169189453125, 4.00244140625, 4.835693359375, 5.6689453125, 6.502197265625, 7.33544921875, 8.168701171875, 9.001953125, 9.835205078125, 10.66845703125, 11.501708984375, 12.3349609375, 13.168212890625, 14.00146484375, 14.834716796875, 15.66796875, 16.501220703125, 17.33447265625, 18.167724609375, 19.0009765625, 19.834228515625, 20.66748046875, 21.500732421875, 22.333984375, 23.167236328125, 24.00048828125, 24.833740234375, 25.6669921875, 26.500244140625, 27.33349609375, 28.166748046875, 29.0]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 10.0, 16.0, 32.0, 105.0, 214.0, 301.0, 193.0, 79.0, 33.0, 13.0, 4.0, 2.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1470.41015625, -1432.190673828125, -1393.97119140625, -1355.751708984375, -1317.5322265625, -1279.312744140625, -1241.09326171875, -1202.873779296875, -1164.654296875, -1126.434814453125, -1088.21533203125, -1049.995849609375, -1011.7763671875, -973.556884765625, -935.33740234375, -897.117919921875, -858.8983764648438, -820.6788940429688, -782.4594116210938, -744.2399291992188, -706.0204467773438, -667.8009643554688, -629.5814208984375, -591.3619384765625, -553.1424560546875, -514.9229736328125, -476.7034912109375, -438.4840087890625, -400.2645263671875, -362.0450439453125, -323.8255310058594, -285.6060485839844, -247.38665771484375, -209.16717529296875, -170.94769287109375, -132.7281951904297, -94.50871276855469, -56.28923034667969, -18.069732666015625, 20.149749755859375, 58.369232177734375, 96.58871459960938, 134.80819702148438, 173.02769470214844, 211.24717712402344, 249.46665954589844, 287.6861572265625, 325.9056396484375, 364.1251220703125, 402.3446044921875, 440.5640869140625, 478.7835693359375, 517.0030517578125, 555.2225341796875, 593.4420166015625, 631.6614990234375, 669.8809814453125, 708.1004638671875, 746.3199462890625, 784.5394287109375, 822.7589111328125, 860.9783935546875, 899.1978759765625, 937.4173583984375, 975.6369018554688]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 3.0, 5.0, 6.0, 4.0, 10.0, 7.0, 18.0, 20.0, 26.0, 25.0, 25.0, 32.0, 31.0, 42.0, 52.0, 59.0, 62.0, 53.0, 48.0, 45.0, 71.0, 44.0, 40.0, 44.0, 30.0, 23.0, 24.0, 29.0, 29.0, 23.0, 23.0, 12.0, 12.0, 7.0, 4.0, 3.0, 6.0, 6.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-203.62213134765625, -196.8587646484375, -190.0954132080078, -183.33204650878906, -176.5686798095703, -169.80532836914062, -163.04196166992188, -156.27859497070312, -149.51522827148438, -142.75186157226562, -135.98851013183594, -129.2251434326172, -122.46177673339844, -115.69841766357422, -108.93505859375, -102.17169189453125, -95.40834045410156, -88.64498138427734, -81.8816146850586, -75.11825561523438, -68.35488891601562, -61.591529846191406, -54.82817077636719, -48.0648078918457, -41.30144500732422, -34.538082122802734, -27.774721145629883, -21.01136016845703, -14.247997283935547, -7.4846343994140625, -0.7212753295898438, 6.042087554931641, 12.805450439453125, 19.56881332397461, 26.33217430114746, 33.09553527832031, 39.8588981628418, 46.62226104736328, 53.3856201171875, 60.148983001708984, 66.91234588623047, 73.67570495605469, 80.43907165527344, 87.20243072509766, 93.96578979492188, 100.72915649414062, 107.49251556396484, 114.25587463378906, 121.01924133300781, 127.78260040283203, 134.54595947265625, 141.309326171875, 148.07269287109375, 154.8360595703125, 161.5994110107422, 168.36277770996094, 175.12612915039062, 181.88949584960938, 188.65284729003906, 195.4162139892578, 202.17958068847656, 208.94293212890625, 215.706298828125, 222.46966552734375, 229.2330322265625]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 6.0, 6.0, 10.0, 15.0, 28.0, 43.0, 60.0, 124.0, 235.0, 485.0, 1254.0, 4032.0, 17650.0, 118734.0, 3780884.0, 234246.0, 27670.0, 5799.0, 1662.0, 650.0, 291.0, 136.0, 83.0, 60.0, 37.0, 27.0, 20.0, 13.0, 7.0, 6.0, 4.0, 4.0, 1.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-299.0, -290.3671875, -281.734375, -273.1015625, -264.46875, -255.8359375, -247.203125, -238.5703125, -229.9375, -221.3046875, -212.671875, -204.0390625, -195.40625, -186.7734375, -178.140625, -169.5078125, -160.875, -152.2421875, -143.609375, -134.9765625, -126.34375, -117.7109375, -109.078125, -100.4453125, -91.8125, -83.1796875, -74.546875, -65.9140625, -57.28125, -48.6484375, -40.015625, -31.3828125, -22.75, -14.1171875, -5.484375, 3.1484375, 11.78125, 20.4140625, 29.046875, 37.6796875, 46.3125, 54.9453125, 63.578125, 72.2109375, 80.84375, 89.4765625, 98.109375, 106.7421875, 115.375, 124.0078125, 132.640625, 141.2734375, 149.90625, 158.5390625, 167.171875, 175.8046875, 184.4375, 193.0703125, 201.703125, 210.3359375, 218.96875, 227.6015625, 236.234375, 244.8671875, 253.5]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 1.0, 2.0, 4.0, 8.0, 11.0, 17.0, 20.0, 20.0, 41.0, 32.0, 43.0, 48.0, 59.0, 63.0, 69.0, 68.0, 84.0, 67.0, 56.0, 56.0, 65.0, 34.0, 30.0, 34.0, 20.0, 16.0, 5.0, 11.0, 8.0, 6.0, 6.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.359375, -8.118896484375, -7.87841796875, -7.637939453125, -7.3974609375, -7.156982421875, -6.91650390625, -6.676025390625, -6.435546875, -6.195068359375, -5.95458984375, -5.714111328125, -5.4736328125, -5.233154296875, -4.99267578125, -4.752197265625, -4.51171875, -4.271240234375, -4.03076171875, -3.790283203125, -3.5498046875, -3.309326171875, -3.06884765625, -2.828369140625, -2.587890625, -2.347412109375, -2.10693359375, -1.866455078125, -1.6259765625, -1.385498046875, -1.14501953125, -0.904541015625, -0.6640625, -0.423583984375, -0.18310546875, 0.057373046875, 0.2978515625, 0.538330078125, 0.77880859375, 1.019287109375, 1.259765625, 1.500244140625, 1.74072265625, 1.981201171875, 2.2216796875, 2.462158203125, 2.70263671875, 2.943115234375, 3.18359375, 3.424072265625, 3.66455078125, 3.905029296875, 4.1455078125, 4.385986328125, 4.62646484375, 4.866943359375, 5.107421875, 5.347900390625, 5.58837890625, 5.828857421875, 6.0693359375, 6.309814453125, 6.55029296875, 6.790771484375, 7.03125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 3.0, 6.0, 4.0, 13.0, 11.0, 23.0, 34.0, 41.0, 43.0, 53.0, 63.0, 141.0, 1038.0, 46760.0, 4092839.0, 51779.0, 1032.0, 140.0, 59.0, 50.0, 38.0, 30.0, 19.0, 20.0, 21.0, 7.0, 4.0, 4.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-646.0, -625.5, -605.0, -584.5, -564.0, -543.5, -523.0, -502.5, -482.0, -461.5, -441.0, -420.5, -400.0, -379.5, -359.0, -338.5, -318.0, -297.5, -277.0, -256.5, -236.0, -215.5, -195.0, -174.5, -154.0, -133.5, -113.0, -92.5, -72.0, -51.5, -31.0, -10.5, 10.0, 30.5, 51.0, 71.5, 92.0, 112.5, 133.0, 153.5, 174.0, 194.5, 215.0, 235.5, 256.0, 276.5, 297.0, 317.5, 338.0, 358.5, 379.0, 399.5, 420.0, 440.5, 461.0, 481.5, 502.0, 522.5, 543.0, 563.5, 584.0, 604.5, 625.0, 645.5, 666.0]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 7.0, 6.0, 11.0, 14.0, 19.0, 53.0, 80.0, 133.0, 202.0, 442.0, 2026.0, 544.0, 251.0, 121.0, 77.0, 47.0, 31.0, 7.0, 12.0, 4.0, 4.0, 0.0, 0.0, 2.0], "bins": [-68.1875, -66.8408203125, -65.494140625, -64.1474609375, -62.80078125, -61.4541015625, -60.107421875, -58.7607421875, -57.4140625, -56.0673828125, -54.720703125, -53.3740234375, -52.02734375, -50.6806640625, -49.333984375, -47.9873046875, -46.640625, -45.2939453125, -43.947265625, -42.6005859375, -41.25390625, -39.9072265625, -38.560546875, -37.2138671875, -35.8671875, -34.5205078125, -33.173828125, -31.8271484375, -30.48046875, -29.1337890625, -27.787109375, -26.4404296875, -25.09375, -23.7470703125, -22.400390625, -21.0537109375, -19.70703125, -18.3603515625, -17.013671875, -15.6669921875, -14.3203125, -12.9736328125, -11.626953125, -10.2802734375, -8.93359375, -7.5869140625, -6.240234375, -4.8935546875, -3.546875, -2.2001953125, -0.853515625, 0.4931640625, 1.83984375, 3.1865234375, 4.533203125, 5.8798828125, 7.2265625, 8.5732421875, 9.919921875, 11.2666015625, 12.61328125, 13.9599609375, 15.306640625, 16.6533203125, 18.0]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 5.0, 2.0, 8.0, 14.0, 16.0, 30.0, 36.0, 59.0, 128.0, 166.0, 155.0, 135.0, 113.0, 56.0, 35.0, 20.0, 15.0, 3.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-312.4701232910156, -302.81158447265625, -293.1530456542969, -283.4945068359375, -273.83599853515625, -264.1774597167969, -254.5189208984375, -244.86038208007812, -235.20184326171875, -225.54330444335938, -215.884765625, -206.2262420654297, -196.5677032470703, -186.90916442871094, -177.25064086914062, -167.59210205078125, -157.93356323242188, -148.2750244140625, -138.61648559570312, -128.9579620361328, -119.29942321777344, -109.64088439941406, -99.98235321044922, -90.32382202148438, -80.665283203125, -71.00674438476562, -61.34821319580078, -51.68967819213867, -42.03114318847656, -32.37260818481445, -22.714073181152344, -13.0555419921875, -3.39697265625, 6.261562347412109, 15.920097351074219, 25.578632354736328, 35.23716735839844, 44.89570236206055, 54.554237365722656, 64.2127685546875, 73.87130737304688, 83.52984619140625, 93.1883773803711, 102.84690856933594, 112.50544738769531, 122.16398620605469, 131.822509765625, 141.48104858398438, 151.13958740234375, 160.79812622070312, 170.4566650390625, 180.1151885986328, 189.7737274169922, 199.43226623535156, 209.09078979492188, 218.74932861328125, 228.40786743164062, 238.06640625, 247.72494506835938, 257.38348388671875, 267.0419921875, 276.7005310058594, 286.35906982421875, 296.0176086425781, 305.6761474609375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 3.0, 3.0, 10.0, 8.0, 9.0, 18.0, 19.0, 21.0, 15.0, 19.0, 28.0, 32.0, 32.0, 38.0, 26.0, 39.0, 49.0, 41.0, 39.0, 36.0, 56.0, 41.0, 51.0, 44.0, 38.0, 37.0, 36.0, 34.0, 23.0, 19.0, 31.0, 19.0, 19.0, 12.0, 8.0, 9.0, 11.0, 7.0, 8.0, 8.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-93.92109680175781, -91.05319213867188, -88.1852798461914, -85.31737518310547, -82.44947052001953, -79.58155822753906, -76.71365356445312, -73.84574890136719, -70.97783660888672, -68.10993194580078, -65.24201965332031, -62.374114990234375, -59.50620651245117, -56.63829803466797, -53.77039337158203, -50.90248489379883, -48.03458023071289, -45.16667175292969, -42.29876708984375, -39.43085861206055, -36.562950134277344, -33.695045471191406, -30.827136993408203, -27.959228515625, -25.09132194519043, -22.22341537475586, -19.355506896972656, -16.487600326538086, -13.6196928024292, -10.751785278320312, -7.883878707885742, -5.015970230102539, -2.1480636596679688, 0.7198436260223389, 3.5877509117126465, 6.455657958984375, 9.323565483093262, 12.191473007202148, 15.059379577636719, 17.927288055419922, 20.795194625854492, 23.663101196289062, 26.531009674072266, 29.398916244506836, 32.266822814941406, 35.13473129272461, 38.00263977050781, 40.87054443359375, 43.73845291137695, 46.606361389160156, 49.474266052246094, 52.3421745300293, 55.2100830078125, 58.07798767089844, 60.94589614868164, 63.813804626464844, 66.68170928955078, 69.54961395263672, 72.41752624511719, 75.28543090820312, 78.15333557128906, 81.02124786376953, 83.88915252685547, 86.75706481933594, 89.62496948242188]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 3.0, 3.0, 1.0, 7.0, 4.0, 12.0, 8.0, 13.0, 10.0, 21.0, 31.0, 32.0, 35.0, 51.0, 43.0, 59.0, 117.0, 169.0, 208.0, 393.0, 562.0, 1005.0, 2185.0, 5319.0, 15819.0, 51559.0, 172017.0, 395784.0, 272897.0, 88400.0, 26555.0, 8553.0, 3206.0, 1394.0, 705.0, 402.0, 269.0, 217.0, 118.0, 101.0, 65.0, 32.0, 38.0, 14.0, 27.0, 16.0, 19.0, 14.0, 10.0, 14.0, 2.0, 6.0, 8.0, 6.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0], "bins": [-93.0, -89.97265625, -86.9453125, -83.91796875, -80.890625, -77.86328125, -74.8359375, -71.80859375, -68.78125, -65.75390625, -62.7265625, -59.69921875, -56.671875, -53.64453125, -50.6171875, -47.58984375, -44.5625, -41.53515625, -38.5078125, -35.48046875, -32.453125, -29.42578125, -26.3984375, -23.37109375, -20.34375, -17.31640625, -14.2890625, -11.26171875, -8.234375, -5.20703125, -2.1796875, 0.84765625, 3.875, 6.90234375, 9.9296875, 12.95703125, 15.984375, 19.01171875, 22.0390625, 25.06640625, 28.09375, 31.12109375, 34.1484375, 37.17578125, 40.203125, 43.23046875, 46.2578125, 49.28515625, 52.3125, 55.33984375, 58.3671875, 61.39453125, 64.421875, 67.44921875, 70.4765625, 73.50390625, 76.53125, 79.55859375, 82.5859375, 85.61328125, 88.640625, 91.66796875, 94.6953125, 97.72265625, 100.75]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 4.0, 7.0, 10.0, 22.0, 15.0, 20.0, 40.0, 40.0, 53.0, 62.0, 73.0, 81.0, 81.0, 84.0, 57.0, 62.0, 61.0, 51.0, 54.0, 38.0, 24.0, 25.0, 15.0, 9.0, 8.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.4453125, -10.16302490234375, -9.8807373046875, -9.59844970703125, -9.316162109375, -9.03387451171875, -8.7515869140625, -8.46929931640625, -8.18701171875, -7.90472412109375, -7.6224365234375, -7.34014892578125, -7.057861328125, -6.77557373046875, -6.4932861328125, -6.21099853515625, -5.9287109375, -5.64642333984375, -5.3641357421875, -5.08184814453125, -4.799560546875, -4.51727294921875, -4.2349853515625, -3.95269775390625, -3.67041015625, -3.38812255859375, -3.1058349609375, -2.82354736328125, -2.541259765625, -2.25897216796875, -1.9766845703125, -1.69439697265625, -1.412109375, -1.12982177734375, -0.8475341796875, -0.56524658203125, -0.282958984375, -0.00067138671875, 0.2816162109375, 0.56390380859375, 0.84619140625, 1.12847900390625, 1.4107666015625, 1.69305419921875, 1.975341796875, 2.25762939453125, 2.5399169921875, 2.82220458984375, 3.1044921875, 3.38677978515625, 3.6690673828125, 3.95135498046875, 4.233642578125, 4.51593017578125, 4.7982177734375, 5.08050537109375, 5.36279296875, 5.64508056640625, 5.9273681640625, 6.20965576171875, 6.491943359375, 6.77423095703125, 7.0565185546875, 7.33880615234375, 7.62109375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 0.0, 4.0, 2.0, 9.0, 12.0, 14.0, 10.0, 15.0, 24.0, 44.0, 51.0, 66.0, 94.0, 121.0, 184.0, 280.0, 394.0, 706.0, 1229.0, 2109.0, 4405.0, 10240.0, 28022.0, 89022.0, 280058.0, 395228.0, 158831.0, 47895.0, 15910.0, 6498.0, 3015.0, 1549.0, 884.0, 531.0, 327.0, 219.0, 158.0, 116.0, 75.0, 45.0, 43.0, 29.0, 22.0, 19.0, 14.0, 13.0, 8.0, 10.0, 3.0, 7.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-81.8125, -79.0146484375, -76.216796875, -73.4189453125, -70.62109375, -67.8232421875, -65.025390625, -62.2275390625, -59.4296875, -56.6318359375, -53.833984375, -51.0361328125, -48.23828125, -45.4404296875, -42.642578125, -39.8447265625, -37.046875, -34.2490234375, -31.451171875, -28.6533203125, -25.85546875, -23.0576171875, -20.259765625, -17.4619140625, -14.6640625, -11.8662109375, -9.068359375, -6.2705078125, -3.47265625, -0.6748046875, 2.123046875, 4.9208984375, 7.71875, 10.5166015625, 13.314453125, 16.1123046875, 18.91015625, 21.7080078125, 24.505859375, 27.3037109375, 30.1015625, 32.8994140625, 35.697265625, 38.4951171875, 41.29296875, 44.0908203125, 46.888671875, 49.6865234375, 52.484375, 55.2822265625, 58.080078125, 60.8779296875, 63.67578125, 66.4736328125, 69.271484375, 72.0693359375, 74.8671875, 77.6650390625, 80.462890625, 83.2607421875, 86.05859375, 88.8564453125, 91.654296875, 94.4521484375, 97.25]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 3.0, 3.0, 4.0, 8.0, 4.0, 9.0, 18.0, 15.0, 20.0, 21.0, 29.0, 40.0, 37.0, 42.0, 48.0, 49.0, 46.0, 46.0, 44.0, 53.0, 55.0, 58.0, 56.0, 50.0, 44.0, 41.0, 22.0, 30.0, 20.0, 15.0, 12.0, 14.0, 18.0, 9.0, 7.0, 11.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.3125, -43.98583984375, -42.6591796875, -41.33251953125, -40.005859375, -38.67919921875, -37.3525390625, -36.02587890625, -34.69921875, -33.37255859375, -32.0458984375, -30.71923828125, -29.392578125, -28.06591796875, -26.7392578125, -25.41259765625, -24.0859375, -22.75927734375, -21.4326171875, -20.10595703125, -18.779296875, -17.45263671875, -16.1259765625, -14.79931640625, -13.47265625, -12.14599609375, -10.8193359375, -9.49267578125, -8.166015625, -6.83935546875, -5.5126953125, -4.18603515625, -2.859375, -1.53271484375, -0.2060546875, 1.12060546875, 2.447265625, 3.77392578125, 5.1005859375, 6.42724609375, 7.75390625, 9.08056640625, 10.4072265625, 11.73388671875, 13.060546875, 14.38720703125, 15.7138671875, 17.04052734375, 18.3671875, 19.69384765625, 21.0205078125, 22.34716796875, 23.673828125, 25.00048828125, 26.3271484375, 27.65380859375, 28.98046875, 30.30712890625, 31.6337890625, 32.96044921875, 34.287109375, 35.61376953125, 36.9404296875, 38.26708984375, 39.59375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 6.0, 5.0, 11.0, 9.0, 10.0, 23.0, 27.0, 65.0, 60.0, 107.0, 174.0, 334.0, 505.0, 1033.0, 2116.0, 4920.0, 13181.0, 47280.0, 246643.0, 542931.0, 142172.0, 30163.0, 9360.0, 3635.0, 1735.0, 837.0, 440.0, 289.0, 169.0, 113.0, 71.0, 41.0, 33.0, 12.0, 11.0, 11.0, 7.0, 7.0, 2.0, 4.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.5, -59.330078125, -57.16015625, -54.990234375, -52.8203125, -50.650390625, -48.48046875, -46.310546875, -44.140625, -41.970703125, -39.80078125, -37.630859375, -35.4609375, -33.291015625, -31.12109375, -28.951171875, -26.78125, -24.611328125, -22.44140625, -20.271484375, -18.1015625, -15.931640625, -13.76171875, -11.591796875, -9.421875, -7.251953125, -5.08203125, -2.912109375, -0.7421875, 1.427734375, 3.59765625, 5.767578125, 7.9375, 10.107421875, 12.27734375, 14.447265625, 16.6171875, 18.787109375, 20.95703125, 23.126953125, 25.296875, 27.466796875, 29.63671875, 31.806640625, 33.9765625, 36.146484375, 38.31640625, 40.486328125, 42.65625, 44.826171875, 46.99609375, 49.166015625, 51.3359375, 53.505859375, 55.67578125, 57.845703125, 60.015625, 62.185546875, 64.35546875, 66.525390625, 68.6953125, 70.865234375, 73.03515625, 75.205078125, 77.375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 1.0, 5.0, 3.0, 2.0, 12.0, 6.0, 11.0, 24.0, 18.0, 30.0, 31.0, 46.0, 45.0, 68.0, 91.0, 82.0, 88.0, 94.0, 79.0, 61.0, 46.0, 39.0, 30.0, 19.0, 19.0, 13.0, 7.0, 5.0, 9.0, 3.0, 4.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.007282257080078125, -0.007073700428009033, -0.006865143775939941, -0.00665658712387085, -0.006448030471801758, -0.006239473819732666, -0.006030917167663574, -0.005822360515594482, -0.005613803863525391, -0.005405247211456299, -0.005196690559387207, -0.004988133907318115, -0.0047795772552490234, -0.004571020603179932, -0.00436246395111084, -0.004153907299041748, -0.003945350646972656, -0.0037367939949035645, -0.0035282373428344727, -0.003319680690765381, -0.003111124038696289, -0.0029025673866271973, -0.0026940107345581055, -0.0024854540824890137, -0.002276897430419922, -0.00206834077835083, -0.0018597841262817383, -0.0016512274742126465, -0.0014426708221435547, -0.0012341141700744629, -0.001025557518005371, -0.0008170008659362793, -0.0006084442138671875, -0.0003998875617980957, -0.0001913309097290039, 1.722574234008789e-05, 0.0002257823944091797, 0.0004343390464782715, 0.0006428956985473633, 0.0008514523506164551, 0.0010600090026855469, 0.0012685656547546387, 0.0014771223068237305, 0.0016856789588928223, 0.001894235610961914, 0.002102792263031006, 0.0023113489151000977, 0.0025199055671691895, 0.0027284622192382812, 0.002937018871307373, 0.003145575523376465, 0.0033541321754455566, 0.0035626888275146484, 0.0037712454795837402, 0.003979802131652832, 0.004188358783721924, 0.004396915435791016, 0.004605472087860107, 0.004814028739929199, 0.005022585391998291, 0.005231142044067383, 0.005439698696136475, 0.005648255348205566, 0.005856812000274658, 0.00606536865234375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 2.0, 4.0, 4.0, 5.0, 5.0, 12.0, 15.0, 13.0, 30.0, 33.0, 58.0, 59.0, 108.0, 141.0, 263.0, 464.0, 823.0, 1778.0, 3951.0, 10939.0, 45178.0, 407615.0, 500281.0, 55592.0, 12545.0, 4438.0, 1928.0, 905.0, 508.0, 284.0, 188.0, 112.0, 92.0, 55.0, 35.0, 20.0, 12.0, 12.0, 10.0, 8.0, 7.0, 8.0, 6.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-100.625, -97.384765625, -94.14453125, -90.904296875, -87.6640625, -84.423828125, -81.18359375, -77.943359375, -74.703125, -71.462890625, -68.22265625, -64.982421875, -61.7421875, -58.501953125, -55.26171875, -52.021484375, -48.78125, -45.541015625, -42.30078125, -39.060546875, -35.8203125, -32.580078125, -29.33984375, -26.099609375, -22.859375, -19.619140625, -16.37890625, -13.138671875, -9.8984375, -6.658203125, -3.41796875, -0.177734375, 3.0625, 6.302734375, 9.54296875, 12.783203125, 16.0234375, 19.263671875, 22.50390625, 25.744140625, 28.984375, 32.224609375, 35.46484375, 38.705078125, 41.9453125, 45.185546875, 48.42578125, 51.666015625, 54.90625, 58.146484375, 61.38671875, 64.626953125, 67.8671875, 71.107421875, 74.34765625, 77.587890625, 80.828125, 84.068359375, 87.30859375, 90.548828125, 93.7890625, 97.029296875, 100.26953125, 103.509765625, 106.75]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 6.0, 4.0, 7.0, 5.0, 7.0, 8.0, 15.0, 16.0, 26.0, 29.0, 40.0, 49.0, 76.0, 81.0, 75.0, 88.0, 89.0, 65.0, 66.0, 49.0, 40.0, 29.0, 29.0, 26.0, 9.0, 11.0, 6.0, 6.0, 13.0, 3.0, 3.0, 4.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-32.0625, -30.890625, -29.71875, -28.546875, -27.375, -26.203125, -25.03125, -23.859375, -22.6875, -21.515625, -20.34375, -19.171875, -18.0, -16.828125, -15.65625, -14.484375, -13.3125, -12.140625, -10.96875, -9.796875, -8.625, -7.453125, -6.28125, -5.109375, -3.9375, -2.765625, -1.59375, -0.421875, 0.75, 1.921875, 3.09375, 4.265625, 5.4375, 6.609375, 7.78125, 8.953125, 10.125, 11.296875, 12.46875, 13.640625, 14.8125, 15.984375, 17.15625, 18.328125, 19.5, 20.671875, 21.84375, 23.015625, 24.1875, 25.359375, 26.53125, 27.703125, 28.875, 30.046875, 31.21875, 32.390625, 33.5625, 34.734375, 35.90625, 37.078125, 38.25, 39.421875, 40.59375, 41.765625, 42.9375]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0, 4.0, 5.0, 8.0, 18.0, 31.0, 58.0, 93.0, 150.0, 174.0, 159.0, 111.0, 70.0, 40.0, 30.0, 21.0, 11.0, 2.0, 4.0, 6.0, 4.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-744.619873046875, -722.4520263671875, -700.2841796875, -678.1163330078125, -655.9485473632812, -633.7807006835938, -611.6128540039062, -589.4450073242188, -567.2772216796875, -545.109375, -522.9415283203125, -500.7737121582031, -478.60589599609375, -456.43804931640625, -434.27020263671875, -412.10235595703125, -389.93450927734375, -367.76666259765625, -345.5988464355469, -323.4309997558594, -301.26318359375, -279.0953369140625, -256.927490234375, -234.75965881347656, -212.59182739257812, -190.4239959716797, -168.25616455078125, -146.08831787109375, -123.92048645019531, -101.75265502929688, -79.58480834960938, -57.41697692871094, -35.2491455078125, -13.081310272216797, 9.086524963378906, 31.254364013671875, 53.42219543457031, 75.59002685546875, 97.75787353515625, 119.92570495605469, 142.09353637695312, 164.26136779785156, 186.42919921875, 208.5970458984375, 230.76487731933594, 252.93270874023438, 275.1005554199219, 297.26837158203125, 319.43621826171875, 341.60406494140625, 363.7718811035156, 385.9397277832031, 408.1075439453125, 430.275390625, 452.4432373046875, 474.611083984375, 496.7789001464844, 518.9467163085938, 541.1145629882812, 563.2824096679688, 585.4502563476562, 607.6180419921875, 629.785888671875, 651.9537353515625, 674.12158203125]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 6.0, 1.0, 8.0, 6.0, 6.0, 5.0, 15.0, 13.0, 14.0, 16.0, 11.0, 23.0, 28.0, 27.0, 32.0, 28.0, 33.0, 40.0, 36.0, 50.0, 27.0, 42.0, 51.0, 41.0, 60.0, 41.0, 34.0, 32.0, 32.0, 34.0, 36.0, 21.0, 22.0, 19.0, 18.0, 23.0, 14.0, 10.0, 11.0, 7.0, 5.0, 3.0, 6.0, 10.0, 5.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0], "bins": [-232.5243682861328, -225.1221466064453, -217.71990966796875, -210.31768798828125, -202.91546630859375, -195.5132293701172, -188.1110076904297, -180.70877075195312, -173.30654907226562, -165.90432739257812, -158.50209045410156, -151.09986877441406, -143.69764709472656, -136.29541015625, -128.8931884765625, -121.49095916748047, -114.08873748779297, -106.68650817871094, -99.28428649902344, -91.8820571899414, -84.47982788085938, -77.07760620117188, -69.67537689208984, -62.27314758300781, -54.87092208862305, -47.46869659423828, -40.06646728515625, -32.664241790771484, -25.262014389038086, -17.859786987304688, -10.457561492919922, -3.0553321838378906, 4.346893310546875, 11.749120712280273, 19.151348114013672, 26.553573608398438, 33.95580291748047, 41.358028411865234, 48.76025390625, 56.16248321533203, 63.5647087097168, 70.96693420410156, 78.3691635131836, 85.77139282226562, 93.17361450195312, 100.57584381103516, 107.97807312011719, 115.38029479980469, 122.78252410888672, 130.18475341796875, 137.58697509765625, 144.98919677734375, 152.3914337158203, 159.7936553955078, 167.19589233398438, 174.59811401367188, 182.00033569335938, 189.40255737304688, 196.80479431152344, 204.20701599121094, 211.60923767089844, 219.011474609375, 226.4136962890625, 233.81591796875, 241.21815490722656]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 5.0, 7.0, 9.0, 13.0, 20.0, 21.0, 33.0, 40.0, 66.0, 74.0, 130.0, 214.0, 391.0, 745.0, 1764.0, 5203.0, 18679.0, 92572.0, 3562875.0, 444953.0, 48180.0, 11725.0, 3655.0, 1389.0, 637.0, 318.0, 193.0, 120.0, 84.0, 65.0, 25.0, 21.0, 20.0, 11.0, 8.0, 6.0, 6.0, 4.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-151.875, -146.4140625, -140.953125, -135.4921875, -130.03125, -124.5703125, -119.109375, -113.6484375, -108.1875, -102.7265625, -97.265625, -91.8046875, -86.34375, -80.8828125, -75.421875, -69.9609375, -64.5, -59.0390625, -53.578125, -48.1171875, -42.65625, -37.1953125, -31.734375, -26.2734375, -20.8125, -15.3515625, -9.890625, -4.4296875, 1.03125, 6.4921875, 11.953125, 17.4140625, 22.875, 28.3359375, 33.796875, 39.2578125, 44.71875, 50.1796875, 55.640625, 61.1015625, 66.5625, 72.0234375, 77.484375, 82.9453125, 88.40625, 93.8671875, 99.328125, 104.7890625, 110.25, 115.7109375, 121.171875, 126.6328125, 132.09375, 137.5546875, 143.015625, 148.4765625, 153.9375, 159.3984375, 164.859375, 170.3203125, 175.78125, 181.2421875, 186.703125, 192.1640625, 197.625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 6.0, 6.0, 11.0, 8.0, 22.0, 19.0, 28.0, 25.0, 29.0, 31.0, 47.0, 58.0, 63.0, 56.0, 63.0, 49.0, 59.0, 59.0, 52.0, 39.0, 44.0, 39.0, 41.0, 40.0, 18.0, 17.0, 21.0, 12.0, 14.0, 10.0, 8.0, 3.0, 1.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.51953125, -6.25701904296875, -5.9945068359375, -5.73199462890625, -5.469482421875, -5.20697021484375, -4.9444580078125, -4.68194580078125, -4.41943359375, -4.15692138671875, -3.8944091796875, -3.63189697265625, -3.369384765625, -3.10687255859375, -2.8443603515625, -2.58184814453125, -2.3193359375, -2.05682373046875, -1.7943115234375, -1.53179931640625, -1.269287109375, -1.00677490234375, -0.7442626953125, -0.48175048828125, -0.21923828125, 0.04327392578125, 0.3057861328125, 0.56829833984375, 0.830810546875, 1.09332275390625, 1.3558349609375, 1.61834716796875, 1.880859375, 2.14337158203125, 2.4058837890625, 2.66839599609375, 2.930908203125, 3.19342041015625, 3.4559326171875, 3.71844482421875, 3.98095703125, 4.24346923828125, 4.5059814453125, 4.76849365234375, 5.031005859375, 5.29351806640625, 5.5560302734375, 5.81854248046875, 6.0810546875, 6.34356689453125, 6.6060791015625, 6.86859130859375, 7.131103515625, 7.39361572265625, 7.6561279296875, 7.91864013671875, 8.18115234375, 8.44366455078125, 8.7061767578125, 8.96868896484375, 9.231201171875, 9.49371337890625, 9.7562255859375, 10.01873779296875, 10.28125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 5.0, 4.0, 8.0, 14.0, 22.0, 28.0, 45.0, 92.0, 155.0, 295.0, 605.0, 1322.0, 3476.0, 12025.0, 54005.0, 409514.0, 3497753.0, 173002.0, 30179.0, 7385.0, 2396.0, 888.0, 443.0, 234.0, 165.0, 93.0, 54.0, 25.0, 21.0, 12.0, 6.0, 6.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-178.25, -173.056640625, -167.86328125, -162.669921875, -157.4765625, -152.283203125, -147.08984375, -141.896484375, -136.703125, -131.509765625, -126.31640625, -121.123046875, -115.9296875, -110.736328125, -105.54296875, -100.349609375, -95.15625, -89.962890625, -84.76953125, -79.576171875, -74.3828125, -69.189453125, -63.99609375, -58.802734375, -53.609375, -48.416015625, -43.22265625, -38.029296875, -32.8359375, -27.642578125, -22.44921875, -17.255859375, -12.0625, -6.869140625, -1.67578125, 3.517578125, 8.7109375, 13.904296875, 19.09765625, 24.291015625, 29.484375, 34.677734375, 39.87109375, 45.064453125, 50.2578125, 55.451171875, 60.64453125, 65.837890625, 71.03125, 76.224609375, 81.41796875, 86.611328125, 91.8046875, 96.998046875, 102.19140625, 107.384765625, 112.578125, 117.771484375, 122.96484375, 128.158203125, 133.3515625, 138.544921875, 143.73828125, 148.931640625, 154.125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 2.0, 6.0, 8.0, 7.0, 9.0, 14.0, 15.0, 20.0, 13.0, 26.0, 32.0, 43.0, 53.0, 72.0, 71.0, 104.0, 199.0, 301.0, 631.0, 1336.0, 371.0, 206.0, 130.0, 96.0, 67.0, 49.0, 29.0, 31.0, 25.0, 27.0, 12.0, 14.0, 12.0, 12.0, 7.0, 10.0, 7.0, 0.0, 4.0, 0.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.125, -19.4794921875, -18.833984375, -18.1884765625, -17.54296875, -16.8974609375, -16.251953125, -15.6064453125, -14.9609375, -14.3154296875, -13.669921875, -13.0244140625, -12.37890625, -11.7333984375, -11.087890625, -10.4423828125, -9.796875, -9.1513671875, -8.505859375, -7.8603515625, -7.21484375, -6.5693359375, -5.923828125, -5.2783203125, -4.6328125, -3.9873046875, -3.341796875, -2.6962890625, -2.05078125, -1.4052734375, -0.759765625, -0.1142578125, 0.53125, 1.1767578125, 1.822265625, 2.4677734375, 3.11328125, 3.7587890625, 4.404296875, 5.0498046875, 5.6953125, 6.3408203125, 6.986328125, 7.6318359375, 8.27734375, 8.9228515625, 9.568359375, 10.2138671875, 10.859375, 11.5048828125, 12.150390625, 12.7958984375, 13.44140625, 14.0869140625, 14.732421875, 15.3779296875, 16.0234375, 16.6689453125, 17.314453125, 17.9599609375, 18.60546875, 19.2509765625, 19.896484375, 20.5419921875, 21.1875]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 2.0, 1.0, 7.0, 11.0, 21.0, 31.0, 71.0, 141.0, 169.0, 203.0, 155.0, 105.0, 40.0, 31.0, 9.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-408.87091064453125, -399.2136535644531, -389.556396484375, -379.8991394042969, -370.24188232421875, -360.5846252441406, -350.9273681640625, -341.27008056640625, -331.61285400390625, -321.9555969238281, -312.29833984375, -302.6410827636719, -292.98382568359375, -283.3265686035156, -273.6693115234375, -264.01202392578125, -254.35476684570312, -244.697509765625, -235.04025268554688, -225.38299560546875, -215.72573852539062, -206.0684814453125, -196.4112091064453, -186.7539520263672, -177.09669494628906, -167.43943786621094, -157.7821807861328, -148.1249237060547, -138.4676513671875, -128.81039428710938, -119.15313720703125, -109.49588012695312, -99.83863830566406, -90.18138122558594, -80.52412414550781, -70.86685943603516, -61.20960235595703, -51.552345275878906, -41.895084381103516, -32.237823486328125, -22.58056640625, -12.923307418823242, -3.2660484313964844, 6.391210556030273, 16.04846954345703, 25.705726623535156, 35.36298751831055, 45.02024841308594, 54.67750549316406, 64.33476257324219, 73.99201965332031, 83.64928436279297, 93.3065414428711, 102.96379852294922, 112.62106323242188, 122.2783203125, 131.93557739257812, 141.59283447265625, 151.25009155273438, 160.9073486328125, 170.56460571289062, 180.22186279296875, 189.87913513183594, 199.53639221191406, 209.1936492919922]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 4.0, 4.0, 5.0, 12.0, 14.0, 19.0, 21.0, 28.0, 24.0, 32.0, 28.0, 36.0, 39.0, 44.0, 32.0, 46.0, 51.0, 62.0, 46.0, 53.0, 44.0, 55.0, 39.0, 40.0, 32.0, 34.0, 24.0, 25.0, 32.0, 19.0, 10.0, 9.0, 6.0, 5.0, 8.0, 5.0, 5.0, 1.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-97.48548126220703, -94.37825012207031, -91.27101135253906, -88.16378021240234, -85.05654907226562, -81.9493179321289, -78.84207916259766, -75.73484802246094, -72.62761688232422, -69.5203857421875, -66.41314697265625, -63.30591583251953, -60.19868469238281, -57.09144973754883, -53.984214782714844, -50.876983642578125, -47.76974868774414, -44.662513732910156, -41.55528259277344, -38.44804763793945, -35.340816497802734, -32.23358154296875, -29.1263484954834, -26.019115447998047, -22.911882400512695, -19.804649353027344, -16.697416305541992, -13.590182304382324, -10.482949256896973, -7.375716209411621, -4.268482208251953, -1.1612491607666016, 1.94598388671875, 5.053216934204102, 8.160449981689453, 11.267683982849121, 14.374917030334473, 17.48215103149414, 20.589384078979492, 23.696617126464844, 26.803850173950195, 29.911083221435547, 33.01831817626953, 36.12554931640625, 39.232784271240234, 42.34001541137695, 45.44725036621094, 48.554481506347656, 51.66171646118164, 54.768951416015625, 57.876182556152344, 60.98341751098633, 64.09065246582031, 67.19788360595703, 70.30511474609375, 73.412353515625, 76.51958465576172, 79.62681579589844, 82.73405456542969, 85.8412857055664, 88.94851684570312, 92.05574798583984, 95.1629867553711, 98.27021789550781, 101.37744903564453]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 6.0, 7.0, 9.0, 7.0, 12.0, 24.0, 29.0, 36.0, 44.0, 80.0, 97.0, 187.0, 370.0, 729.0, 1826.0, 5809.0, 23604.0, 112616.0, 442906.0, 355471.0, 79904.0, 17403.0, 4425.0, 1475.0, 637.0, 339.0, 142.0, 107.0, 72.0, 49.0, 30.0, 33.0, 19.0, 17.0, 9.0, 10.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-106.5, -103.052734375, -99.60546875, -96.158203125, -92.7109375, -89.263671875, -85.81640625, -82.369140625, -78.921875, -75.474609375, -72.02734375, -68.580078125, -65.1328125, -61.685546875, -58.23828125, -54.791015625, -51.34375, -47.896484375, -44.44921875, -41.001953125, -37.5546875, -34.107421875, -30.66015625, -27.212890625, -23.765625, -20.318359375, -16.87109375, -13.423828125, -9.9765625, -6.529296875, -3.08203125, 0.365234375, 3.8125, 7.259765625, 10.70703125, 14.154296875, 17.6015625, 21.048828125, 24.49609375, 27.943359375, 31.390625, 34.837890625, 38.28515625, 41.732421875, 45.1796875, 48.626953125, 52.07421875, 55.521484375, 58.96875, 62.416015625, 65.86328125, 69.310546875, 72.7578125, 76.205078125, 79.65234375, 83.099609375, 86.546875, 89.994140625, 93.44140625, 96.888671875, 100.3359375, 103.783203125, 107.23046875, 110.677734375, 114.125]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 4.0, 6.0, 9.0, 18.0, 20.0, 24.0, 29.0, 27.0, 49.0, 62.0, 61.0, 57.0, 79.0, 75.0, 62.0, 70.0, 53.0, 41.0, 48.0, 43.0, 38.0, 28.0, 24.0, 25.0, 9.0, 12.0, 12.0, 6.0, 6.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.65625, -6.3404541015625, -6.024658203125, -5.7088623046875, -5.39306640625, -5.0772705078125, -4.761474609375, -4.4456787109375, -4.1298828125, -3.8140869140625, -3.498291015625, -3.1824951171875, -2.86669921875, -2.5509033203125, -2.235107421875, -1.9193115234375, -1.603515625, -1.2877197265625, -0.971923828125, -0.6561279296875, -0.34033203125, -0.0245361328125, 0.291259765625, 0.6070556640625, 0.9228515625, 1.2386474609375, 1.554443359375, 1.8702392578125, 2.18603515625, 2.5018310546875, 2.817626953125, 3.1334228515625, 3.44921875, 3.7650146484375, 4.080810546875, 4.3966064453125, 4.71240234375, 5.0281982421875, 5.343994140625, 5.6597900390625, 5.9755859375, 6.2913818359375, 6.607177734375, 6.9229736328125, 7.23876953125, 7.5545654296875, 7.870361328125, 8.1861572265625, 8.501953125, 8.8177490234375, 9.133544921875, 9.4493408203125, 9.76513671875, 10.0809326171875, 10.396728515625, 10.7125244140625, 11.0283203125, 11.3441162109375, 11.659912109375, 11.9757080078125, 12.29150390625, 12.6072998046875, 12.923095703125, 13.2388916015625, 13.5546875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 2.0, 5.0, 4.0, 7.0, 12.0, 17.0, 20.0, 26.0, 32.0, 39.0, 52.0, 95.0, 97.0, 166.0, 214.0, 282.0, 432.0, 722.0, 1126.0, 1977.0, 3682.0, 7771.0, 18165.0, 46038.0, 120128.0, 275163.0, 315712.0, 153348.0, 60382.0, 22889.0, 9415.0, 4556.0, 2261.0, 1253.0, 781.0, 504.0, 362.0, 256.0, 152.0, 115.0, 84.0, 53.0, 45.0, 41.0, 25.0, 16.0, 16.0, 9.0, 5.0, 7.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-57.0, -55.1083984375, -53.216796875, -51.3251953125, -49.43359375, -47.5419921875, -45.650390625, -43.7587890625, -41.8671875, -39.9755859375, -38.083984375, -36.1923828125, -34.30078125, -32.4091796875, -30.517578125, -28.6259765625, -26.734375, -24.8427734375, -22.951171875, -21.0595703125, -19.16796875, -17.2763671875, -15.384765625, -13.4931640625, -11.6015625, -9.7099609375, -7.818359375, -5.9267578125, -4.03515625, -2.1435546875, -0.251953125, 1.6396484375, 3.53125, 5.4228515625, 7.314453125, 9.2060546875, 11.09765625, 12.9892578125, 14.880859375, 16.7724609375, 18.6640625, 20.5556640625, 22.447265625, 24.3388671875, 26.23046875, 28.1220703125, 30.013671875, 31.9052734375, 33.796875, 35.6884765625, 37.580078125, 39.4716796875, 41.36328125, 43.2548828125, 45.146484375, 47.0380859375, 48.9296875, 50.8212890625, 52.712890625, 54.6044921875, 56.49609375, 58.3876953125, 60.279296875, 62.1708984375, 64.0625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 6.0, 6.0, 3.0, 4.0, 9.0, 12.0, 11.0, 16.0, 14.0, 25.0, 24.0, 36.0, 27.0, 29.0, 27.0, 29.0, 38.0, 37.0, 34.0, 46.0, 42.0, 45.0, 33.0, 45.0, 36.0, 52.0, 50.0, 33.0, 31.0, 26.0, 22.0, 25.0, 24.0, 22.0, 16.0, 8.0, 19.0, 13.0, 10.0, 9.0, 2.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-35.53125, -34.4462890625, -33.361328125, -32.2763671875, -31.19140625, -30.1064453125, -29.021484375, -27.9365234375, -26.8515625, -25.7666015625, -24.681640625, -23.5966796875, -22.51171875, -21.4267578125, -20.341796875, -19.2568359375, -18.171875, -17.0869140625, -16.001953125, -14.9169921875, -13.83203125, -12.7470703125, -11.662109375, -10.5771484375, -9.4921875, -8.4072265625, -7.322265625, -6.2373046875, -5.15234375, -4.0673828125, -2.982421875, -1.8974609375, -0.8125, 0.2724609375, 1.357421875, 2.4423828125, 3.52734375, 4.6123046875, 5.697265625, 6.7822265625, 7.8671875, 8.9521484375, 10.037109375, 11.1220703125, 12.20703125, 13.2919921875, 14.376953125, 15.4619140625, 16.546875, 17.6318359375, 18.716796875, 19.8017578125, 20.88671875, 21.9716796875, 23.056640625, 24.1416015625, 25.2265625, 26.3115234375, 27.396484375, 28.4814453125, 29.56640625, 30.6513671875, 31.736328125, 32.8212890625, 33.90625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 3.0, 1.0, 2.0, 6.0, 6.0, 6.0, 5.0, 8.0, 10.0, 14.0, 23.0, 35.0, 26.0, 78.0, 90.0, 140.0, 255.0, 429.0, 736.0, 1453.0, 3241.0, 8216.0, 24285.0, 87013.0, 360229.0, 412861.0, 104176.0, 28494.0, 9488.0, 3588.0, 1627.0, 813.0, 440.0, 260.0, 170.0, 112.0, 73.0, 40.0, 31.0, 31.0, 20.0, 8.0, 8.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.28125, -35.11328125, -33.9453125, -32.77734375, -31.609375, -30.44140625, -29.2734375, -28.10546875, -26.9375, -25.76953125, -24.6015625, -23.43359375, -22.265625, -21.09765625, -19.9296875, -18.76171875, -17.59375, -16.42578125, -15.2578125, -14.08984375, -12.921875, -11.75390625, -10.5859375, -9.41796875, -8.25, -7.08203125, -5.9140625, -4.74609375, -3.578125, -2.41015625, -1.2421875, -0.07421875, 1.09375, 2.26171875, 3.4296875, 4.59765625, 5.765625, 6.93359375, 8.1015625, 9.26953125, 10.4375, 11.60546875, 12.7734375, 13.94140625, 15.109375, 16.27734375, 17.4453125, 18.61328125, 19.78125, 20.94921875, 22.1171875, 23.28515625, 24.453125, 25.62109375, 26.7890625, 27.95703125, 29.125, 30.29296875, 31.4609375, 32.62890625, 33.796875, 34.96484375, 36.1328125, 37.30078125, 38.46875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 1.0, 6.0, 5.0, 6.0, 9.0, 13.0, 19.0, 25.0, 57.0, 63.0, 94.0, 112.0, 121.0, 128.0, 84.0, 73.0, 53.0, 35.0, 28.0, 20.0, 10.0, 13.0, 10.0, 4.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.00714111328125, -0.006935596466064453, -0.006730079650878906, -0.006524562835693359, -0.0063190460205078125, -0.006113529205322266, -0.005908012390136719, -0.005702495574951172, -0.005496978759765625, -0.005291461944580078, -0.005085945129394531, -0.004880428314208984, -0.0046749114990234375, -0.004469394683837891, -0.004263877868652344, -0.004058361053466797, -0.00385284423828125, -0.003647327423095703, -0.0034418106079101562, -0.0032362937927246094, -0.0030307769775390625, -0.0028252601623535156, -0.0026197433471679688, -0.002414226531982422, -0.002208709716796875, -0.002003192901611328, -0.0017976760864257812, -0.0015921592712402344, -0.0013866424560546875, -0.0011811256408691406, -0.0009756088256835938, -0.0007700920104980469, -0.0005645751953125, -0.0003590583801269531, -0.00015354156494140625, 5.1975250244140625e-05, 0.0002574920654296875, 0.0004630088806152344, 0.0006685256958007812, 0.0008740425109863281, 0.001079559326171875, 0.0012850761413574219, 0.0014905929565429688, 0.0016961097717285156, 0.0019016265869140625, 0.0021071434020996094, 0.0023126602172851562, 0.002518177032470703, 0.00272369384765625, 0.002929210662841797, 0.0031347274780273438, 0.0033402442932128906, 0.0035457611083984375, 0.0037512779235839844, 0.003956794738769531, 0.004162311553955078, 0.004367828369140625, 0.004573345184326172, 0.004778861999511719, 0.004984378814697266, 0.0051898956298828125, 0.005395412445068359, 0.005600929260253906, 0.005806446075439453, 0.006011962890625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 3.0, 6.0, 8.0, 14.0, 10.0, 25.0, 24.0, 44.0, 63.0, 96.0, 146.0, 264.0, 449.0, 741.0, 1500.0, 3378.0, 8956.0, 31288.0, 157999.0, 603846.0, 186862.0, 35584.0, 10026.0, 3606.0, 1626.0, 820.0, 451.0, 267.0, 145.0, 84.0, 60.0, 43.0, 36.0, 22.0, 15.0, 15.0, 9.0, 9.0, 0.0, 6.0, 2.0, 1.0, 0.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-53.03125, -51.49609375, -49.9609375, -48.42578125, -46.890625, -45.35546875, -43.8203125, -42.28515625, -40.75, -39.21484375, -37.6796875, -36.14453125, -34.609375, -33.07421875, -31.5390625, -30.00390625, -28.46875, -26.93359375, -25.3984375, -23.86328125, -22.328125, -20.79296875, -19.2578125, -17.72265625, -16.1875, -14.65234375, -13.1171875, -11.58203125, -10.046875, -8.51171875, -6.9765625, -5.44140625, -3.90625, -2.37109375, -0.8359375, 0.69921875, 2.234375, 3.76953125, 5.3046875, 6.83984375, 8.375, 9.91015625, 11.4453125, 12.98046875, 14.515625, 16.05078125, 17.5859375, 19.12109375, 20.65625, 22.19140625, 23.7265625, 25.26171875, 26.796875, 28.33203125, 29.8671875, 31.40234375, 32.9375, 34.47265625, 36.0078125, 37.54296875, 39.078125, 40.61328125, 42.1484375, 43.68359375, 45.21875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 2.0, 3.0, 4.0, 7.0, 10.0, 8.0, 14.0, 7.0, 14.0, 27.0, 23.0, 30.0, 35.0, 56.0, 54.0, 70.0, 73.0, 93.0, 82.0, 93.0, 53.0, 57.0, 44.0, 24.0, 21.0, 16.0, 13.0, 13.0, 16.0, 7.0, 10.0, 3.0, 4.0, 3.0, 4.0, 3.0, 2.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-19.265625, -18.54248046875, -17.8193359375, -17.09619140625, -16.373046875, -15.64990234375, -14.9267578125, -14.20361328125, -13.48046875, -12.75732421875, -12.0341796875, -11.31103515625, -10.587890625, -9.86474609375, -9.1416015625, -8.41845703125, -7.6953125, -6.97216796875, -6.2490234375, -5.52587890625, -4.802734375, -4.07958984375, -3.3564453125, -2.63330078125, -1.91015625, -1.18701171875, -0.4638671875, 0.25927734375, 0.982421875, 1.70556640625, 2.4287109375, 3.15185546875, 3.875, 4.59814453125, 5.3212890625, 6.04443359375, 6.767578125, 7.49072265625, 8.2138671875, 8.93701171875, 9.66015625, 10.38330078125, 11.1064453125, 11.82958984375, 12.552734375, 13.27587890625, 13.9990234375, 14.72216796875, 15.4453125, 16.16845703125, 16.8916015625, 17.61474609375, 18.337890625, 19.06103515625, 19.7841796875, 20.50732421875, 21.23046875, 21.95361328125, 22.6767578125, 23.39990234375, 24.123046875, 24.84619140625, 25.5693359375, 26.29248046875, 27.015625]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 6.0, 13.0, 14.0, 32.0, 53.0, 120.0, 183.0, 194.0, 172.0, 104.0, 61.0, 28.0, 16.0, 7.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-304.243896484375, -281.3418273925781, -258.4397277832031, -235.53765869140625, -212.63558959960938, -189.73350524902344, -166.8314208984375, -143.92935180664062, -121.02726745605469, -98.12519073486328, -75.22311401367188, -52.32102966308594, -29.41895294189453, -6.516876220703125, 16.385208129882812, 39.28727722167969, 62.189361572265625, 85.09143829345703, 107.99351501464844, 130.89559936523438, 153.79766845703125, 176.6997528076172, 199.60183715820312, 222.50390625, 245.40599060058594, 268.3080749511719, 291.21014404296875, 314.11224365234375, 337.0143127441406, 359.9163818359375, 382.8184814453125, 405.72052001953125, 428.62261962890625, 451.5246887207031, 474.4267883300781, 497.328857421875, 520.23095703125, 543.1329956054688, 566.0350952148438, 588.9371337890625, 611.8392333984375, 634.7413330078125, 657.6433715820312, 680.5454711914062, 703.4475708007812, 726.349609375, 749.251708984375, 772.15380859375, 795.055908203125, 817.9580078125, 840.8600463867188, 863.7621459960938, 886.6642456054688, 909.5662841796875, 932.4683837890625, 955.3704833984375, 978.2725219726562, 1001.1746215820312, 1024.07666015625, 1046.978759765625, 1069.880859375, 1092.782958984375, 1115.68505859375, 1138.5870361328125, 1161.4891357421875]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 3.0, 6.0, 12.0, 15.0, 13.0, 12.0, 17.0, 14.0, 23.0, 25.0, 24.0, 42.0, 29.0, 39.0, 43.0, 53.0, 45.0, 64.0, 55.0, 65.0, 49.0, 46.0, 33.0, 42.0, 48.0, 29.0, 29.0, 25.0, 26.0, 12.0, 18.0, 8.0, 8.0, 11.0, 10.0, 0.0, 2.0, 5.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-292.1956787109375, -284.10540771484375, -276.0151062011719, -267.9248352050781, -259.83453369140625, -251.74424743652344, -243.65396118164062, -235.56369018554688, -227.473388671875, -219.3831024169922, -211.29281616210938, -203.20252990722656, -195.11224365234375, -187.02195739746094, -178.93167114257812, -170.84140014648438, -162.75111389160156, -154.66082763671875, -146.57054138183594, -138.48025512695312, -130.3899688720703, -122.2996826171875, -114.20940399169922, -106.1191177368164, -98.0288314819336, -89.93854522705078, -81.84825897216797, -73.75798034667969, -65.66769409179688, -57.5774040222168, -49.48712158203125, -41.39683532714844, -33.306549072265625, -25.216262817382812, -17.125978469848633, -9.035694122314453, -0.9454078674316406, 7.144878387451172, 15.235160827636719, 23.32544708251953, 31.415733337402344, 39.506019592285156, 47.59630584716797, 55.686588287353516, 63.77687454223633, 71.86715698242188, 79.95744323730469, 88.0477294921875, 96.13801574707031, 104.22830200195312, 112.31858825683594, 120.40887451171875, 128.49916076660156, 136.58944702148438, 144.67971801757812, 152.77001953125, 160.86029052734375, 168.95057678222656, 177.04086303710938, 185.1311492919922, 193.221435546875, 201.3117218017578, 209.40200805664062, 217.49227905273438, 225.58258056640625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 4.0, 9.0, 11.0, 12.0, 18.0, 33.0, 40.0, 62.0, 92.0, 172.0, 260.0, 509.0, 1203.0, 2976.0, 8841.0, 34060.0, 246768.0, 3776784.0, 93582.0, 19125.0, 5749.0, 2061.0, 880.0, 385.0, 242.0, 147.0, 75.0, 65.0, 36.0, 23.0, 14.0, 15.0, 11.0, 7.0, 5.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-153.625, -149.7158203125, -145.806640625, -141.8974609375, -137.98828125, -134.0791015625, -130.169921875, -126.2607421875, -122.3515625, -118.4423828125, -114.533203125, -110.6240234375, -106.71484375, -102.8056640625, -98.896484375, -94.9873046875, -91.078125, -87.1689453125, -83.259765625, -79.3505859375, -75.44140625, -71.5322265625, -67.623046875, -63.7138671875, -59.8046875, -55.8955078125, -51.986328125, -48.0771484375, -44.16796875, -40.2587890625, -36.349609375, -32.4404296875, -28.53125, -24.6220703125, -20.712890625, -16.8037109375, -12.89453125, -8.9853515625, -5.076171875, -1.1669921875, 2.7421875, 6.6513671875, 10.560546875, 14.4697265625, 18.37890625, 22.2880859375, 26.197265625, 30.1064453125, 34.015625, 37.9248046875, 41.833984375, 45.7431640625, 49.65234375, 53.5615234375, 57.470703125, 61.3798828125, 65.2890625, 69.1982421875, 73.107421875, 77.0166015625, 80.92578125, 84.8349609375, 88.744140625, 92.6533203125, 96.5625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 5.0, 10.0, 8.0, 9.0, 22.0, 27.0, 31.0, 35.0, 45.0, 57.0, 43.0, 73.0, 62.0, 71.0, 80.0, 76.0, 59.0, 49.0, 53.0, 48.0, 34.0, 23.0, 24.0, 18.0, 10.0, 9.0, 8.0, 8.0, 9.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.87109375, -6.52911376953125, -6.1871337890625, -5.84515380859375, -5.503173828125, -5.16119384765625, -4.8192138671875, -4.47723388671875, -4.13525390625, -3.79327392578125, -3.4512939453125, -3.10931396484375, -2.767333984375, -2.42535400390625, -2.0833740234375, -1.74139404296875, -1.3994140625, -1.05743408203125, -0.7154541015625, -0.37347412109375, -0.031494140625, 0.31048583984375, 0.6524658203125, 0.99444580078125, 1.33642578125, 1.67840576171875, 2.0203857421875, 2.36236572265625, 2.704345703125, 3.04632568359375, 3.3883056640625, 3.73028564453125, 4.072265625, 4.41424560546875, 4.7562255859375, 5.09820556640625, 5.440185546875, 5.78216552734375, 6.1241455078125, 6.46612548828125, 6.80810546875, 7.15008544921875, 7.4920654296875, 7.83404541015625, 8.176025390625, 8.51800537109375, 8.8599853515625, 9.20196533203125, 9.5439453125, 9.88592529296875, 10.2279052734375, 10.56988525390625, 10.911865234375, 11.25384521484375, 11.5958251953125, 11.93780517578125, 12.27978515625, 12.62176513671875, 12.9637451171875, 13.30572509765625, 13.647705078125, 13.98968505859375, 14.3316650390625, 14.67364501953125, 15.015625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 4.0, 8.0, 10.0, 16.0, 23.0, 29.0, 49.0, 72.0, 166.0, 321.0, 850.0, 2653.0, 11243.0, 66159.0, 3414334.0, 645085.0, 42444.0, 7654.0, 2003.0, 636.0, 258.0, 107.0, 65.0, 39.0, 27.0, 9.0, 8.0, 5.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-184.0, -179.01171875, -174.0234375, -169.03515625, -164.046875, -159.05859375, -154.0703125, -149.08203125, -144.09375, -139.10546875, -134.1171875, -129.12890625, -124.140625, -119.15234375, -114.1640625, -109.17578125, -104.1875, -99.19921875, -94.2109375, -89.22265625, -84.234375, -79.24609375, -74.2578125, -69.26953125, -64.28125, -59.29296875, -54.3046875, -49.31640625, -44.328125, -39.33984375, -34.3515625, -29.36328125, -24.375, -19.38671875, -14.3984375, -9.41015625, -4.421875, 0.56640625, 5.5546875, 10.54296875, 15.53125, 20.51953125, 25.5078125, 30.49609375, 35.484375, 40.47265625, 45.4609375, 50.44921875, 55.4375, 60.42578125, 65.4140625, 70.40234375, 75.390625, 80.37890625, 85.3671875, 90.35546875, 95.34375, 100.33203125, 105.3203125, 110.30859375, 115.296875, 120.28515625, 125.2734375, 130.26171875, 135.25]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 7.0, 13.0, 13.0, 29.0, 35.0, 36.0, 79.0, 137.0, 355.0, 2153.0, 684.0, 204.0, 120.0, 92.0, 40.0, 25.0, 16.0, 17.0, 8.0, 5.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-48.6875, -47.623291015625, -46.55908203125, -45.494873046875, -44.4306640625, -43.366455078125, -42.30224609375, -41.238037109375, -40.173828125, -39.109619140625, -38.04541015625, -36.981201171875, -35.9169921875, -34.852783203125, -33.78857421875, -32.724365234375, -31.66015625, -30.595947265625, -29.53173828125, -28.467529296875, -27.4033203125, -26.339111328125, -25.27490234375, -24.210693359375, -23.146484375, -22.082275390625, -21.01806640625, -19.953857421875, -18.8896484375, -17.825439453125, -16.76123046875, -15.697021484375, -14.6328125, -13.568603515625, -12.50439453125, -11.440185546875, -10.3759765625, -9.311767578125, -8.24755859375, -7.183349609375, -6.119140625, -5.054931640625, -3.99072265625, -2.926513671875, -1.8623046875, -0.798095703125, 0.26611328125, 1.330322265625, 2.39453125, 3.458740234375, 4.52294921875, 5.587158203125, 6.6513671875, 7.715576171875, 8.77978515625, 9.843994140625, 10.908203125, 11.972412109375, 13.03662109375, 14.100830078125, 15.1650390625, 16.229248046875, 17.29345703125, 18.357666015625, 19.421875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 1.0, 1.0, 4.0, 6.0, 7.0, 17.0, 26.0, 32.0, 56.0, 70.0, 114.0, 151.0, 136.0, 135.0, 97.0, 53.0, 30.0, 18.0, 17.0, 10.0, 9.0, 1.0, 3.0, 5.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-214.3878936767578, -209.1502685546875, -203.91262817382812, -198.6750030517578, -193.4373779296875, -188.1997528076172, -182.96212768554688, -177.7244873046875, -172.4868621826172, -167.24923706054688, -162.0115966796875, -156.7739715576172, -151.53634643554688, -146.29872131347656, -141.06109619140625, -135.82345581054688, -130.58583068847656, -125.34820556640625, -120.1105728149414, -114.87294006347656, -109.63531494140625, -104.39768981933594, -99.1600570678711, -93.92242431640625, -88.68479919433594, -83.44717407226562, -78.20954132080078, -72.97190856933594, -67.73428344726562, -62.49665451049805, -57.25902557373047, -52.02139663696289, -46.78375244140625, -41.54612350463867, -36.308494567871094, -31.070865631103516, -25.833236694335938, -20.59560775756836, -15.357978820800781, -10.120349884033203, -4.882720947265625, 0.3549079895019531, 5.592536926269531, 10.83016586303711, 16.067794799804688, 21.305423736572266, 26.543052673339844, 31.780681610107422, 37.018310546875, 42.25593948364258, 47.493568420410156, 52.731197357177734, 57.96882629394531, 63.20645523071289, 68.44408416748047, 73.68171691894531, 78.91934204101562, 84.15696716308594, 89.39459991455078, 94.63223266601562, 99.86985778808594, 105.10748291015625, 110.3451156616211, 115.58274841308594, 120.82037353515625]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 8.0, 4.0, 12.0, 6.0, 10.0, 10.0, 18.0, 22.0, 20.0, 27.0, 28.0, 32.0, 47.0, 34.0, 51.0, 51.0, 41.0, 45.0, 52.0, 44.0, 60.0, 42.0, 46.0, 26.0, 27.0, 38.0, 33.0, 34.0, 19.0, 27.0, 19.0, 17.0, 7.0, 13.0, 12.0, 6.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-84.69847106933594, -82.26068878173828, -79.82290649414062, -77.38512420654297, -74.94734191894531, -72.50955963134766, -70.07177734375, -67.63398742675781, -65.19621276855469, -62.75843048095703, -60.320648193359375, -57.88286590576172, -55.44508361816406, -53.007301330566406, -50.569515228271484, -48.13173294067383, -45.693946838378906, -43.25616455078125, -40.818382263183594, -38.38059997558594, -35.94281768798828, -33.505035400390625, -31.067249298095703, -28.629467010498047, -26.19168472290039, -23.753902435302734, -21.316120147705078, -18.87833595275879, -16.440553665161133, -14.002771377563477, -11.564988136291504, -9.127204895019531, -6.689422607421875, -4.2516398429870605, -1.813857078552246, 0.6239256858825684, 3.061708450317383, 5.499490737915039, 7.937273979187012, 10.375057220458984, 12.81283950805664, 15.250621795654297, 17.688404083251953, 20.126188278198242, 22.5639705657959, 25.001752853393555, 27.439537048339844, 29.8773193359375, 32.315101623535156, 34.75288391113281, 37.19066619873047, 39.628448486328125, 42.06623077392578, 44.50401306152344, 46.94179916381836, 49.379581451416016, 51.81736373901367, 54.25514602661133, 56.692928314208984, 59.13071060180664, 61.56849670410156, 64.00627899169922, 66.44406127929688, 68.88184356689453, 71.31962585449219]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 2.0, 3.0, 7.0, 6.0, 11.0, 11.0, 21.0, 24.0, 32.0, 34.0, 61.0, 83.0, 137.0, 249.0, 334.0, 656.0, 1348.0, 2852.0, 6764.0, 19141.0, 61319.0, 209655.0, 439890.0, 212006.0, 61926.0, 19262.0, 6763.0, 2827.0, 1355.0, 669.0, 387.0, 237.0, 155.0, 88.0, 65.0, 40.0, 35.0, 18.0, 24.0, 14.0, 12.0, 6.0, 8.0, 4.0, 2.0, 2.0, 3.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-78.6875, -76.0205078125, -73.353515625, -70.6865234375, -68.01953125, -65.3525390625, -62.685546875, -60.0185546875, -57.3515625, -54.6845703125, -52.017578125, -49.3505859375, -46.68359375, -44.0166015625, -41.349609375, -38.6826171875, -36.015625, -33.3486328125, -30.681640625, -28.0146484375, -25.34765625, -22.6806640625, -20.013671875, -17.3466796875, -14.6796875, -12.0126953125, -9.345703125, -6.6787109375, -4.01171875, -1.3447265625, 1.322265625, 3.9892578125, 6.65625, 9.3232421875, 11.990234375, 14.6572265625, 17.32421875, 19.9912109375, 22.658203125, 25.3251953125, 27.9921875, 30.6591796875, 33.326171875, 35.9931640625, 38.66015625, 41.3271484375, 43.994140625, 46.6611328125, 49.328125, 51.9951171875, 54.662109375, 57.3291015625, 59.99609375, 62.6630859375, 65.330078125, 67.9970703125, 70.6640625, 73.3310546875, 75.998046875, 78.6650390625, 81.33203125, 83.9990234375, 86.666015625, 89.3330078125, 92.0]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 3.0, 7.0, 5.0, 15.0, 15.0, 13.0, 22.0, 25.0, 46.0, 44.0, 58.0, 57.0, 59.0, 74.0, 77.0, 85.0, 56.0, 60.0, 58.0, 48.0, 41.0, 43.0, 30.0, 20.0, 15.0, 10.0, 5.0, 7.0, 8.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.47265625, -6.11126708984375, -5.7498779296875, -5.38848876953125, -5.027099609375, -4.66571044921875, -4.3043212890625, -3.94293212890625, -3.58154296875, -3.22015380859375, -2.8587646484375, -2.49737548828125, -2.135986328125, -1.77459716796875, -1.4132080078125, -1.05181884765625, -0.6904296875, -0.32904052734375, 0.0323486328125, 0.39373779296875, 0.755126953125, 1.11651611328125, 1.4779052734375, 1.83929443359375, 2.20068359375, 2.56207275390625, 2.9234619140625, 3.28485107421875, 3.646240234375, 4.00762939453125, 4.3690185546875, 4.73040771484375, 5.091796875, 5.45318603515625, 5.8145751953125, 6.17596435546875, 6.537353515625, 6.89874267578125, 7.2601318359375, 7.62152099609375, 7.98291015625, 8.34429931640625, 8.7056884765625, 9.06707763671875, 9.428466796875, 9.78985595703125, 10.1512451171875, 10.51263427734375, 10.8740234375, 11.23541259765625, 11.5968017578125, 11.95819091796875, 12.319580078125, 12.68096923828125, 13.0423583984375, 13.40374755859375, 13.76513671875, 14.12652587890625, 14.4879150390625, 14.84930419921875, 15.210693359375, 15.57208251953125, 15.9334716796875, 16.29486083984375, 16.65625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 4.0, 12.0, 12.0, 12.0, 17.0, 21.0, 34.0, 46.0, 81.0, 106.0, 143.0, 197.0, 294.0, 411.0, 599.0, 947.0, 1567.0, 2872.0, 5802.0, 13245.0, 33511.0, 89191.0, 223958.0, 342798.0, 201187.0, 78171.0, 29512.0, 11574.0, 5358.0, 2635.0, 1491.0, 839.0, 558.0, 400.0, 279.0, 186.0, 153.0, 92.0, 59.0, 52.0, 40.0, 23.0, 23.0, 17.0, 14.0, 2.0, 5.0, 3.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.40625, -49.65966796875, -47.9130859375, -46.16650390625, -44.419921875, -42.67333984375, -40.9267578125, -39.18017578125, -37.43359375, -35.68701171875, -33.9404296875, -32.19384765625, -30.447265625, -28.70068359375, -26.9541015625, -25.20751953125, -23.4609375, -21.71435546875, -19.9677734375, -18.22119140625, -16.474609375, -14.72802734375, -12.9814453125, -11.23486328125, -9.48828125, -7.74169921875, -5.9951171875, -4.24853515625, -2.501953125, -0.75537109375, 0.9912109375, 2.73779296875, 4.484375, 6.23095703125, 7.9775390625, 9.72412109375, 11.470703125, 13.21728515625, 14.9638671875, 16.71044921875, 18.45703125, 20.20361328125, 21.9501953125, 23.69677734375, 25.443359375, 27.18994140625, 28.9365234375, 30.68310546875, 32.4296875, 34.17626953125, 35.9228515625, 37.66943359375, 39.416015625, 41.16259765625, 42.9091796875, 44.65576171875, 46.40234375, 48.14892578125, 49.8955078125, 51.64208984375, 53.388671875, 55.13525390625, 56.8818359375, 58.62841796875, 60.375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 9.0, 1.0, 10.0, 6.0, 9.0, 12.0, 17.0, 19.0, 16.0, 18.0, 23.0, 24.0, 16.0, 49.0, 31.0, 39.0, 35.0, 32.0, 44.0, 43.0, 34.0, 42.0, 51.0, 33.0, 45.0, 39.0, 32.0, 24.0, 33.0, 28.0, 32.0, 24.0, 21.0, 16.0, 22.0, 11.0, 14.0, 8.0, 9.0, 3.0, 7.0, 5.0, 3.0, 4.0, 4.0, 3.0, 0.0, 2.0, 0.0, 2.0], "bins": [-36.21875, -35.1708984375, -34.123046875, -33.0751953125, -32.02734375, -30.9794921875, -29.931640625, -28.8837890625, -27.8359375, -26.7880859375, -25.740234375, -24.6923828125, -23.64453125, -22.5966796875, -21.548828125, -20.5009765625, -19.453125, -18.4052734375, -17.357421875, -16.3095703125, -15.26171875, -14.2138671875, -13.166015625, -12.1181640625, -11.0703125, -10.0224609375, -8.974609375, -7.9267578125, -6.87890625, -5.8310546875, -4.783203125, -3.7353515625, -2.6875, -1.6396484375, -0.591796875, 0.4560546875, 1.50390625, 2.5517578125, 3.599609375, 4.6474609375, 5.6953125, 6.7431640625, 7.791015625, 8.8388671875, 9.88671875, 10.9345703125, 11.982421875, 13.0302734375, 14.078125, 15.1259765625, 16.173828125, 17.2216796875, 18.26953125, 19.3173828125, 20.365234375, 21.4130859375, 22.4609375, 23.5087890625, 24.556640625, 25.6044921875, 26.65234375, 27.7001953125, 28.748046875, 29.7958984375, 30.84375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 5.0, 2.0, 6.0, 5.0, 17.0, 19.0, 24.0, 44.0, 70.0, 82.0, 134.0, 231.0, 391.0, 690.0, 1358.0, 3055.0, 10739.0, 448750.0, 564920.0, 11533.0, 3210.0, 1468.0, 743.0, 397.0, 252.0, 137.0, 91.0, 44.0, 43.0, 34.0, 18.0, 15.0, 5.0, 8.0, 7.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-123.75, -119.486328125, -115.22265625, -110.958984375, -106.6953125, -102.431640625, -98.16796875, -93.904296875, -89.640625, -85.376953125, -81.11328125, -76.849609375, -72.5859375, -68.322265625, -64.05859375, -59.794921875, -55.53125, -51.267578125, -47.00390625, -42.740234375, -38.4765625, -34.212890625, -29.94921875, -25.685546875, -21.421875, -17.158203125, -12.89453125, -8.630859375, -4.3671875, -0.103515625, 4.16015625, 8.423828125, 12.6875, 16.951171875, 21.21484375, 25.478515625, 29.7421875, 34.005859375, 38.26953125, 42.533203125, 46.796875, 51.060546875, 55.32421875, 59.587890625, 63.8515625, 68.115234375, 72.37890625, 76.642578125, 80.90625, 85.169921875, 89.43359375, 93.697265625, 97.9609375, 102.224609375, 106.48828125, 110.751953125, 115.015625, 119.279296875, 123.54296875, 127.806640625, 132.0703125, 136.333984375, 140.59765625, 144.861328125, 149.125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 6.0, 4.0, 7.0, 25.0, 42.0, 119.0, 282.0, 293.0, 132.0, 44.0, 25.0, 12.0, 3.0, 1.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0218048095703125, -0.021214723587036133, -0.020624637603759766, -0.0200345516204834, -0.01944446563720703, -0.018854379653930664, -0.018264293670654297, -0.01767420768737793, -0.017084121704101562, -0.016494035720825195, -0.015903949737548828, -0.015313863754272461, -0.014723777770996094, -0.014133691787719727, -0.01354360580444336, -0.012953519821166992, -0.012363433837890625, -0.011773347854614258, -0.01118326187133789, -0.010593175888061523, -0.010003089904785156, -0.009413003921508789, -0.008822917938232422, -0.008232831954956055, -0.0076427459716796875, -0.00705265998840332, -0.006462574005126953, -0.005872488021850586, -0.005282402038574219, -0.0046923160552978516, -0.004102230072021484, -0.003512144088745117, -0.00292205810546875, -0.002331972122192383, -0.0017418861389160156, -0.0011518001556396484, -0.0005617141723632812, 2.8371810913085938e-05, 0.0006184577941894531, 0.0012085437774658203, 0.0017986297607421875, 0.0023887157440185547, 0.002978801727294922, 0.003568887710571289, 0.004158973693847656, 0.0047490596771240234, 0.005339145660400391, 0.005929231643676758, 0.006519317626953125, 0.007109403610229492, 0.007699489593505859, 0.008289575576782227, 0.008879661560058594, 0.009469747543334961, 0.010059833526611328, 0.010649919509887695, 0.011240005493164062, 0.01183009147644043, 0.012420177459716797, 0.013010263442993164, 0.013600349426269531, 0.014190435409545898, 0.014780521392822266, 0.015370607376098633, 0.015960693359375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 8.0, 14.0, 12.0, 22.0, 29.0, 39.0, 58.0, 97.0, 165.0, 315.0, 674.0, 1807.0, 7281.0, 568428.0, 459514.0, 6794.0, 1873.0, 699.0, 301.0, 163.0, 95.0, 59.0, 35.0, 18.0, 18.0, 4.0, 9.0, 3.0, 6.0, 1.0, 3.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-219.0, -212.9140625, -206.828125, -200.7421875, -194.65625, -188.5703125, -182.484375, -176.3984375, -170.3125, -164.2265625, -158.140625, -152.0546875, -145.96875, -139.8828125, -133.796875, -127.7109375, -121.625, -115.5390625, -109.453125, -103.3671875, -97.28125, -91.1953125, -85.109375, -79.0234375, -72.9375, -66.8515625, -60.765625, -54.6796875, -48.59375, -42.5078125, -36.421875, -30.3359375, -24.25, -18.1640625, -12.078125, -5.9921875, 0.09375, 6.1796875, 12.265625, 18.3515625, 24.4375, 30.5234375, 36.609375, 42.6953125, 48.78125, 54.8671875, 60.953125, 67.0390625, 73.125, 79.2109375, 85.296875, 91.3828125, 97.46875, 103.5546875, 109.640625, 115.7265625, 121.8125, 127.8984375, 133.984375, 140.0703125, 146.15625, 152.2421875, 158.328125, 164.4140625, 170.5]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 0.0, 2.0, 3.0, 4.0, 6.0, 16.0, 17.0, 40.0, 42.0, 80.0, 79.0, 152.0, 193.0, 137.0, 89.0, 59.0, 26.0, 18.0, 14.0, 6.0, 9.0, 5.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0], "bins": [-56.21875, -54.8837890625, -53.548828125, -52.2138671875, -50.87890625, -49.5439453125, -48.208984375, -46.8740234375, -45.5390625, -44.2041015625, -42.869140625, -41.5341796875, -40.19921875, -38.8642578125, -37.529296875, -36.1943359375, -34.859375, -33.5244140625, -32.189453125, -30.8544921875, -29.51953125, -28.1845703125, -26.849609375, -25.5146484375, -24.1796875, -22.8447265625, -21.509765625, -20.1748046875, -18.83984375, -17.5048828125, -16.169921875, -14.8349609375, -13.5, -12.1650390625, -10.830078125, -9.4951171875, -8.16015625, -6.8251953125, -5.490234375, -4.1552734375, -2.8203125, -1.4853515625, -0.150390625, 1.1845703125, 2.51953125, 3.8544921875, 5.189453125, 6.5244140625, 7.859375, 9.1943359375, 10.529296875, 11.8642578125, 13.19921875, 14.5341796875, 15.869140625, 17.2041015625, 18.5390625, 19.8740234375, 21.208984375, 22.5439453125, 23.87890625, 25.2138671875, 26.548828125, 27.8837890625, 29.21875]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 7.0, 5.0, 9.0, 14.0, 20.0, 23.0, 52.0, 73.0, 92.0, 110.0, 117.0, 105.0, 107.0, 64.0, 57.0, 49.0, 30.0, 21.0, 12.0, 9.0, 5.0, 6.0, 3.0, 3.0, 4.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-397.07916259765625, -382.76373291015625, -368.4482727050781, -354.1328430175781, -339.8173828125, -325.501953125, -311.1865234375, -296.87109375, -282.5556335449219, -268.2402038574219, -253.92474365234375, -239.60931396484375, -225.2938690185547, -210.97842407226562, -196.66299438476562, -182.34754943847656, -168.0321044921875, -153.71665954589844, -139.40121459960938, -125.08578491210938, -110.77033996582031, -96.45489501953125, -82.13945770263672, -67.82402038574219, -53.508575439453125, -39.19313430786133, -24.87769317626953, -10.562252044677734, 3.7531890869140625, 18.068634033203125, 32.384071350097656, 46.69950866699219, 61.01495361328125, 75.33039855957031, 89.64583587646484, 103.96127319335938, 118.27671813964844, 132.5921630859375, 146.9075927734375, 161.22303771972656, 175.53848266601562, 189.8539276123047, 204.16937255859375, 218.48480224609375, 232.8002471923828, 247.11569213867188, 261.4311218261719, 275.74658203125, 290.06201171875, 304.37744140625, 318.6929016113281, 333.0083312988281, 347.32379150390625, 361.63922119140625, 375.95465087890625, 390.27008056640625, 404.5855407714844, 418.9009704589844, 433.2164306640625, 447.5318603515625, 461.8472900390625, 476.1627502441406, 490.4781799316406, 504.79364013671875, 519.1090698242188]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 3.0, 6.0, 5.0, 5.0, 3.0, 7.0, 7.0, 17.0, 14.0, 14.0, 20.0, 21.0, 24.0, 21.0, 29.0, 35.0, 41.0, 31.0, 52.0, 50.0, 44.0, 42.0, 35.0, 54.0, 46.0, 33.0, 53.0, 41.0, 26.0, 25.0, 32.0, 31.0, 16.0, 15.0, 23.0, 19.0, 23.0, 6.0, 11.0, 5.0, 5.0, 5.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-210.11585998535156, -203.5716552734375, -197.0274658203125, -190.48326110839844, -183.93905639648438, -177.3948516845703, -170.85064697265625, -164.30645751953125, -157.7622528076172, -151.21804809570312, -144.67385864257812, -138.12965393066406, -131.58544921875, -125.04124450683594, -118.4970474243164, -111.95285034179688, -105.40864562988281, -98.86444091796875, -92.32024383544922, -85.77604675292969, -79.23184204101562, -72.68763732910156, -66.14344024658203, -59.599239349365234, -53.05503845214844, -46.51083755493164, -39.966636657714844, -33.42243576049805, -26.87823486328125, -20.334033966064453, -13.789833068847656, -7.245632171630859, -0.701446533203125, 5.842754364013672, 12.386955261230469, 18.931156158447266, 25.475357055664062, 32.01955795288086, 38.563758850097656, 45.10795974731445, 51.65216064453125, 58.19636154174805, 64.74056243896484, 71.28475952148438, 77.82896423339844, 84.3731689453125, 90.91736602783203, 97.46156311035156, 104.00576782226562, 110.54997253417969, 117.09416961669922, 123.63836669921875, 130.1825714111328, 136.72677612304688, 143.27096557617188, 149.81517028808594, 156.359375, 162.90357971191406, 169.44778442382812, 175.99197387695312, 182.5361785888672, 189.08038330078125, 195.62457275390625, 202.1687774658203, 208.71298217773438]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 2.0, 3.0, 6.0, 6.0, 14.0, 23.0, 27.0, 35.0, 70.0, 89.0, 131.0, 222.0, 415.0, 715.0, 1489.0, 3575.0, 9090.0, 28129.0, 122101.0, 3255549.0, 667685.0, 73701.0, 19239.0, 6573.0, 2699.0, 1244.0, 572.0, 332.0, 191.0, 116.0, 70.0, 42.0, 33.0, 24.0, 27.0, 17.0, 7.0, 5.0, 7.0, 6.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-104.125, -100.955078125, -97.78515625, -94.615234375, -91.4453125, -88.275390625, -85.10546875, -81.935546875, -78.765625, -75.595703125, -72.42578125, -69.255859375, -66.0859375, -62.916015625, -59.74609375, -56.576171875, -53.40625, -50.236328125, -47.06640625, -43.896484375, -40.7265625, -37.556640625, -34.38671875, -31.216796875, -28.046875, -24.876953125, -21.70703125, -18.537109375, -15.3671875, -12.197265625, -9.02734375, -5.857421875, -2.6875, 0.482421875, 3.65234375, 6.822265625, 9.9921875, 13.162109375, 16.33203125, 19.501953125, 22.671875, 25.841796875, 29.01171875, 32.181640625, 35.3515625, 38.521484375, 41.69140625, 44.861328125, 48.03125, 51.201171875, 54.37109375, 57.541015625, 60.7109375, 63.880859375, 67.05078125, 70.220703125, 73.390625, 76.560546875, 79.73046875, 82.900390625, 86.0703125, 89.240234375, 92.41015625, 95.580078125, 98.75]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 7.0, 5.0, 7.0, 11.0, 14.0, 22.0, 19.0, 24.0, 31.0, 57.0, 42.0, 66.0, 70.0, 69.0, 81.0, 71.0, 68.0, 57.0, 59.0, 58.0, 48.0, 40.0, 28.0, 17.0, 9.0, 14.0, 5.0, 8.0, 4.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.46875, -7.09228515625, -6.7158203125, -6.33935546875, -5.962890625, -5.58642578125, -5.2099609375, -4.83349609375, -4.45703125, -4.08056640625, -3.7041015625, -3.32763671875, -2.951171875, -2.57470703125, -2.1982421875, -1.82177734375, -1.4453125, -1.06884765625, -0.6923828125, -0.31591796875, 0.060546875, 0.43701171875, 0.8134765625, 1.18994140625, 1.56640625, 1.94287109375, 2.3193359375, 2.69580078125, 3.072265625, 3.44873046875, 3.8251953125, 4.20166015625, 4.578125, 4.95458984375, 5.3310546875, 5.70751953125, 6.083984375, 6.46044921875, 6.8369140625, 7.21337890625, 7.58984375, 7.96630859375, 8.3427734375, 8.71923828125, 9.095703125, 9.47216796875, 9.8486328125, 10.22509765625, 10.6015625, 10.97802734375, 11.3544921875, 11.73095703125, 12.107421875, 12.48388671875, 12.8603515625, 13.23681640625, 13.61328125, 13.98974609375, 14.3662109375, 14.74267578125, 15.119140625, 15.49560546875, 15.8720703125, 16.24853515625, 16.625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 5.0, 5.0, 7.0, 9.0, 11.0, 13.0, 20.0, 27.0, 44.0, 63.0, 113.0, 199.0, 300.0, 589.0, 967.0, 2027.0, 4647.0, 11684.0, 36738.0, 151545.0, 2843751.0, 987045.0, 108110.0, 28555.0, 9918.0, 3993.0, 1773.0, 861.0, 457.0, 306.0, 165.0, 109.0, 74.0, 43.0, 37.0, 24.0, 14.0, 14.0, 4.0, 2.0, 4.0, 5.0, 9.0, 2.0, 1.0, 3.0, 2.0, 1.0], "bins": [-109.875, -106.896484375, -103.91796875, -100.939453125, -97.9609375, -94.982421875, -92.00390625, -89.025390625, -86.046875, -83.068359375, -80.08984375, -77.111328125, -74.1328125, -71.154296875, -68.17578125, -65.197265625, -62.21875, -59.240234375, -56.26171875, -53.283203125, -50.3046875, -47.326171875, -44.34765625, -41.369140625, -38.390625, -35.412109375, -32.43359375, -29.455078125, -26.4765625, -23.498046875, -20.51953125, -17.541015625, -14.5625, -11.583984375, -8.60546875, -5.626953125, -2.6484375, 0.330078125, 3.30859375, 6.287109375, 9.265625, 12.244140625, 15.22265625, 18.201171875, 21.1796875, 24.158203125, 27.13671875, 30.115234375, 33.09375, 36.072265625, 39.05078125, 42.029296875, 45.0078125, 47.986328125, 50.96484375, 53.943359375, 56.921875, 59.900390625, 62.87890625, 65.857421875, 68.8359375, 71.814453125, 74.79296875, 77.771484375, 80.75]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 7.0, 6.0, 6.0, 12.0, 6.0, 13.0, 14.0, 21.0, 33.0, 38.0, 60.0, 98.0, 102.0, 173.0, 293.0, 659.0, 1335.0, 430.0, 230.0, 141.0, 89.0, 77.0, 48.0, 40.0, 26.0, 26.0, 32.0, 13.0, 13.0, 10.0, 9.0, 7.0, 4.0, 1.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.296875, -26.394287109375, -25.49169921875, -24.589111328125, -23.6865234375, -22.783935546875, -21.88134765625, -20.978759765625, -20.076171875, -19.173583984375, -18.27099609375, -17.368408203125, -16.4658203125, -15.563232421875, -14.66064453125, -13.758056640625, -12.85546875, -11.952880859375, -11.05029296875, -10.147705078125, -9.2451171875, -8.342529296875, -7.43994140625, -6.537353515625, -5.634765625, -4.732177734375, -3.82958984375, -2.927001953125, -2.0244140625, -1.121826171875, -0.21923828125, 0.683349609375, 1.5859375, 2.488525390625, 3.39111328125, 4.293701171875, 5.1962890625, 6.098876953125, 7.00146484375, 7.904052734375, 8.806640625, 9.709228515625, 10.61181640625, 11.514404296875, 12.4169921875, 13.319580078125, 14.22216796875, 15.124755859375, 16.02734375, 16.929931640625, 17.83251953125, 18.735107421875, 19.6376953125, 20.540283203125, 21.44287109375, 22.345458984375, 23.248046875, 24.150634765625, 25.05322265625, 25.955810546875, 26.8583984375, 27.760986328125, 28.66357421875, 29.566162109375, 30.46875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 11.0, 18.0, 45.0, 86.0, 184.0, 233.0, 188.0, 128.0, 53.0, 29.0, 9.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-370.48114013671875, -355.9477844238281, -341.4144592285156, -326.881103515625, -312.3477783203125, -297.8144226074219, -283.28106689453125, -268.74774169921875, -254.21438598632812, -239.68104553222656, -225.147705078125, -210.61434936523438, -196.0810089111328, -181.54766845703125, -167.0143280029297, -152.48098754882812, -137.94764709472656, -123.414306640625, -108.8809585571289, -94.34761810302734, -79.81427001953125, -65.28092956542969, -50.747589111328125, -36.21424102783203, -21.68090057373047, -7.147557258605957, 7.385786056518555, 21.91912841796875, 36.45247268676758, 50.985816955566406, 65.51915740966797, 80.05250549316406, 94.58584594726562, 109.11918640136719, 123.65253448486328, 138.18588256835938, 152.71922302246094, 167.2525634765625, 181.78590393066406, 196.31924438476562, 210.85260009765625, 225.3859405517578, 239.91928100585938, 254.45263671875, 268.9859619140625, 283.5193176269531, 298.05267333984375, 312.58599853515625, 327.11932373046875, 341.6526794433594, 356.1860046386719, 370.7193603515625, 385.252685546875, 399.7860412597656, 414.31939697265625, 428.85272216796875, 443.3860778808594, 457.91943359375, 472.4527587890625, 486.9861145019531, 501.5194396972656, 516.0527954101562, 530.5861206054688, 545.1195068359375, 559.65283203125]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 6.0, 7.0, 5.0, 9.0, 14.0, 14.0, 14.0, 19.0, 36.0, 36.0, 47.0, 46.0, 47.0, 51.0, 48.0, 55.0, 53.0, 47.0, 55.0, 58.0, 51.0, 34.0, 46.0, 26.0, 26.0, 28.0, 24.0, 26.0, 17.0, 13.0, 11.0, 11.0, 11.0, 6.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-117.26533508300781, -112.77194213867188, -108.27854919433594, -103.78515625, -99.29176330566406, -94.79837036132812, -90.30496978759766, -85.81157684326172, -81.31818389892578, -76.82479095458984, -72.3313980102539, -67.83800506591797, -63.344608306884766, -58.85121536254883, -54.357818603515625, -49.86442565917969, -45.37103271484375, -40.87763977050781, -36.384246826171875, -31.890850067138672, -27.397457122802734, -22.904064178466797, -18.410669326782227, -13.917274475097656, -9.423881530761719, -4.930487632751465, -0.43709373474121094, 4.056300163269043, 8.549694061279297, 13.043087005615234, 17.536481857299805, 22.029876708984375, 26.52325439453125, 31.016647338867188, 35.510040283203125, 40.00343704223633, 44.496829986572266, 48.9902229309082, 53.483619689941406, 57.977012634277344, 62.47040557861328, 66.96379852294922, 71.45719146728516, 75.9505844116211, 80.44398498535156, 84.9373779296875, 89.43077087402344, 93.92416381835938, 98.41755676269531, 102.91094970703125, 107.40434265136719, 111.89773559570312, 116.39112854003906, 120.884521484375, 125.37792205810547, 129.87130737304688, 134.36471557617188, 138.8581085205078, 143.35150146484375, 147.8448944091797, 152.33828735351562, 156.83168029785156, 161.3250732421875, 165.8184814453125, 170.31185913085938]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 7.0, 6.0, 13.0, 14.0, 20.0, 40.0, 42.0, 85.0, 84.0, 198.0, 326.0, 600.0, 1395.0, 3709.0, 12213.0, 53330.0, 254996.0, 530899.0, 146864.0, 31266.0, 7822.0, 2489.0, 947.0, 479.0, 250.0, 145.0, 86.0, 61.0, 44.0, 29.0, 28.0, 13.0, 15.0, 6.0, 6.0, 7.0, 4.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-121.5625, -118.12109375, -114.6796875, -111.23828125, -107.796875, -104.35546875, -100.9140625, -97.47265625, -94.03125, -90.58984375, -87.1484375, -83.70703125, -80.265625, -76.82421875, -73.3828125, -69.94140625, -66.5, -63.05859375, -59.6171875, -56.17578125, -52.734375, -49.29296875, -45.8515625, -42.41015625, -38.96875, -35.52734375, -32.0859375, -28.64453125, -25.203125, -21.76171875, -18.3203125, -14.87890625, -11.4375, -7.99609375, -4.5546875, -1.11328125, 2.328125, 5.76953125, 9.2109375, 12.65234375, 16.09375, 19.53515625, 22.9765625, 26.41796875, 29.859375, 33.30078125, 36.7421875, 40.18359375, 43.625, 47.06640625, 50.5078125, 53.94921875, 57.390625, 60.83203125, 64.2734375, 67.71484375, 71.15625, 74.59765625, 78.0390625, 81.48046875, 84.921875, 88.36328125, 91.8046875, 95.24609375, 98.6875]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 4.0, 6.0, 11.0, 8.0, 13.0, 26.0, 26.0, 32.0, 48.0, 67.0, 72.0, 79.0, 81.0, 85.0, 66.0, 63.0, 67.0, 58.0, 51.0, 46.0, 32.0, 29.0, 11.0, 16.0, 9.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.68359375, -7.27130126953125, -6.8590087890625, -6.44671630859375, -6.034423828125, -5.62213134765625, -5.2098388671875, -4.79754638671875, -4.38525390625, -3.97296142578125, -3.5606689453125, -3.14837646484375, -2.736083984375, -2.32379150390625, -1.9114990234375, -1.49920654296875, -1.0869140625, -0.67462158203125, -0.2623291015625, 0.14996337890625, 0.562255859375, 0.97454833984375, 1.3868408203125, 1.79913330078125, 2.21142578125, 2.62371826171875, 3.0360107421875, 3.44830322265625, 3.860595703125, 4.27288818359375, 4.6851806640625, 5.09747314453125, 5.509765625, 5.92205810546875, 6.3343505859375, 6.74664306640625, 7.158935546875, 7.57122802734375, 7.9835205078125, 8.39581298828125, 8.80810546875, 9.22039794921875, 9.6326904296875, 10.04498291015625, 10.457275390625, 10.86956787109375, 11.2818603515625, 11.69415283203125, 12.1064453125, 12.51873779296875, 12.9310302734375, 13.34332275390625, 13.755615234375, 14.16790771484375, 14.5802001953125, 14.99249267578125, 15.40478515625, 15.81707763671875, 16.2293701171875, 16.64166259765625, 17.053955078125, 17.46624755859375, 17.8785400390625, 18.29083251953125, 18.703125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 3.0, 4.0, 1.0, 5.0, 3.0, 4.0, 5.0, 5.0, 11.0, 11.0, 12.0, 18.0, 39.0, 46.0, 67.0, 95.0, 103.0, 166.0, 252.0, 377.0, 580.0, 882.0, 1614.0, 2993.0, 5712.0, 12036.0, 26290.0, 59291.0, 129565.0, 259868.0, 279344.0, 145121.0, 66163.0, 29643.0, 13681.0, 6557.0, 3381.0, 1733.0, 956.0, 632.0, 405.0, 273.0, 164.0, 105.0, 97.0, 76.0, 49.0, 39.0, 30.0, 19.0, 13.0, 9.0, 9.0, 9.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-46.90625, -45.52978515625, -44.1533203125, -42.77685546875, -41.400390625, -40.02392578125, -38.6474609375, -37.27099609375, -35.89453125, -34.51806640625, -33.1416015625, -31.76513671875, -30.388671875, -29.01220703125, -27.6357421875, -26.25927734375, -24.8828125, -23.50634765625, -22.1298828125, -20.75341796875, -19.376953125, -18.00048828125, -16.6240234375, -15.24755859375, -13.87109375, -12.49462890625, -11.1181640625, -9.74169921875, -8.365234375, -6.98876953125, -5.6123046875, -4.23583984375, -2.859375, -1.48291015625, -0.1064453125, 1.27001953125, 2.646484375, 4.02294921875, 5.3994140625, 6.77587890625, 8.15234375, 9.52880859375, 10.9052734375, 12.28173828125, 13.658203125, 15.03466796875, 16.4111328125, 17.78759765625, 19.1640625, 20.54052734375, 21.9169921875, 23.29345703125, 24.669921875, 26.04638671875, 27.4228515625, 28.79931640625, 30.17578125, 31.55224609375, 32.9287109375, 34.30517578125, 35.681640625, 37.05810546875, 38.4345703125, 39.81103515625, 41.1875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 2.0, 2.0, 2.0, 5.0, 4.0, 6.0, 5.0, 9.0, 7.0, 14.0, 14.0, 16.0, 15.0, 25.0, 20.0, 22.0, 26.0, 32.0, 35.0, 42.0, 32.0, 39.0, 44.0, 38.0, 38.0, 51.0, 45.0, 42.0, 56.0, 41.0, 34.0, 34.0, 21.0, 31.0, 26.0, 24.0, 20.0, 13.0, 20.0, 9.0, 12.0, 13.0, 5.0, 6.0, 1.0, 4.0, 7.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-34.59375, -33.53076171875, -32.4677734375, -31.40478515625, -30.341796875, -29.27880859375, -28.2158203125, -27.15283203125, -26.08984375, -25.02685546875, -23.9638671875, -22.90087890625, -21.837890625, -20.77490234375, -19.7119140625, -18.64892578125, -17.5859375, -16.52294921875, -15.4599609375, -14.39697265625, -13.333984375, -12.27099609375, -11.2080078125, -10.14501953125, -9.08203125, -8.01904296875, -6.9560546875, -5.89306640625, -4.830078125, -3.76708984375, -2.7041015625, -1.64111328125, -0.578125, 0.48486328125, 1.5478515625, 2.61083984375, 3.673828125, 4.73681640625, 5.7998046875, 6.86279296875, 7.92578125, 8.98876953125, 10.0517578125, 11.11474609375, 12.177734375, 13.24072265625, 14.3037109375, 15.36669921875, 16.4296875, 17.49267578125, 18.5556640625, 19.61865234375, 20.681640625, 21.74462890625, 22.8076171875, 23.87060546875, 24.93359375, 25.99658203125, 27.0595703125, 28.12255859375, 29.185546875, 30.24853515625, 31.3115234375, 32.37451171875, 33.4375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 3.0, 6.0, 2.0, 7.0, 13.0, 15.0, 12.0, 30.0, 37.0, 56.0, 83.0, 161.0, 272.0, 499.0, 1035.0, 2188.0, 5638.0, 18987.0, 93666.0, 576461.0, 290134.0, 41869.0, 10708.0, 3577.0, 1472.0, 659.0, 375.0, 205.0, 135.0, 77.0, 41.0, 31.0, 37.0, 16.0, 10.0, 15.0, 7.0, 4.0, 4.0, 6.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-57.40625, -55.75537109375, -54.1044921875, -52.45361328125, -50.802734375, -49.15185546875, -47.5009765625, -45.85009765625, -44.19921875, -42.54833984375, -40.8974609375, -39.24658203125, -37.595703125, -35.94482421875, -34.2939453125, -32.64306640625, -30.9921875, -29.34130859375, -27.6904296875, -26.03955078125, -24.388671875, -22.73779296875, -21.0869140625, -19.43603515625, -17.78515625, -16.13427734375, -14.4833984375, -12.83251953125, -11.181640625, -9.53076171875, -7.8798828125, -6.22900390625, -4.578125, -2.92724609375, -1.2763671875, 0.37451171875, 2.025390625, 3.67626953125, 5.3271484375, 6.97802734375, 8.62890625, 10.27978515625, 11.9306640625, 13.58154296875, 15.232421875, 16.88330078125, 18.5341796875, 20.18505859375, 21.8359375, 23.48681640625, 25.1376953125, 26.78857421875, 28.439453125, 30.09033203125, 31.7412109375, 33.39208984375, 35.04296875, 36.69384765625, 38.3447265625, 39.99560546875, 41.646484375, 43.29736328125, 44.9482421875, 46.59912109375, 48.25]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 4.0, 5.0, 1.0, 9.0, 11.0, 19.0, 18.0, 23.0, 29.0, 44.0, 44.0, 64.0, 77.0, 87.0, 114.0, 104.0, 64.0, 62.0, 50.0, 35.0, 26.0, 25.0, 14.0, 13.0, 10.0, 13.0, 8.0, 6.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004863739013671875, -0.004704892635345459, -0.004546046257019043, -0.004387199878692627, -0.004228353500366211, -0.004069507122039795, -0.003910660743713379, -0.003751814365386963, -0.003592967987060547, -0.003434121608734131, -0.003275275230407715, -0.003116428852081299, -0.002957582473754883, -0.002798736095428467, -0.0026398897171020508, -0.0024810433387756348, -0.0023221969604492188, -0.0021633505821228027, -0.0020045042037963867, -0.0018456578254699707, -0.0016868114471435547, -0.0015279650688171387, -0.0013691186904907227, -0.0012102723121643066, -0.0010514259338378906, -0.0008925795555114746, -0.0007337331771850586, -0.0005748867988586426, -0.00041604042053222656, -0.00025719404220581055, -9.834766387939453e-05, 6.0498714447021484e-05, 0.0002193450927734375, 0.0003781914710998535, 0.0005370378494262695, 0.0006958842277526855, 0.0008547306060791016, 0.0010135769844055176, 0.0011724233627319336, 0.0013312697410583496, 0.0014901161193847656, 0.0016489624977111816, 0.0018078088760375977, 0.0019666552543640137, 0.0021255016326904297, 0.0022843480110168457, 0.0024431943893432617, 0.0026020407676696777, 0.0027608871459960938, 0.0029197335243225098, 0.0030785799026489258, 0.003237426280975342, 0.003396272659301758, 0.003555119037628174, 0.00371396541595459, 0.003872811794281006, 0.004031658172607422, 0.004190504550933838, 0.004349350929260254, 0.00450819730758667, 0.004667043685913086, 0.004825890064239502, 0.004984736442565918, 0.005143582820892334, 0.00530242919921875]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 1.0, 12.0, 7.0, 12.0, 17.0, 13.0, 30.0, 64.0, 99.0, 163.0, 248.0, 491.0, 876.0, 1816.0, 4182.0, 12111.0, 50530.0, 389188.0, 499534.0, 65242.0, 14674.0, 4840.0, 2145.0, 1041.0, 504.0, 291.0, 136.0, 108.0, 55.0, 36.0, 32.0, 25.0, 14.0, 6.0, 4.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-59.09375, -57.359375, -55.625, -53.890625, -52.15625, -50.421875, -48.6875, -46.953125, -45.21875, -43.484375, -41.75, -40.015625, -38.28125, -36.546875, -34.8125, -33.078125, -31.34375, -29.609375, -27.875, -26.140625, -24.40625, -22.671875, -20.9375, -19.203125, -17.46875, -15.734375, -14.0, -12.265625, -10.53125, -8.796875, -7.0625, -5.328125, -3.59375, -1.859375, -0.125, 1.609375, 3.34375, 5.078125, 6.8125, 8.546875, 10.28125, 12.015625, 13.75, 15.484375, 17.21875, 18.953125, 20.6875, 22.421875, 24.15625, 25.890625, 27.625, 29.359375, 31.09375, 32.828125, 34.5625, 36.296875, 38.03125, 39.765625, 41.5, 43.234375, 44.96875, 46.703125, 48.4375, 50.171875, 51.90625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 4.0, 7.0, 7.0, 10.0, 14.0, 16.0, 28.0, 34.0, 36.0, 59.0, 70.0, 78.0, 88.0, 100.0, 90.0, 74.0, 67.0, 49.0, 48.0, 30.0, 27.0, 15.0, 15.0, 11.0, 11.0, 3.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-36.125, -35.253662109375, -34.38232421875, -33.510986328125, -32.6396484375, -31.768310546875, -30.89697265625, -30.025634765625, -29.154296875, -28.282958984375, -27.41162109375, -26.540283203125, -25.6689453125, -24.797607421875, -23.92626953125, -23.054931640625, -22.18359375, -21.312255859375, -20.44091796875, -19.569580078125, -18.6982421875, -17.826904296875, -16.95556640625, -16.084228515625, -15.212890625, -14.341552734375, -13.47021484375, -12.598876953125, -11.7275390625, -10.856201171875, -9.98486328125, -9.113525390625, -8.2421875, -7.370849609375, -6.49951171875, -5.628173828125, -4.7568359375, -3.885498046875, -3.01416015625, -2.142822265625, -1.271484375, -0.400146484375, 0.47119140625, 1.342529296875, 2.2138671875, 3.085205078125, 3.95654296875, 4.827880859375, 5.69921875, 6.570556640625, 7.44189453125, 8.313232421875, 9.1845703125, 10.055908203125, 10.92724609375, 11.798583984375, 12.669921875, 13.541259765625, 14.41259765625, 15.283935546875, 16.1552734375, 17.026611328125, 17.89794921875, 18.769287109375, 19.640625]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 2.0, 10.0, 17.0, 26.0, 52.0, 66.0, 119.0, 162.0, 180.0, 138.0, 95.0, 48.0, 39.0, 19.0, 10.0, 5.0, 5.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-852.5416259765625, -833.6793823242188, -814.817138671875, -795.9548950195312, -777.0926513671875, -758.2303466796875, -739.3681030273438, -720.505859375, -701.6436157226562, -682.7813720703125, -663.9191284179688, -645.056884765625, -626.194580078125, -607.3323364257812, -588.4700927734375, -569.6078491210938, -550.74560546875, -531.8833618164062, -513.0211181640625, -494.1588439941406, -475.2966003417969, -456.4343566894531, -437.57208251953125, -418.7098388671875, -399.84759521484375, -380.9853515625, -362.12310791015625, -343.2608337402344, -324.3985900878906, -305.5363464355469, -286.674072265625, -267.81182861328125, -248.94955444335938, -230.08731079101562, -211.2250518798828, -192.36279296875, -173.50054931640625, -154.6383056640625, -135.7760467529297, -116.91378784179688, -98.05154418945312, -79.18929290771484, -60.32704162597656, -41.46479034423828, -22.6025390625, -3.7402877807617188, 15.121963500976562, 33.984222412109375, 52.846466064453125, 71.7087173461914, 90.57096862792969, 109.43321990966797, 128.29547119140625, 147.15771484375, 166.0199737548828, 184.88223266601562, 203.74447631835938, 222.60671997070312, 241.46897888183594, 260.33123779296875, 279.1934814453125, 298.05572509765625, 316.91796875, 335.7802429199219, 354.6424865722656]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 10.0, 5.0, 6.0, 7.0, 14.0, 9.0, 8.0, 11.0, 21.0, 11.0, 21.0, 26.0, 22.0, 34.0, 32.0, 33.0, 40.0, 34.0, 52.0, 44.0, 52.0, 42.0, 44.0, 38.0, 39.0, 47.0, 30.0, 37.0, 17.0, 34.0, 22.0, 22.0, 18.0, 18.0, 20.0, 8.0, 13.0, 11.0, 8.0, 6.0, 8.0, 8.0, 7.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-191.688232421875, -185.8914031982422, -180.09458923339844, -174.29776000976562, -168.5009307861328, -162.7041015625, -156.90728759765625, -151.11045837402344, -145.31362915039062, -139.5167999267578, -133.71998596191406, -127.92315673828125, -122.12632751464844, -116.32950592041016, -110.53268432617188, -104.73585510253906, -98.93904113769531, -93.14221954345703, -87.34539031982422, -81.54856872558594, -75.75173950195312, -69.95491790771484, -64.15809631347656, -58.361270904541016, -52.56444549560547, -46.76762008666992, -40.970794677734375, -35.173973083496094, -29.377147674560547, -23.580322265625, -17.78350067138672, -11.986675262451172, -6.1898345947265625, -0.39301013946533203, 5.403814315795898, 11.200637817382812, 16.99746322631836, 22.794288635253906, 28.591110229492188, 34.387935638427734, 40.18476104736328, 45.98158645629883, 51.778411865234375, 57.575233459472656, 63.3720588684082, 69.16888427734375, 74.96570587158203, 80.76252746582031, 86.55935668945312, 92.3561782836914, 98.15300750732422, 103.9498291015625, 109.74665832519531, 115.5434799194336, 121.34030151367188, 127.13713073730469, 132.9339599609375, 138.7307891845703, 144.52760314941406, 150.32443237304688, 156.1212615966797, 161.9180908203125, 167.71490478515625, 173.51173400878906, 179.3085479736328]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 6.0, 12.0, 14.0, 21.0, 35.0, 63.0, 98.0, 161.0, 321.0, 573.0, 1355.0, 3469.0, 11218.0, 50221.0, 3011631.0, 1054122.0, 44816.0, 10219.0, 3312.0, 1328.0, 568.0, 305.0, 162.0, 79.0, 51.0, 42.0, 27.0, 11.0, 10.0, 7.0, 5.0, 5.0, 6.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-107.875, -103.875, -99.875, -95.875, -91.875, -87.875, -83.875, -79.875, -75.875, -71.875, -67.875, -63.875, -59.875, -55.875, -51.875, -47.875, -43.875, -39.875, -35.875, -31.875, -27.875, -23.875, -19.875, -15.875, -11.875, -7.875, -3.875, 0.125, 4.125, 8.125, 12.125, 16.125, 20.125, 24.125, 28.125, 32.125, 36.125, 40.125, 44.125, 48.125, 52.125, 56.125, 60.125, 64.125, 68.125, 72.125, 76.125, 80.125, 84.125, 88.125, 92.125, 96.125, 100.125, 104.125, 108.125, 112.125, 116.125, 120.125, 124.125, 128.125, 132.125, 136.125, 140.125, 144.125, 148.125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 4.0, 4.0, 4.0, 8.0, 7.0, 15.0, 17.0, 31.0, 41.0, 42.0, 51.0, 61.0, 86.0, 65.0, 80.0, 75.0, 72.0, 67.0, 58.0, 63.0, 54.0, 33.0, 19.0, 18.0, 16.0, 8.0, 6.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.765625, -7.354736328125, -6.94384765625, -6.532958984375, -6.1220703125, -5.711181640625, -5.30029296875, -4.889404296875, -4.478515625, -4.067626953125, -3.65673828125, -3.245849609375, -2.8349609375, -2.424072265625, -2.01318359375, -1.602294921875, -1.19140625, -0.780517578125, -0.36962890625, 0.041259765625, 0.4521484375, 0.863037109375, 1.27392578125, 1.684814453125, 2.095703125, 2.506591796875, 2.91748046875, 3.328369140625, 3.7392578125, 4.150146484375, 4.56103515625, 4.971923828125, 5.3828125, 5.793701171875, 6.20458984375, 6.615478515625, 7.0263671875, 7.437255859375, 7.84814453125, 8.259033203125, 8.669921875, 9.080810546875, 9.49169921875, 9.902587890625, 10.3134765625, 10.724365234375, 11.13525390625, 11.546142578125, 11.95703125, 12.367919921875, 12.77880859375, 13.189697265625, 13.6005859375, 14.011474609375, 14.42236328125, 14.833251953125, 15.244140625, 15.655029296875, 16.06591796875, 16.476806640625, 16.8876953125, 17.298583984375, 17.70947265625, 18.120361328125, 18.53125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 6.0, 11.0, 11.0, 23.0, 15.0, 29.0, 39.0, 52.0, 92.0, 161.0, 273.0, 491.0, 1117.0, 3037.0, 9789.0, 41161.0, 274191.0, 3628035.0, 190397.0, 32450.0, 8272.0, 2554.0, 984.0, 448.0, 209.0, 131.0, 87.0, 69.0, 49.0, 31.0, 28.0, 16.0, 11.0, 6.0, 6.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-123.375, -120.1640625, -116.953125, -113.7421875, -110.53125, -107.3203125, -104.109375, -100.8984375, -97.6875, -94.4765625, -91.265625, -88.0546875, -84.84375, -81.6328125, -78.421875, -75.2109375, -72.0, -68.7890625, -65.578125, -62.3671875, -59.15625, -55.9453125, -52.734375, -49.5234375, -46.3125, -43.1015625, -39.890625, -36.6796875, -33.46875, -30.2578125, -27.046875, -23.8359375, -20.625, -17.4140625, -14.203125, -10.9921875, -7.78125, -4.5703125, -1.359375, 1.8515625, 5.0625, 8.2734375, 11.484375, 14.6953125, 17.90625, 21.1171875, 24.328125, 27.5390625, 30.75, 33.9609375, 37.171875, 40.3828125, 43.59375, 46.8046875, 50.015625, 53.2265625, 56.4375, 59.6484375, 62.859375, 66.0703125, 69.28125, 72.4921875, 75.703125, 78.9140625, 82.125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 3.0, 5.0, 4.0, 9.0, 21.0, 30.0, 46.0, 54.0, 83.0, 180.0, 348.0, 1923.0, 770.0, 229.0, 125.0, 78.0, 63.0, 38.0, 21.0, 20.0, 9.0, 8.0, 8.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.6875, -29.58349609375, -28.4794921875, -27.37548828125, -26.271484375, -25.16748046875, -24.0634765625, -22.95947265625, -21.85546875, -20.75146484375, -19.6474609375, -18.54345703125, -17.439453125, -16.33544921875, -15.2314453125, -14.12744140625, -13.0234375, -11.91943359375, -10.8154296875, -9.71142578125, -8.607421875, -7.50341796875, -6.3994140625, -5.29541015625, -4.19140625, -3.08740234375, -1.9833984375, -0.87939453125, 0.224609375, 1.32861328125, 2.4326171875, 3.53662109375, 4.640625, 5.74462890625, 6.8486328125, 7.95263671875, 9.056640625, 10.16064453125, 11.2646484375, 12.36865234375, 13.47265625, 14.57666015625, 15.6806640625, 16.78466796875, 17.888671875, 18.99267578125, 20.0966796875, 21.20068359375, 22.3046875, 23.40869140625, 24.5126953125, 25.61669921875, 26.720703125, 27.82470703125, 28.9287109375, 30.03271484375, 31.13671875, 32.24072265625, 33.3447265625, 34.44873046875, 35.552734375, 36.65673828125, 37.7607421875, 38.86474609375, 39.96875]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 6.0, 11.0, 48.0, 66.0, 163.0, 248.0, 218.0, 131.0, 67.0, 26.0, 12.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-573.6349487304688, -562.0990600585938, -550.5631713867188, -539.02734375, -527.491455078125, -515.95556640625, -504.419677734375, -492.8837890625, -481.347900390625, -469.81201171875, -458.2761535644531, -446.7402648925781, -435.2043762207031, -423.66851806640625, -412.13262939453125, -400.59674072265625, -389.0608825683594, -377.5249938964844, -365.9891357421875, -354.4532470703125, -342.9173583984375, -331.3814697265625, -319.8456115722656, -308.3097229003906, -296.77386474609375, -285.23797607421875, -273.7021179199219, -262.1662292480469, -250.63034057617188, -239.09446716308594, -227.55859375, -216.022705078125, -204.48684692382812, -192.9509735107422, -181.4150848388672, -169.87921142578125, -158.34332275390625, -146.8074493408203, -135.27157592773438, -123.7356948852539, -112.19981384277344, -100.66393280029297, -89.1280517578125, -77.59217834472656, -66.0562973022461, -54.520416259765625, -42.98454284667969, -31.44866180419922, -19.91278076171875, -8.376901626586914, 3.158977508544922, 14.694854736328125, 26.230735778808594, 37.76661682128906, 49.302490234375, 60.83837127685547, 72.37425231933594, 83.9101333618164, 95.44601440429688, 106.98188781738281, 118.51776885986328, 130.05364990234375, 141.5895233154297, 153.12539672851562, 164.66128540039062]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 1.0, 0.0, 6.0, 11.0, 2.0, 9.0, 17.0, 14.0, 12.0, 19.0, 17.0, 24.0, 36.0, 31.0, 29.0, 25.0, 34.0, 54.0, 40.0, 51.0, 43.0, 37.0, 43.0, 43.0, 47.0, 37.0, 49.0, 31.0, 39.0, 36.0, 28.0, 25.0, 18.0, 22.0, 15.0, 15.0, 13.0, 7.0, 4.0, 4.0, 9.0, 3.0, 0.0, 2.0, 1.0, 2.0, 4.0], "bins": [-111.92119598388672, -109.01945495605469, -106.11770629882812, -103.2159652709961, -100.31421661376953, -97.4124755859375, -94.51072692871094, -91.6089859008789, -88.70724487304688, -85.80550384521484, -82.90375518798828, -80.00201416015625, -77.10026550292969, -74.19852447509766, -71.29678344726562, -68.39503479003906, -65.4932861328125, -62.5915412902832, -59.689796447753906, -56.788055419921875, -53.88630676269531, -50.98456573486328, -48.082820892333984, -45.18107604980469, -42.27933120727539, -39.377586364746094, -36.4758415222168, -33.5740966796875, -30.672353744506836, -27.77060890197754, -24.868865966796875, -21.967121124267578, -19.06536865234375, -16.163623809814453, -13.261879920959473, -10.360136032104492, -7.458391189575195, -4.556646347045898, -1.6549034118652344, 1.2468414306640625, 4.148586273193359, 7.050330638885498, 9.952075004577637, 12.853818893432617, 15.755563735961914, 18.65730857849121, 21.559051513671875, 24.460796356201172, 27.36254119873047, 30.264286041259766, 33.16603088378906, 36.067771911621094, 38.969520568847656, 41.87126159667969, 44.773006439208984, 47.67475128173828, 50.57649612426758, 53.478240966796875, 56.37998580932617, 59.28173065185547, 62.1834716796875, 65.08522033691406, 67.9869613647461, 70.88870239257812, 73.79045104980469]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 1.0, 5.0, 8.0, 8.0, 13.0, 25.0, 25.0, 32.0, 56.0, 78.0, 121.0, 243.0, 388.0, 711.0, 1493.0, 3930.0, 11747.0, 43529.0, 191536.0, 528183.0, 201210.0, 45533.0, 12292.0, 4079.0, 1618.0, 706.0, 372.0, 209.0, 137.0, 63.0, 47.0, 44.0, 36.0, 16.0, 17.0, 21.0, 3.0, 6.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0], "bins": [-125.0, -121.48046875, -117.9609375, -114.44140625, -110.921875, -107.40234375, -103.8828125, -100.36328125, -96.84375, -93.32421875, -89.8046875, -86.28515625, -82.765625, -79.24609375, -75.7265625, -72.20703125, -68.6875, -65.16796875, -61.6484375, -58.12890625, -54.609375, -51.08984375, -47.5703125, -44.05078125, -40.53125, -37.01171875, -33.4921875, -29.97265625, -26.453125, -22.93359375, -19.4140625, -15.89453125, -12.375, -8.85546875, -5.3359375, -1.81640625, 1.703125, 5.22265625, 8.7421875, 12.26171875, 15.78125, 19.30078125, 22.8203125, 26.33984375, 29.859375, 33.37890625, 36.8984375, 40.41796875, 43.9375, 47.45703125, 50.9765625, 54.49609375, 58.015625, 61.53515625, 65.0546875, 68.57421875, 72.09375, 75.61328125, 79.1328125, 82.65234375, 86.171875, 89.69140625, 93.2109375, 96.73046875, 100.25]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 0.0, 4.0, 7.0, 10.0, 12.0, 22.0, 25.0, 27.0, 34.0, 41.0, 71.0, 53.0, 65.0, 82.0, 76.0, 75.0, 61.0, 66.0, 54.0, 50.0, 42.0, 49.0, 23.0, 19.0, 16.0, 8.0, 3.0, 5.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.5546875, -8.1405029296875, -7.726318359375, -7.3121337890625, -6.89794921875, -6.4837646484375, -6.069580078125, -5.6553955078125, -5.2412109375, -4.8270263671875, -4.412841796875, -3.9986572265625, -3.58447265625, -3.1702880859375, -2.756103515625, -2.3419189453125, -1.927734375, -1.5135498046875, -1.099365234375, -0.6851806640625, -0.27099609375, 0.1431884765625, 0.557373046875, 0.9715576171875, 1.3857421875, 1.7999267578125, 2.214111328125, 2.6282958984375, 3.04248046875, 3.4566650390625, 3.870849609375, 4.2850341796875, 4.69921875, 5.1134033203125, 5.527587890625, 5.9417724609375, 6.35595703125, 6.7701416015625, 7.184326171875, 7.5985107421875, 8.0126953125, 8.4268798828125, 8.841064453125, 9.2552490234375, 9.66943359375, 10.0836181640625, 10.497802734375, 10.9119873046875, 11.326171875, 11.7403564453125, 12.154541015625, 12.5687255859375, 12.98291015625, 13.3970947265625, 13.811279296875, 14.2254638671875, 14.6396484375, 15.0538330078125, 15.468017578125, 15.8822021484375, 16.29638671875, 16.7105712890625, 17.124755859375, 17.5389404296875, 17.953125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 8.0, 10.0, 18.0, 28.0, 26.0, 44.0, 53.0, 84.0, 129.0, 157.0, 255.0, 367.0, 595.0, 944.0, 1727.0, 3651.0, 9080.0, 24768.0, 73988.0, 219080.0, 400606.0, 204186.0, 69262.0, 23192.0, 8549.0, 3462.0, 1695.0, 901.0, 529.0, 387.0, 205.0, 188.0, 117.0, 75.0, 65.0, 32.0, 29.0, 19.0, 20.0, 10.0, 7.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-58.375, -56.458984375, -54.54296875, -52.626953125, -50.7109375, -48.794921875, -46.87890625, -44.962890625, -43.046875, -41.130859375, -39.21484375, -37.298828125, -35.3828125, -33.466796875, -31.55078125, -29.634765625, -27.71875, -25.802734375, -23.88671875, -21.970703125, -20.0546875, -18.138671875, -16.22265625, -14.306640625, -12.390625, -10.474609375, -8.55859375, -6.642578125, -4.7265625, -2.810546875, -0.89453125, 1.021484375, 2.9375, 4.853515625, 6.76953125, 8.685546875, 10.6015625, 12.517578125, 14.43359375, 16.349609375, 18.265625, 20.181640625, 22.09765625, 24.013671875, 25.9296875, 27.845703125, 29.76171875, 31.677734375, 33.59375, 35.509765625, 37.42578125, 39.341796875, 41.2578125, 43.173828125, 45.08984375, 47.005859375, 48.921875, 50.837890625, 52.75390625, 54.669921875, 56.5859375, 58.501953125, 60.41796875, 62.333984375, 64.25]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 5.0, 7.0, 6.0, 10.0, 9.0, 6.0, 11.0, 16.0, 14.0, 28.0, 36.0, 28.0, 28.0, 33.0, 49.0, 39.0, 36.0, 47.0, 44.0, 33.0, 46.0, 42.0, 50.0, 39.0, 45.0, 35.0, 41.0, 33.0, 29.0, 23.0, 22.0, 24.0, 13.0, 13.0, 14.0, 11.0, 15.0, 10.0, 6.0, 3.0, 3.0, 4.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-44.0, -42.75439453125, -41.5087890625, -40.26318359375, -39.017578125, -37.77197265625, -36.5263671875, -35.28076171875, -34.03515625, -32.78955078125, -31.5439453125, -30.29833984375, -29.052734375, -27.80712890625, -26.5615234375, -25.31591796875, -24.0703125, -22.82470703125, -21.5791015625, -20.33349609375, -19.087890625, -17.84228515625, -16.5966796875, -15.35107421875, -14.10546875, -12.85986328125, -11.6142578125, -10.36865234375, -9.123046875, -7.87744140625, -6.6318359375, -5.38623046875, -4.140625, -2.89501953125, -1.6494140625, -0.40380859375, 0.841796875, 2.08740234375, 3.3330078125, 4.57861328125, 5.82421875, 7.06982421875, 8.3154296875, 9.56103515625, 10.806640625, 12.05224609375, 13.2978515625, 14.54345703125, 15.7890625, 17.03466796875, 18.2802734375, 19.52587890625, 20.771484375, 22.01708984375, 23.2626953125, 24.50830078125, 25.75390625, 26.99951171875, 28.2451171875, 29.49072265625, 30.736328125, 31.98193359375, 33.2275390625, 34.47314453125, 35.71875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 7.0, 7.0, 17.0, 23.0, 37.0, 84.0, 108.0, 232.0, 562.0, 1761.0, 8786.0, 132084.0, 847427.0, 50199.0, 5081.0, 1297.0, 420.0, 195.0, 98.0, 46.0, 26.0, 20.0, 13.0, 9.0, 9.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-102.4375, -99.271484375, -96.10546875, -92.939453125, -89.7734375, -86.607421875, -83.44140625, -80.275390625, -77.109375, -73.943359375, -70.77734375, -67.611328125, -64.4453125, -61.279296875, -58.11328125, -54.947265625, -51.78125, -48.615234375, -45.44921875, -42.283203125, -39.1171875, -35.951171875, -32.78515625, -29.619140625, -26.453125, -23.287109375, -20.12109375, -16.955078125, -13.7890625, -10.623046875, -7.45703125, -4.291015625, -1.125, 2.041015625, 5.20703125, 8.373046875, 11.5390625, 14.705078125, 17.87109375, 21.037109375, 24.203125, 27.369140625, 30.53515625, 33.701171875, 36.8671875, 40.033203125, 43.19921875, 46.365234375, 49.53125, 52.697265625, 55.86328125, 59.029296875, 62.1953125, 65.361328125, 68.52734375, 71.693359375, 74.859375, 78.025390625, 81.19140625, 84.357421875, 87.5234375, 90.689453125, 93.85546875, 97.021484375, 100.1875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 1.0, 9.0, 15.0, 35.0, 106.0, 234.0, 323.0, 169.0, 67.0, 24.0, 11.0, 7.0, 7.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01175689697265625, -0.0111464262008667, -0.010535955429077148, -0.009925484657287598, -0.009315013885498047, -0.008704543113708496, -0.008094072341918945, -0.0074836015701293945, -0.006873130798339844, -0.006262660026550293, -0.005652189254760742, -0.005041718482971191, -0.004431247711181641, -0.00382077693939209, -0.003210306167602539, -0.0025998353958129883, -0.0019893646240234375, -0.0013788938522338867, -0.0007684230804443359, -0.00015795230865478516, 0.0004525184631347656, 0.0010629892349243164, 0.0016734600067138672, 0.002283930778503418, 0.0028944015502929688, 0.0035048723220825195, 0.00411534309387207, 0.004725813865661621, 0.005336284637451172, 0.005946755409240723, 0.0065572261810302734, 0.007167696952819824, 0.007778167724609375, 0.008388638496398926, 0.008999109268188477, 0.009609580039978027, 0.010220050811767578, 0.010830521583557129, 0.01144099235534668, 0.01205146312713623, 0.012661933898925781, 0.013272404670715332, 0.013882875442504883, 0.014493346214294434, 0.015103816986083984, 0.015714287757873535, 0.016324758529663086, 0.016935229301452637, 0.017545700073242188, 0.01815617084503174, 0.01876664161682129, 0.01937711238861084, 0.01998758316040039, 0.02059805393218994, 0.021208524703979492, 0.021818995475769043, 0.022429466247558594, 0.023039937019348145, 0.023650407791137695, 0.024260878562927246, 0.024871349334716797, 0.025481820106506348, 0.0260922908782959, 0.02670276165008545, 0.027313232421875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 5.0, 10.0, 11.0, 13.0, 21.0, 39.0, 61.0, 75.0, 162.0, 248.0, 547.0, 1479.0, 5694.0, 63727.0, 919690.0, 49141.0, 5167.0, 1346.0, 469.0, 265.0, 138.0, 80.0, 50.0, 45.0, 24.0, 15.0, 10.0, 6.0, 5.0, 5.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-119.1875, -115.3994140625, -111.611328125, -107.8232421875, -104.03515625, -100.2470703125, -96.458984375, -92.6708984375, -88.8828125, -85.0947265625, -81.306640625, -77.5185546875, -73.73046875, -69.9423828125, -66.154296875, -62.3662109375, -58.578125, -54.7900390625, -51.001953125, -47.2138671875, -43.42578125, -39.6376953125, -35.849609375, -32.0615234375, -28.2734375, -24.4853515625, -20.697265625, -16.9091796875, -13.12109375, -9.3330078125, -5.544921875, -1.7568359375, 2.03125, 5.8193359375, 9.607421875, 13.3955078125, 17.18359375, 20.9716796875, 24.759765625, 28.5478515625, 32.3359375, 36.1240234375, 39.912109375, 43.7001953125, 47.48828125, 51.2763671875, 55.064453125, 58.8525390625, 62.640625, 66.4287109375, 70.216796875, 74.0048828125, 77.79296875, 81.5810546875, 85.369140625, 89.1572265625, 92.9453125, 96.7333984375, 100.521484375, 104.3095703125, 108.09765625, 111.8857421875, 115.673828125, 119.4619140625, 123.25]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 6.0, 6.0, 14.0, 27.0, 51.0, 82.0, 200.0, 242.0, 179.0, 98.0, 52.0, 19.0, 10.0, 5.0, 1.0, 6.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.0625, -63.7373046875, -61.412109375, -59.0869140625, -56.76171875, -54.4365234375, -52.111328125, -49.7861328125, -47.4609375, -45.1357421875, -42.810546875, -40.4853515625, -38.16015625, -35.8349609375, -33.509765625, -31.1845703125, -28.859375, -26.5341796875, -24.208984375, -21.8837890625, -19.55859375, -17.2333984375, -14.908203125, -12.5830078125, -10.2578125, -7.9326171875, -5.607421875, -3.2822265625, -0.95703125, 1.3681640625, 3.693359375, 6.0185546875, 8.34375, 10.6689453125, 12.994140625, 15.3193359375, 17.64453125, 19.9697265625, 22.294921875, 24.6201171875, 26.9453125, 29.2705078125, 31.595703125, 33.9208984375, 36.24609375, 38.5712890625, 40.896484375, 43.2216796875, 45.546875, 47.8720703125, 50.197265625, 52.5224609375, 54.84765625, 57.1728515625, 59.498046875, 61.8232421875, 64.1484375, 66.4736328125, 68.798828125, 71.1240234375, 73.44921875, 75.7744140625, 78.099609375, 80.4248046875, 82.75]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 8.0, 9.0, 17.0, 15.0, 28.0, 34.0, 50.0, 79.0, 86.0, 76.0, 102.0, 96.0, 89.0, 78.0, 53.0, 44.0, 39.0, 25.0, 22.0, 8.0, 14.0, 10.0, 3.0, 5.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-291.9845275878906, -280.6142272949219, -269.24395751953125, -257.8736572265625, -246.5033721923828, -235.13308715820312, -223.76278686523438, -212.3925018310547, -201.022216796875, -189.6519317626953, -178.28164672851562, -166.91134643554688, -155.5410614013672, -144.1707763671875, -132.80047607421875, -121.43019104003906, -110.05990600585938, -98.68962097167969, -87.31932830810547, -75.94903564453125, -64.57875061035156, -53.20846176147461, -41.838172912597656, -30.467880249023438, -19.09759521484375, -7.727306365966797, 3.6429824829101562, 15.01327133178711, 26.383560180664062, 37.753849029541016, 49.12413787841797, 60.49443054199219, 71.86471557617188, 83.23500061035156, 94.60529327392578, 105.9755859375, 117.34587097167969, 128.71615600585938, 140.08645629882812, 151.4567413330078, 162.8270263671875, 174.1973114013672, 185.56759643554688, 196.93789672851562, 208.3081817626953, 219.678466796875, 231.04876708984375, 242.41905212402344, 253.78933715820312, 265.1596374511719, 276.5299072265625, 287.90020751953125, 299.2705078125, 310.6407775878906, 322.0110778808594, 333.38134765625, 344.75164794921875, 356.1219482421875, 367.4922180175781, 378.8625183105469, 390.2327880859375, 401.60308837890625, 412.973388671875, 424.34368896484375, 435.7139587402344]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 1.0, 2.0, 3.0, 5.0, 6.0, 12.0, 10.0, 14.0, 16.0, 14.0, 30.0, 23.0, 19.0, 31.0, 31.0, 28.0, 46.0, 34.0, 34.0, 40.0, 36.0, 42.0, 38.0, 39.0, 43.0, 39.0, 42.0, 38.0, 31.0, 37.0, 31.0, 21.0, 19.0, 17.0, 17.0, 25.0, 14.0, 16.0, 10.0, 8.0, 7.0, 12.0, 5.0, 6.0, 3.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0], "bins": [-239.72491455078125, -232.7813262939453, -225.83773803710938, -218.89414978027344, -211.9505615234375, -205.00697326660156, -198.06338500976562, -191.11978149414062, -184.17620849609375, -177.2326202392578, -170.28903198242188, -163.34544372558594, -156.40185546875, -149.45826721191406, -142.51467895507812, -135.57107543945312, -128.6274871826172, -121.68389892578125, -114.74031066894531, -107.79672241210938, -100.85313415527344, -93.9095458984375, -86.96595001220703, -80.0223617553711, -73.07877349853516, -66.13518524169922, -59.19159698486328, -52.24800491333008, -45.30441665649414, -38.3608283996582, -31.417236328125, -24.473648071289062, -17.530044555664062, -10.586455345153809, -3.6428661346435547, 3.3007240295410156, 10.244312286376953, 17.18790054321289, 24.131492614746094, 31.07508087158203, 38.01866912841797, 44.962257385253906, 51.905845642089844, 58.84943771362305, 65.79302978515625, 72.73661804199219, 79.68020629882812, 86.62379455566406, 93.5673828125, 100.51097106933594, 107.45455932617188, 114.39814758300781, 121.34173583984375, 128.2853240966797, 135.22891235351562, 142.17251586914062, 149.1160888671875, 156.05967712402344, 163.00326538085938, 169.9468536376953, 176.89044189453125, 183.8340301513672, 190.77761840820312, 197.72122192382812, 204.66481018066406]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 5.0, 1.0, 11.0, 11.0, 15.0, 14.0, 40.0, 42.0, 57.0, 109.0, 168.0, 344.0, 602.0, 1319.0, 2962.0, 7618.0, 24315.0, 107657.0, 3398732.0, 563621.0, 61078.0, 15813.0, 5377.0, 2177.0, 974.0, 506.0, 265.0, 170.0, 77.0, 55.0, 50.0, 25.0, 18.0, 14.0, 6.0, 6.0, 7.0, 6.0, 2.0, 3.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-99.5625, -96.4345703125, -93.306640625, -90.1787109375, -87.05078125, -83.9228515625, -80.794921875, -77.6669921875, -74.5390625, -71.4111328125, -68.283203125, -65.1552734375, -62.02734375, -58.8994140625, -55.771484375, -52.6435546875, -49.515625, -46.3876953125, -43.259765625, -40.1318359375, -37.00390625, -33.8759765625, -30.748046875, -27.6201171875, -24.4921875, -21.3642578125, -18.236328125, -15.1083984375, -11.98046875, -8.8525390625, -5.724609375, -2.5966796875, 0.53125, 3.6591796875, 6.787109375, 9.9150390625, 13.04296875, 16.1708984375, 19.298828125, 22.4267578125, 25.5546875, 28.6826171875, 31.810546875, 34.9384765625, 38.06640625, 41.1943359375, 44.322265625, 47.4501953125, 50.578125, 53.7060546875, 56.833984375, 59.9619140625, 63.08984375, 66.2177734375, 69.345703125, 72.4736328125, 75.6015625, 78.7294921875, 81.857421875, 84.9853515625, 88.11328125, 91.2412109375, 94.369140625, 97.4970703125, 100.625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 12.0, 7.0, 11.0, 23.0, 24.0, 26.0, 37.0, 49.0, 52.0, 55.0, 71.0, 75.0, 71.0, 67.0, 58.0, 68.0, 44.0, 53.0, 48.0, 34.0, 36.0, 24.0, 19.0, 10.0, 7.0, 6.0, 7.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.80078125, -7.40838623046875, -7.0159912109375, -6.62359619140625, -6.231201171875, -5.83880615234375, -5.4464111328125, -5.05401611328125, -4.66162109375, -4.26922607421875, -3.8768310546875, -3.48443603515625, -3.092041015625, -2.69964599609375, -2.3072509765625, -1.91485595703125, -1.5224609375, -1.13006591796875, -0.7376708984375, -0.34527587890625, 0.047119140625, 0.43951416015625, 0.8319091796875, 1.22430419921875, 1.61669921875, 2.00909423828125, 2.4014892578125, 2.79388427734375, 3.186279296875, 3.57867431640625, 3.9710693359375, 4.36346435546875, 4.755859375, 5.14825439453125, 5.5406494140625, 5.93304443359375, 6.325439453125, 6.71783447265625, 7.1102294921875, 7.50262451171875, 7.89501953125, 8.28741455078125, 8.6798095703125, 9.07220458984375, 9.464599609375, 9.85699462890625, 10.2493896484375, 10.64178466796875, 11.0341796875, 11.42657470703125, 11.8189697265625, 12.21136474609375, 12.603759765625, 12.99615478515625, 13.3885498046875, 13.78094482421875, 14.17333984375, 14.56573486328125, 14.9581298828125, 15.35052490234375, 15.742919921875, 16.13531494140625, 16.5277099609375, 16.92010498046875, 17.3125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 2.0, 3.0, 7.0, 6.0, 6.0, 15.0, 38.0, 54.0, 69.0, 114.0, 192.0, 286.0, 520.0, 903.0, 1766.0, 3362.0, 7600.0, 19516.0, 60099.0, 275154.0, 3272210.0, 431880.0, 78349.0, 24500.0, 9286.0, 4050.0, 1845.0, 1015.0, 555.0, 342.0, 194.0, 120.0, 79.0, 48.0, 28.0, 27.0, 18.0, 7.0, 5.0, 5.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-69.125, -67.0048828125, -64.884765625, -62.7646484375, -60.64453125, -58.5244140625, -56.404296875, -54.2841796875, -52.1640625, -50.0439453125, -47.923828125, -45.8037109375, -43.68359375, -41.5634765625, -39.443359375, -37.3232421875, -35.203125, -33.0830078125, -30.962890625, -28.8427734375, -26.72265625, -24.6025390625, -22.482421875, -20.3623046875, -18.2421875, -16.1220703125, -14.001953125, -11.8818359375, -9.76171875, -7.6416015625, -5.521484375, -3.4013671875, -1.28125, 0.8388671875, 2.958984375, 5.0791015625, 7.19921875, 9.3193359375, 11.439453125, 13.5595703125, 15.6796875, 17.7998046875, 19.919921875, 22.0400390625, 24.16015625, 26.2802734375, 28.400390625, 30.5205078125, 32.640625, 34.7607421875, 36.880859375, 39.0009765625, 41.12109375, 43.2412109375, 45.361328125, 47.4814453125, 49.6015625, 51.7216796875, 53.841796875, 55.9619140625, 58.08203125, 60.2021484375, 62.322265625, 64.4423828125, 66.5625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 9.0, 7.0, 9.0, 10.0, 16.0, 15.0, 22.0, 38.0, 60.0, 97.0, 131.0, 199.0, 438.0, 1505.0, 727.0, 285.0, 153.0, 98.0, 74.0, 41.0, 36.0, 22.0, 24.0, 13.0, 10.0, 9.0, 6.0, 7.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-31.8125, -30.869873046875, -29.92724609375, -28.984619140625, -28.0419921875, -27.099365234375, -26.15673828125, -25.214111328125, -24.271484375, -23.328857421875, -22.38623046875, -21.443603515625, -20.5009765625, -19.558349609375, -18.61572265625, -17.673095703125, -16.73046875, -15.787841796875, -14.84521484375, -13.902587890625, -12.9599609375, -12.017333984375, -11.07470703125, -10.132080078125, -9.189453125, -8.246826171875, -7.30419921875, -6.361572265625, -5.4189453125, -4.476318359375, -3.53369140625, -2.591064453125, -1.6484375, -0.705810546875, 0.23681640625, 1.179443359375, 2.1220703125, 3.064697265625, 4.00732421875, 4.949951171875, 5.892578125, 6.835205078125, 7.77783203125, 8.720458984375, 9.6630859375, 10.605712890625, 11.54833984375, 12.490966796875, 13.43359375, 14.376220703125, 15.31884765625, 16.261474609375, 17.2041015625, 18.146728515625, 19.08935546875, 20.031982421875, 20.974609375, 21.917236328125, 22.85986328125, 23.802490234375, 24.7451171875, 25.687744140625, 26.63037109375, 27.572998046875, 28.515625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 9.0, 20.0, 78.0, 135.0, 229.0, 226.0, 174.0, 74.0, 36.0, 10.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 3.0], "bins": [-684.462890625, -671.3668823242188, -658.2708740234375, -645.1748046875, -632.0787963867188, -618.9827880859375, -605.8867797851562, -592.790771484375, -579.6947021484375, -566.5986938476562, -553.502685546875, -540.4066162109375, -527.3106079101562, -514.214599609375, -501.11859130859375, -488.0225524902344, -474.9265441894531, -461.8305358886719, -448.7344970703125, -435.63848876953125, -422.5424499511719, -409.4464416503906, -396.35040283203125, -383.25439453125, -370.15838623046875, -357.0623779296875, -343.9663391113281, -330.8703308105469, -317.7742919921875, -304.67828369140625, -291.582275390625, -278.4862365722656, -265.39019775390625, -252.29417419433594, -239.19815063476562, -226.10214233398438, -213.006103515625, -199.91009521484375, -186.81407165527344, -173.71804809570312, -160.62203979492188, -147.52601623535156, -134.42999267578125, -121.33397674560547, -108.23795318603516, -95.14192962646484, -82.04591369628906, -68.94989013671875, -55.85386657714844, -42.757843017578125, -29.661823272705078, -16.56580352783203, -3.4697799682617188, 9.626243591308594, 22.722259521484375, 35.81828308105469, 48.914306640625, 62.01033020019531, 75.10635375976562, 88.2023696899414, 101.29839324951172, 114.39441680908203, 127.49043273925781, 140.58645629882812, 153.68247985839844]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 9.0, 14.0, 14.0, 8.0, 9.0, 12.0, 15.0, 18.0, 18.0, 27.0, 25.0, 29.0, 31.0, 28.0, 32.0, 33.0, 35.0, 38.0, 47.0, 39.0, 47.0, 52.0, 24.0, 35.0, 33.0, 39.0, 35.0, 35.0, 26.0, 32.0, 22.0, 19.0, 21.0, 12.0, 16.0, 13.0, 11.0, 9.0, 10.0, 6.0, 5.0, 3.0, 4.0, 4.0, 2.0, 5.0, 0.0, 2.0, 1.0, 1.0], "bins": [-96.74041748046875, -93.87686157226562, -91.01329803466797, -88.14974212646484, -85.28617858886719, -82.42262268066406, -79.55906677246094, -76.69550323486328, -73.83193969726562, -70.9683837890625, -68.10482025146484, -65.24126434326172, -62.37770080566406, -59.51414489746094, -56.65058517456055, -53.787025451660156, -50.92346954345703, -48.05990982055664, -45.19635009765625, -42.332794189453125, -39.46923065185547, -36.605674743652344, -33.74211502075195, -30.878555297851562, -28.014995574951172, -25.15143585205078, -22.28787612915039, -19.424318313598633, -16.560758590698242, -13.697198867797852, -10.833641052246094, -7.970081329345703, -5.1065216064453125, -2.24296236038208, 0.6205968856811523, 3.4841556549072266, 6.347715377807617, 9.211275100708008, 12.074832916259766, 14.938392639160156, 17.801952362060547, 20.665512084960938, 23.529071807861328, 26.392629623413086, 29.256189346313477, 32.1197509765625, 34.983306884765625, 37.846866607666016, 40.710426330566406, 43.5739860534668, 46.43754577636719, 49.30110168457031, 52.16466522216797, 55.028221130371094, 57.891780853271484, 60.755340576171875, 63.618900299072266, 66.48246002197266, 69.34601593017578, 72.20957946777344, 75.07313537597656, 77.93669891357422, 80.80025482177734, 83.663818359375, 86.52737426757812]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 3.0, 10.0, 5.0, 8.0, 5.0, 18.0, 19.0, 17.0, 41.0, 43.0, 72.0, 112.0, 176.0, 308.0, 661.0, 1398.0, 3211.0, 9049.0, 29547.0, 124192.0, 586522.0, 224545.0, 47015.0, 13104.0, 4604.0, 1906.0, 873.0, 421.0, 236.0, 149.0, 97.0, 51.0, 36.0, 30.0, 19.0, 15.0, 10.0, 5.0, 6.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-106.125, -102.876953125, -99.62890625, -96.380859375, -93.1328125, -89.884765625, -86.63671875, -83.388671875, -80.140625, -76.892578125, -73.64453125, -70.396484375, -67.1484375, -63.900390625, -60.65234375, -57.404296875, -54.15625, -50.908203125, -47.66015625, -44.412109375, -41.1640625, -37.916015625, -34.66796875, -31.419921875, -28.171875, -24.923828125, -21.67578125, -18.427734375, -15.1796875, -11.931640625, -8.68359375, -5.435546875, -2.1875, 1.060546875, 4.30859375, 7.556640625, 10.8046875, 14.052734375, 17.30078125, 20.548828125, 23.796875, 27.044921875, 30.29296875, 33.541015625, 36.7890625, 40.037109375, 43.28515625, 46.533203125, 49.78125, 53.029296875, 56.27734375, 59.525390625, 62.7734375, 66.021484375, 69.26953125, 72.517578125, 75.765625, 79.013671875, 82.26171875, 85.509765625, 88.7578125, 92.005859375, 95.25390625, 98.501953125, 101.75]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 3.0, 8.0, 12.0, 17.0, 20.0, 23.0, 30.0, 42.0, 52.0, 43.0, 64.0, 65.0, 73.0, 67.0, 60.0, 72.0, 67.0, 53.0, 54.0, 36.0, 37.0, 22.0, 30.0, 16.0, 14.0, 7.0, 9.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.71875, -9.309326171875, -8.89990234375, -8.490478515625, -8.0810546875, -7.671630859375, -7.26220703125, -6.852783203125, -6.443359375, -6.033935546875, -5.62451171875, -5.215087890625, -4.8056640625, -4.396240234375, -3.98681640625, -3.577392578125, -3.16796875, -2.758544921875, -2.34912109375, -1.939697265625, -1.5302734375, -1.120849609375, -0.71142578125, -0.302001953125, 0.107421875, 0.516845703125, 0.92626953125, 1.335693359375, 1.7451171875, 2.154541015625, 2.56396484375, 2.973388671875, 3.3828125, 3.792236328125, 4.20166015625, 4.611083984375, 5.0205078125, 5.429931640625, 5.83935546875, 6.248779296875, 6.658203125, 7.067626953125, 7.47705078125, 7.886474609375, 8.2958984375, 8.705322265625, 9.11474609375, 9.524169921875, 9.93359375, 10.343017578125, 10.75244140625, 11.161865234375, 11.5712890625, 11.980712890625, 12.39013671875, 12.799560546875, 13.208984375, 13.618408203125, 14.02783203125, 14.437255859375, 14.8466796875, 15.256103515625, 15.66552734375, 16.074951171875, 16.484375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 8.0, 6.0, 10.0, 18.0, 24.0, 29.0, 53.0, 66.0, 131.0, 170.0, 283.0, 498.0, 900.0, 1691.0, 3623.0, 9070.0, 30584.0, 130599.0, 569055.0, 230399.0, 48232.0, 13315.0, 4867.0, 2139.0, 1143.0, 615.0, 376.0, 223.0, 159.0, 85.0, 53.0, 42.0, 24.0, 23.0, 10.0, 13.0, 4.0, 5.0, 4.0, 4.0, 1.0, 1.0, 1.0], "bins": [-104.9375, -102.2919921875, -99.646484375, -97.0009765625, -94.35546875, -91.7099609375, -89.064453125, -86.4189453125, -83.7734375, -81.1279296875, -78.482421875, -75.8369140625, -73.19140625, -70.5458984375, -67.900390625, -65.2548828125, -62.609375, -59.9638671875, -57.318359375, -54.6728515625, -52.02734375, -49.3818359375, -46.736328125, -44.0908203125, -41.4453125, -38.7998046875, -36.154296875, -33.5087890625, -30.86328125, -28.2177734375, -25.572265625, -22.9267578125, -20.28125, -17.6357421875, -14.990234375, -12.3447265625, -9.69921875, -7.0537109375, -4.408203125, -1.7626953125, 0.8828125, 3.5283203125, 6.173828125, 8.8193359375, 11.46484375, 14.1103515625, 16.755859375, 19.4013671875, 22.046875, 24.6923828125, 27.337890625, 29.9833984375, 32.62890625, 35.2744140625, 37.919921875, 40.5654296875, 43.2109375, 45.8564453125, 48.501953125, 51.1474609375, 53.79296875, 56.4384765625, 59.083984375, 61.7294921875, 64.375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 8.0, 9.0, 7.0, 6.0, 11.0, 16.0, 10.0, 19.0, 18.0, 19.0, 26.0, 32.0, 33.0, 35.0, 33.0, 49.0, 37.0, 44.0, 48.0, 44.0, 39.0, 39.0, 56.0, 31.0, 50.0, 25.0, 21.0, 37.0, 34.0, 22.0, 19.0, 15.0, 27.0, 20.0, 16.0, 12.0, 2.0, 7.0, 12.0, 5.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.59375, -30.4697265625, -29.345703125, -28.2216796875, -27.09765625, -25.9736328125, -24.849609375, -23.7255859375, -22.6015625, -21.4775390625, -20.353515625, -19.2294921875, -18.10546875, -16.9814453125, -15.857421875, -14.7333984375, -13.609375, -12.4853515625, -11.361328125, -10.2373046875, -9.11328125, -7.9892578125, -6.865234375, -5.7412109375, -4.6171875, -3.4931640625, -2.369140625, -1.2451171875, -0.12109375, 1.0029296875, 2.126953125, 3.2509765625, 4.375, 5.4990234375, 6.623046875, 7.7470703125, 8.87109375, 9.9951171875, 11.119140625, 12.2431640625, 13.3671875, 14.4912109375, 15.615234375, 16.7392578125, 17.86328125, 18.9873046875, 20.111328125, 21.2353515625, 22.359375, 23.4833984375, 24.607421875, 25.7314453125, 26.85546875, 27.9794921875, 29.103515625, 30.2275390625, 31.3515625, 32.4755859375, 33.599609375, 34.7236328125, 35.84765625, 36.9716796875, 38.095703125, 39.2197265625, 40.34375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 6.0, 2.0, 2.0, 8.0, 6.0, 10.0, 18.0, 33.0, 38.0, 59.0, 92.0, 159.0, 285.0, 488.0, 1045.0, 2558.0, 8935.0, 97794.0, 874453.0, 51792.0, 6600.0, 2193.0, 947.0, 410.0, 252.0, 99.0, 84.0, 65.0, 34.0, 30.0, 16.0, 10.0, 6.0, 13.0, 2.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0], "bins": [-90.125, -87.6494140625, -85.173828125, -82.6982421875, -80.22265625, -77.7470703125, -75.271484375, -72.7958984375, -70.3203125, -67.8447265625, -65.369140625, -62.8935546875, -60.41796875, -57.9423828125, -55.466796875, -52.9912109375, -50.515625, -48.0400390625, -45.564453125, -43.0888671875, -40.61328125, -38.1376953125, -35.662109375, -33.1865234375, -30.7109375, -28.2353515625, -25.759765625, -23.2841796875, -20.80859375, -18.3330078125, -15.857421875, -13.3818359375, -10.90625, -8.4306640625, -5.955078125, -3.4794921875, -1.00390625, 1.4716796875, 3.947265625, 6.4228515625, 8.8984375, 11.3740234375, 13.849609375, 16.3251953125, 18.80078125, 21.2763671875, 23.751953125, 26.2275390625, 28.703125, 31.1787109375, 33.654296875, 36.1298828125, 38.60546875, 41.0810546875, 43.556640625, 46.0322265625, 48.5078125, 50.9833984375, 53.458984375, 55.9345703125, 58.41015625, 60.8857421875, 63.361328125, 65.8369140625, 68.3125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 3.0, 4.0, 3.0, 9.0, 13.0, 6.0, 12.0, 15.0, 28.0, 37.0, 69.0, 99.0, 172.0, 180.0, 115.0, 74.0, 45.0, 29.0, 20.0, 28.0, 9.0, 8.0, 5.0, 4.0, 3.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005992889404296875, -0.0057623982429504395, -0.005531907081604004, -0.005301415920257568, -0.005070924758911133, -0.004840433597564697, -0.004609942436218262, -0.004379451274871826, -0.004148960113525391, -0.003918468952178955, -0.0036879777908325195, -0.003457486629486084, -0.0032269954681396484, -0.002996504306793213, -0.0027660131454467773, -0.002535521984100342, -0.0023050308227539062, -0.0020745396614074707, -0.0018440485000610352, -0.0016135573387145996, -0.001383066177368164, -0.0011525750160217285, -0.000922083854675293, -0.0006915926933288574, -0.0004611015319824219, -0.00023061037063598633, -1.1920928955078125e-07, 0.00023037195205688477, 0.0004608631134033203, 0.0006913542747497559, 0.0009218454360961914, 0.001152336597442627, 0.0013828277587890625, 0.001613318920135498, 0.0018438100814819336, 0.002074301242828369, 0.0023047924041748047, 0.0025352835655212402, 0.0027657747268676758, 0.0029962658882141113, 0.003226757049560547, 0.0034572482109069824, 0.003687739372253418, 0.0039182305335998535, 0.004148721694946289, 0.004379212856292725, 0.00460970401763916, 0.004840195178985596, 0.005070686340332031, 0.005301177501678467, 0.005531668663024902, 0.005762159824371338, 0.0059926509857177734, 0.006223142147064209, 0.0064536333084106445, 0.00668412446975708, 0.006914615631103516, 0.007145106792449951, 0.007375597953796387, 0.007606089115142822, 0.007836580276489258, 0.008067071437835693, 0.008297562599182129, 0.008528053760528564, 0.008758544921875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 6.0, 8.0, 8.0, 17.0, 27.0, 28.0, 48.0, 68.0, 117.0, 206.0, 428.0, 1066.0, 3109.0, 14466.0, 696757.0, 317386.0, 10527.0, 2510.0, 939.0, 361.0, 177.0, 104.0, 59.0, 47.0, 36.0, 22.0, 6.0, 7.0, 4.0, 3.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-102.0, -98.9013671875, -95.802734375, -92.7041015625, -89.60546875, -86.5068359375, -83.408203125, -80.3095703125, -77.2109375, -74.1123046875, -71.013671875, -67.9150390625, -64.81640625, -61.7177734375, -58.619140625, -55.5205078125, -52.421875, -49.3232421875, -46.224609375, -43.1259765625, -40.02734375, -36.9287109375, -33.830078125, -30.7314453125, -27.6328125, -24.5341796875, -21.435546875, -18.3369140625, -15.23828125, -12.1396484375, -9.041015625, -5.9423828125, -2.84375, 0.2548828125, 3.353515625, 6.4521484375, 9.55078125, 12.6494140625, 15.748046875, 18.8466796875, 21.9453125, 25.0439453125, 28.142578125, 31.2412109375, 34.33984375, 37.4384765625, 40.537109375, 43.6357421875, 46.734375, 49.8330078125, 52.931640625, 56.0302734375, 59.12890625, 62.2275390625, 65.326171875, 68.4248046875, 71.5234375, 74.6220703125, 77.720703125, 80.8193359375, 83.91796875, 87.0166015625, 90.115234375, 93.2138671875, 96.3125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 10.0, 3.0, 4.0, 10.0, 11.0, 30.0, 43.0, 82.0, 170.0, 237.0, 183.0, 104.0, 41.0, 26.0, 14.0, 14.0, 6.0, 4.0, 6.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.03125, -46.64599609375, -45.2607421875, -43.87548828125, -42.490234375, -41.10498046875, -39.7197265625, -38.33447265625, -36.94921875, -35.56396484375, -34.1787109375, -32.79345703125, -31.408203125, -30.02294921875, -28.6376953125, -27.25244140625, -25.8671875, -24.48193359375, -23.0966796875, -21.71142578125, -20.326171875, -18.94091796875, -17.5556640625, -16.17041015625, -14.78515625, -13.39990234375, -12.0146484375, -10.62939453125, -9.244140625, -7.85888671875, -6.4736328125, -5.08837890625, -3.703125, -2.31787109375, -0.9326171875, 0.45263671875, 1.837890625, 3.22314453125, 4.6083984375, 5.99365234375, 7.37890625, 8.76416015625, 10.1494140625, 11.53466796875, 12.919921875, 14.30517578125, 15.6904296875, 17.07568359375, 18.4609375, 19.84619140625, 21.2314453125, 22.61669921875, 24.001953125, 25.38720703125, 26.7724609375, 28.15771484375, 29.54296875, 30.92822265625, 32.3134765625, 33.69873046875, 35.083984375, 36.46923828125, 37.8544921875, 39.23974609375, 40.625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 5.0, 21.0, 27.0, 60.0, 136.0, 206.0, 200.0, 160.0, 96.0, 49.0, 21.0, 9.0, 5.0, 6.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-867.89501953125, -845.2411499023438, -822.5872802734375, -799.9334716796875, -777.2796020507812, -754.625732421875, -731.9718627929688, -709.3179931640625, -686.6641845703125, -664.0103149414062, -641.3564453125, -618.70263671875, -596.0487670898438, -573.3948974609375, -550.7410278320312, -528.087158203125, -505.43328857421875, -482.7794189453125, -460.1255798339844, -437.4717102050781, -414.81787109375, -392.16400146484375, -369.5101318359375, -346.85626220703125, -324.2024230957031, -301.5485534667969, -278.89471435546875, -256.2408447265625, -233.5869903564453, -210.93313598632812, -188.27926635742188, -165.6254119873047, -142.9715576171875, -120.31770324707031, -97.6638412475586, -75.00997924804688, -52.35612487792969, -29.7022705078125, -7.04840087890625, 15.605453491210938, 38.259307861328125, 60.91316604614258, 83.56702423095703, 106.22088623046875, 128.87474060058594, 151.52859497070312, 174.18246459960938, 196.83631896972656, 219.49017333984375, 242.14402770996094, 264.7978820800781, 287.4517517089844, 310.1055908203125, 332.75946044921875, 355.413330078125, 378.06719970703125, 400.7210388183594, 423.3749084472656, 446.02874755859375, 468.6826171875, 491.33648681640625, 513.9903564453125, 536.6441650390625, 559.2980346679688, 581.951904296875]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 4.0, 6.0, 6.0, 6.0, 9.0, 15.0, 9.0, 17.0, 17.0, 25.0, 22.0, 20.0, 25.0, 28.0, 24.0, 50.0, 41.0, 39.0, 38.0, 37.0, 50.0, 37.0, 47.0, 30.0, 36.0, 33.0, 41.0, 30.0, 32.0, 28.0, 32.0, 33.0, 26.0, 21.0, 17.0, 7.0, 7.0, 16.0, 11.0, 6.0, 3.0, 4.0, 5.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-168.54010009765625, -162.70712280273438, -156.8741455078125, -151.04115295410156, -145.2081756591797, -139.3751983642578, -133.54222106933594, -127.70923614501953, -121.87625122070312, -116.04327392578125, -110.21028900146484, -104.37731170654297, -98.54432678222656, -92.71134948730469, -86.87837219238281, -81.0453872680664, -75.21240997314453, -69.37943267822266, -63.54644775390625, -57.713470458984375, -51.88048553466797, -46.047508239746094, -40.21452713012695, -34.38154602050781, -28.548564910888672, -22.71558380126953, -16.88260269165039, -11.049623489379883, -5.216642379760742, 0.6163387298583984, 6.449317932128906, 12.282299041748047, 18.115280151367188, 23.948261260986328, 29.78124237060547, 35.614219665527344, 41.44720458984375, 47.280181884765625, 53.113162994384766, 58.946144104003906, 64.77912902832031, 70.61210632324219, 76.4450912475586, 82.27806854248047, 88.11105346679688, 93.94403076171875, 99.77700805664062, 105.60999298095703, 111.4429702758789, 117.27594757080078, 123.10893249511719, 128.94190979003906, 134.77488708496094, 140.60787963867188, 146.44085693359375, 152.27383422851562, 158.1068115234375, 163.93978881835938, 169.77276611328125, 175.6057586669922, 181.43873596191406, 187.27171325683594, 193.1046905517578, 198.93768310546875, 204.77066040039062]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 1.0, 4.0, 9.0, 7.0, 12.0, 10.0, 23.0, 26.0, 60.0, 66.0, 118.0, 219.0, 497.0, 1172.0, 3104.0, 10251.0, 44525.0, 773574.0, 3284950.0, 57107.0, 12372.0, 3639.0, 1325.0, 553.0, 256.0, 163.0, 73.0, 52.0, 34.0, 26.0, 17.0, 21.0, 7.0, 4.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-156.125, -151.796875, -147.46875, -143.140625, -138.8125, -134.484375, -130.15625, -125.828125, -121.5, -117.171875, -112.84375, -108.515625, -104.1875, -99.859375, -95.53125, -91.203125, -86.875, -82.546875, -78.21875, -73.890625, -69.5625, -65.234375, -60.90625, -56.578125, -52.25, -47.921875, -43.59375, -39.265625, -34.9375, -30.609375, -26.28125, -21.953125, -17.625, -13.296875, -8.96875, -4.640625, -0.3125, 4.015625, 8.34375, 12.671875, 17.0, 21.328125, 25.65625, 29.984375, 34.3125, 38.640625, 42.96875, 47.296875, 51.625, 55.953125, 60.28125, 64.609375, 68.9375, 73.265625, 77.59375, 81.921875, 86.25, 90.578125, 94.90625, 99.234375, 103.5625, 107.890625, 112.21875, 116.546875, 120.875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 9.0, 5.0, 17.0, 18.0, 17.0, 27.0, 37.0, 47.0, 56.0, 48.0, 65.0, 61.0, 66.0, 66.0, 68.0, 68.0, 65.0, 52.0, 48.0, 30.0, 39.0, 26.0, 17.0, 16.0, 10.0, 7.0, 7.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.4140625, -10.0013427734375, -9.588623046875, -9.1759033203125, -8.76318359375, -8.3504638671875, -7.937744140625, -7.5250244140625, -7.1123046875, -6.6995849609375, -6.286865234375, -5.8741455078125, -5.46142578125, -5.0487060546875, -4.635986328125, -4.2232666015625, -3.810546875, -3.3978271484375, -2.985107421875, -2.5723876953125, -2.15966796875, -1.7469482421875, -1.334228515625, -0.9215087890625, -0.5087890625, -0.0960693359375, 0.316650390625, 0.7293701171875, 1.14208984375, 1.5548095703125, 1.967529296875, 2.3802490234375, 2.79296875, 3.2056884765625, 3.618408203125, 4.0311279296875, 4.44384765625, 4.8565673828125, 5.269287109375, 5.6820068359375, 6.0947265625, 6.5074462890625, 6.920166015625, 7.3328857421875, 7.74560546875, 8.1583251953125, 8.571044921875, 8.9837646484375, 9.396484375, 9.8092041015625, 10.221923828125, 10.6346435546875, 11.04736328125, 11.4600830078125, 11.872802734375, 12.2855224609375, 12.6982421875, 13.1109619140625, 13.523681640625, 13.9364013671875, 14.34912109375, 14.7618408203125, 15.174560546875, 15.5872802734375, 16.0]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 2.0, 4.0, 8.0, 16.0, 26.0, 29.0, 55.0, 83.0, 133.0, 231.0, 424.0, 863.0, 1662.0, 3544.0, 7902.0, 19614.0, 56999.0, 245600.0, 3393386.0, 352906.0, 69997.0, 23511.0, 9367.0, 4066.0, 1812.0, 890.0, 476.0, 268.0, 170.0, 96.0, 51.0, 32.0, 27.0, 16.0, 10.0, 6.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.90625, -44.73291015625, -42.5595703125, -40.38623046875, -38.212890625, -36.03955078125, -33.8662109375, -31.69287109375, -29.51953125, -27.34619140625, -25.1728515625, -22.99951171875, -20.826171875, -18.65283203125, -16.4794921875, -14.30615234375, -12.1328125, -9.95947265625, -7.7861328125, -5.61279296875, -3.439453125, -1.26611328125, 0.9072265625, 3.08056640625, 5.25390625, 7.42724609375, 9.6005859375, 11.77392578125, 13.947265625, 16.12060546875, 18.2939453125, 20.46728515625, 22.640625, 24.81396484375, 26.9873046875, 29.16064453125, 31.333984375, 33.50732421875, 35.6806640625, 37.85400390625, 40.02734375, 42.20068359375, 44.3740234375, 46.54736328125, 48.720703125, 50.89404296875, 53.0673828125, 55.24072265625, 57.4140625, 59.58740234375, 61.7607421875, 63.93408203125, 66.107421875, 68.28076171875, 70.4541015625, 72.62744140625, 74.80078125, 76.97412109375, 79.1474609375, 81.32080078125, 83.494140625, 85.66748046875, 87.8408203125, 90.01416015625, 92.1875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 8.0, 6.0, 3.0, 6.0, 15.0, 23.0, 41.0, 61.0, 46.0, 79.0, 121.0, 271.0, 853.0, 1613.0, 383.0, 183.0, 83.0, 75.0, 57.0, 40.0, 25.0, 14.0, 14.0, 14.0, 10.0, 9.0, 6.0, 4.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.171875, -20.295654296875, -19.41943359375, -18.543212890625, -17.6669921875, -16.790771484375, -15.91455078125, -15.038330078125, -14.162109375, -13.285888671875, -12.40966796875, -11.533447265625, -10.6572265625, -9.781005859375, -8.90478515625, -8.028564453125, -7.15234375, -6.276123046875, -5.39990234375, -4.523681640625, -3.6474609375, -2.771240234375, -1.89501953125, -1.018798828125, -0.142578125, 0.733642578125, 1.60986328125, 2.486083984375, 3.3623046875, 4.238525390625, 5.11474609375, 5.990966796875, 6.8671875, 7.743408203125, 8.61962890625, 9.495849609375, 10.3720703125, 11.248291015625, 12.12451171875, 13.000732421875, 13.876953125, 14.753173828125, 15.62939453125, 16.505615234375, 17.3818359375, 18.258056640625, 19.13427734375, 20.010498046875, 20.88671875, 21.762939453125, 22.63916015625, 23.515380859375, 24.3916015625, 25.267822265625, 26.14404296875, 27.020263671875, 27.896484375, 28.772705078125, 29.64892578125, 30.525146484375, 31.4013671875, 32.277587890625, 33.15380859375, 34.030029296875, 34.90625]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 6.0, 4.0, 22.0, 62.0, 166.0, 250.0, 234.0, 142.0, 73.0, 26.0, 13.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-558.0977172851562, -545.6300048828125, -533.1622924804688, -520.694580078125, -508.2268981933594, -495.7591857910156, -483.29150390625, -470.82379150390625, -458.3560791015625, -445.88836669921875, -433.4206848144531, -420.9529724121094, -408.4852600097656, -396.0175476074219, -383.54986572265625, -371.0821533203125, -358.61444091796875, -346.146728515625, -333.6790466308594, -321.2113342285156, -308.7436218261719, -296.2759094238281, -283.8082275390625, -271.34051513671875, -258.8728332519531, -246.40513610839844, -233.9374237060547, -221.4697265625, -209.00201416015625, -196.53431701660156, -184.06661987304688, -171.59890747070312, -159.13121032714844, -146.66351318359375, -134.19580078125, -121.72810363769531, -109.26039123535156, -96.79269409179688, -84.32498931884766, -71.85728454589844, -59.38957977294922, -46.921875, -34.45417022705078, -21.986469268798828, -9.51876449584961, 2.9489402770996094, 15.416641235351562, 27.88434600830078, 40.35205078125, 52.81975555419922, 65.28746032714844, 77.75515747070312, 90.22286987304688, 102.69056701660156, 115.15827178955078, 127.6259765625, 140.09368896484375, 152.56138610839844, 165.0290985107422, 177.49679565429688, 189.96450805664062, 202.4322052001953, 214.89990234375, 227.36761474609375, 239.83531188964844]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 7.0, 3.0, 10.0, 10.0, 20.0, 14.0, 16.0, 23.0, 29.0, 21.0, 37.0, 46.0, 47.0, 52.0, 43.0, 59.0, 49.0, 45.0, 62.0, 47.0, 51.0, 48.0, 39.0, 42.0, 34.0, 35.0, 25.0, 21.0, 18.0, 12.0, 11.0, 10.0, 7.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-131.56179809570312, -128.248046875, -124.93431091308594, -121.62055969238281, -118.30681610107422, -114.99307250976562, -111.6793212890625, -108.3655776977539, -105.05183410644531, -101.73809051513672, -98.42434692382812, -95.110595703125, -91.7968521118164, -88.48310852050781, -85.16935729980469, -81.8556137084961, -78.5418701171875, -75.2281265258789, -71.91438293457031, -68.60063171386719, -65.2868881225586, -61.97314453125, -58.65939712524414, -55.34564971923828, -52.03190612792969, -48.718162536621094, -45.404415130615234, -42.090667724609375, -38.77692413330078, -35.46318054199219, -32.14943313598633, -28.8356876373291, -25.521942138671875, -22.20819664001465, -18.894451141357422, -15.580705642700195, -12.266960144042969, -8.953214645385742, -5.639469146728516, -2.325723648071289, 0.9880218505859375, 4.301767349243164, 7.615512847900391, 10.929258346557617, 14.243003845214844, 17.55674934387207, 20.870494842529297, 24.184240341186523, 27.49798583984375, 30.811731338500977, 34.1254768371582, 37.43922424316406, 40.752967834472656, 44.06671142578125, 47.38045883178711, 50.69420623779297, 54.00794982910156, 57.321693420410156, 60.635440826416016, 63.949188232421875, 67.26293182373047, 70.57667541503906, 73.89042663574219, 77.20417022705078, 80.51791381835938]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 4.0, 15.0, 14.0, 18.0, 31.0, 41.0, 56.0, 95.0, 130.0, 262.0, 472.0, 994.0, 2770.0, 8621.0, 31629.0, 134480.0, 607042.0, 200624.0, 43797.0, 11262.0, 3490.0, 1349.0, 579.0, 322.0, 165.0, 95.0, 64.0, 44.0, 30.0, 16.0, 12.0, 10.0, 6.0, 5.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-82.6875, -79.693359375, -76.69921875, -73.705078125, -70.7109375, -67.716796875, -64.72265625, -61.728515625, -58.734375, -55.740234375, -52.74609375, -49.751953125, -46.7578125, -43.763671875, -40.76953125, -37.775390625, -34.78125, -31.787109375, -28.79296875, -25.798828125, -22.8046875, -19.810546875, -16.81640625, -13.822265625, -10.828125, -7.833984375, -4.83984375, -1.845703125, 1.1484375, 4.142578125, 7.13671875, 10.130859375, 13.125, 16.119140625, 19.11328125, 22.107421875, 25.1015625, 28.095703125, 31.08984375, 34.083984375, 37.078125, 40.072265625, 43.06640625, 46.060546875, 49.0546875, 52.048828125, 55.04296875, 58.037109375, 61.03125, 64.025390625, 67.01953125, 70.013671875, 73.0078125, 76.001953125, 78.99609375, 81.990234375, 84.984375, 87.978515625, 90.97265625, 93.966796875, 96.9609375, 99.955078125, 102.94921875, 105.943359375, 108.9375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 6.0, 2.0, 5.0, 6.0, 5.0, 13.0, 20.0, 22.0, 26.0, 32.0, 49.0, 31.0, 39.0, 44.0, 62.0, 63.0, 73.0, 49.0, 65.0, 67.0, 54.0, 47.0, 49.0, 34.0, 44.0, 26.0, 14.0, 20.0, 15.0, 7.0, 6.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.9140625, -9.5032958984375, -9.092529296875, -8.6817626953125, -8.27099609375, -7.8602294921875, -7.449462890625, -7.0386962890625, -6.6279296875, -6.2171630859375, -5.806396484375, -5.3956298828125, -4.98486328125, -4.5740966796875, -4.163330078125, -3.7525634765625, -3.341796875, -2.9310302734375, -2.520263671875, -2.1094970703125, -1.69873046875, -1.2879638671875, -0.877197265625, -0.4664306640625, -0.0556640625, 0.3551025390625, 0.765869140625, 1.1766357421875, 1.58740234375, 1.9981689453125, 2.408935546875, 2.8197021484375, 3.23046875, 3.6412353515625, 4.052001953125, 4.4627685546875, 4.87353515625, 5.2843017578125, 5.695068359375, 6.1058349609375, 6.5166015625, 6.9273681640625, 7.338134765625, 7.7489013671875, 8.15966796875, 8.5704345703125, 8.981201171875, 9.3919677734375, 9.802734375, 10.2135009765625, 10.624267578125, 11.0350341796875, 11.44580078125, 11.8565673828125, 12.267333984375, 12.6781005859375, 13.0888671875, 13.4996337890625, 13.910400390625, 14.3211669921875, 14.73193359375, 15.1427001953125, 15.553466796875, 15.9642333984375, 16.375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 5.0, 12.0, 9.0, 11.0, 10.0, 18.0, 30.0, 49.0, 67.0, 114.0, 169.0, 314.0, 574.0, 1240.0, 2937.0, 7496.0, 21829.0, 64155.0, 223559.0, 492767.0, 158052.0, 48220.0, 16468.0, 5869.0, 2297.0, 1029.0, 500.0, 258.0, 157.0, 106.0, 61.0, 51.0, 40.0, 21.0, 16.0, 16.0, 9.0, 10.0, 6.0, 6.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.25, -46.4873046875, -44.724609375, -42.9619140625, -41.19921875, -39.4365234375, -37.673828125, -35.9111328125, -34.1484375, -32.3857421875, -30.623046875, -28.8603515625, -27.09765625, -25.3349609375, -23.572265625, -21.8095703125, -20.046875, -18.2841796875, -16.521484375, -14.7587890625, -12.99609375, -11.2333984375, -9.470703125, -7.7080078125, -5.9453125, -4.1826171875, -2.419921875, -0.6572265625, 1.10546875, 2.8681640625, 4.630859375, 6.3935546875, 8.15625, 9.9189453125, 11.681640625, 13.4443359375, 15.20703125, 16.9697265625, 18.732421875, 20.4951171875, 22.2578125, 24.0205078125, 25.783203125, 27.5458984375, 29.30859375, 31.0712890625, 32.833984375, 34.5966796875, 36.359375, 38.1220703125, 39.884765625, 41.6474609375, 43.41015625, 45.1728515625, 46.935546875, 48.6982421875, 50.4609375, 52.2236328125, 53.986328125, 55.7490234375, 57.51171875, 59.2744140625, 61.037109375, 62.7998046875, 64.5625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 6.0, 2.0, 3.0, 2.0, 7.0, 7.0, 8.0, 14.0, 20.0, 18.0, 27.0, 34.0, 35.0, 31.0, 39.0, 54.0, 44.0, 48.0, 45.0, 52.0, 60.0, 60.0, 44.0, 38.0, 44.0, 39.0, 30.0, 27.0, 22.0, 24.0, 25.0, 25.0, 14.0, 14.0, 8.0, 8.0, 5.0, 7.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.875, -37.4736328125, -36.072265625, -34.6708984375, -33.26953125, -31.8681640625, -30.466796875, -29.0654296875, -27.6640625, -26.2626953125, -24.861328125, -23.4599609375, -22.05859375, -20.6572265625, -19.255859375, -17.8544921875, -16.453125, -15.0517578125, -13.650390625, -12.2490234375, -10.84765625, -9.4462890625, -8.044921875, -6.6435546875, -5.2421875, -3.8408203125, -2.439453125, -1.0380859375, 0.36328125, 1.7646484375, 3.166015625, 4.5673828125, 5.96875, 7.3701171875, 8.771484375, 10.1728515625, 11.57421875, 12.9755859375, 14.376953125, 15.7783203125, 17.1796875, 18.5810546875, 19.982421875, 21.3837890625, 22.78515625, 24.1865234375, 25.587890625, 26.9892578125, 28.390625, 29.7919921875, 31.193359375, 32.5947265625, 33.99609375, 35.3974609375, 36.798828125, 38.2001953125, 39.6015625, 41.0029296875, 42.404296875, 43.8056640625, 45.20703125, 46.6083984375, 48.009765625, 49.4111328125, 50.8125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 6.0, 7.0, 7.0, 7.0, 16.0, 14.0, 20.0, 23.0, 27.0, 51.0, 66.0, 130.0, 206.0, 346.0, 734.0, 1526.0, 3880.0, 10108.0, 33334.0, 141742.0, 511671.0, 262355.0, 56852.0, 15632.0, 5438.0, 2206.0, 962.0, 465.0, 237.0, 157.0, 88.0, 73.0, 53.0, 34.0, 22.0, 22.0, 11.0, 2.0, 5.0, 5.0, 1.0, 5.0, 0.0, 8.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-21.5625, -20.783935546875, -20.00537109375, -19.226806640625, -18.4482421875, -17.669677734375, -16.89111328125, -16.112548828125, -15.333984375, -14.555419921875, -13.77685546875, -12.998291015625, -12.2197265625, -11.441162109375, -10.66259765625, -9.884033203125, -9.10546875, -8.326904296875, -7.54833984375, -6.769775390625, -5.9912109375, -5.212646484375, -4.43408203125, -3.655517578125, -2.876953125, -2.098388671875, -1.31982421875, -0.541259765625, 0.2373046875, 1.015869140625, 1.79443359375, 2.572998046875, 3.3515625, 4.130126953125, 4.90869140625, 5.687255859375, 6.4658203125, 7.244384765625, 8.02294921875, 8.801513671875, 9.580078125, 10.358642578125, 11.13720703125, 11.915771484375, 12.6943359375, 13.472900390625, 14.25146484375, 15.030029296875, 15.80859375, 16.587158203125, 17.36572265625, 18.144287109375, 18.9228515625, 19.701416015625, 20.47998046875, 21.258544921875, 22.037109375, 22.815673828125, 23.59423828125, 24.372802734375, 25.1513671875, 25.929931640625, 26.70849609375, 27.487060546875, 28.265625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 11.0, 6.0, 15.0, 23.0, 47.0, 76.0, 143.0, 253.0, 217.0, 95.0, 46.0, 27.0, 17.0, 11.0, 3.0, 4.0, 7.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0129241943359375, -0.012634813785552979, -0.012345433235168457, -0.012056052684783936, -0.011766672134399414, -0.011477291584014893, -0.011187911033630371, -0.01089853048324585, -0.010609149932861328, -0.010319769382476807, -0.010030388832092285, -0.009741008281707764, -0.009451627731323242, -0.00916224718093872, -0.0088728666305542, -0.008583486080169678, -0.008294105529785156, -0.008004724979400635, -0.007715344429016113, -0.007425963878631592, -0.00713658332824707, -0.006847202777862549, -0.006557822227478027, -0.006268441677093506, -0.005979061126708984, -0.005689680576324463, -0.005400300025939941, -0.00511091947555542, -0.0048215389251708984, -0.004532158374786377, -0.0042427778244018555, -0.003953397274017334, -0.0036640167236328125, -0.003374636173248291, -0.0030852556228637695, -0.002795875072479248, -0.0025064945220947266, -0.002217113971710205, -0.0019277334213256836, -0.0016383528709411621, -0.0013489723205566406, -0.0010595917701721191, -0.0007702112197875977, -0.00048083066940307617, -0.0001914501190185547, 9.79304313659668e-05, 0.0003873109817504883, 0.0006766915321350098, 0.0009660720825195312, 0.0012554526329040527, 0.0015448331832885742, 0.0018342137336730957, 0.002123594284057617, 0.0024129748344421387, 0.00270235538482666, 0.0029917359352111816, 0.003281116485595703, 0.0035704970359802246, 0.003859877586364746, 0.004149258136749268, 0.004438638687133789, 0.0047280192375183105, 0.005017399787902832, 0.0053067803382873535, 0.005596160888671875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 5.0, 9.0, 12.0, 21.0, 46.0, 82.0, 142.0, 328.0, 805.0, 2656.0, 12512.0, 103031.0, 763007.0, 145146.0, 16057.0, 3119.0, 892.0, 345.0, 173.0, 74.0, 47.0, 29.0, 14.0, 5.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.0625, -43.830078125, -42.59765625, -41.365234375, -40.1328125, -38.900390625, -37.66796875, -36.435546875, -35.203125, -33.970703125, -32.73828125, -31.505859375, -30.2734375, -29.041015625, -27.80859375, -26.576171875, -25.34375, -24.111328125, -22.87890625, -21.646484375, -20.4140625, -19.181640625, -17.94921875, -16.716796875, -15.484375, -14.251953125, -13.01953125, -11.787109375, -10.5546875, -9.322265625, -8.08984375, -6.857421875, -5.625, -4.392578125, -3.16015625, -1.927734375, -0.6953125, 0.537109375, 1.76953125, 3.001953125, 4.234375, 5.466796875, 6.69921875, 7.931640625, 9.1640625, 10.396484375, 11.62890625, 12.861328125, 14.09375, 15.326171875, 16.55859375, 17.791015625, 19.0234375, 20.255859375, 21.48828125, 22.720703125, 23.953125, 25.185546875, 26.41796875, 27.650390625, 28.8828125, 30.115234375, 31.34765625, 32.580078125, 33.8125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 5.0, 6.0, 6.0, 4.0, 3.0, 11.0, 11.0, 14.0, 24.0, 31.0, 32.0, 74.0, 83.0, 97.0, 98.0, 126.0, 82.0, 83.0, 61.0, 53.0, 15.0, 15.0, 14.0, 12.0, 12.0, 4.0, 7.0, 7.0, 6.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.8125, -20.17822265625, -19.5439453125, -18.90966796875, -18.275390625, -17.64111328125, -17.0068359375, -16.37255859375, -15.73828125, -15.10400390625, -14.4697265625, -13.83544921875, -13.201171875, -12.56689453125, -11.9326171875, -11.29833984375, -10.6640625, -10.02978515625, -9.3955078125, -8.76123046875, -8.126953125, -7.49267578125, -6.8583984375, -6.22412109375, -5.58984375, -4.95556640625, -4.3212890625, -3.68701171875, -3.052734375, -2.41845703125, -1.7841796875, -1.14990234375, -0.515625, 0.11865234375, 0.7529296875, 1.38720703125, 2.021484375, 2.65576171875, 3.2900390625, 3.92431640625, 4.55859375, 5.19287109375, 5.8271484375, 6.46142578125, 7.095703125, 7.72998046875, 8.3642578125, 8.99853515625, 9.6328125, 10.26708984375, 10.9013671875, 11.53564453125, 12.169921875, 12.80419921875, 13.4384765625, 14.07275390625, 14.70703125, 15.34130859375, 15.9755859375, 16.60986328125, 17.244140625, 17.87841796875, 18.5126953125, 19.14697265625, 19.78125]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 18.0, 40.0, 115.0, 194.0, 236.0, 201.0, 117.0, 57.0, 16.0, 7.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-896.938720703125, -874.2700805664062, -851.6015014648438, -828.932861328125, -806.2642822265625, -783.5956420898438, -760.927001953125, -738.2584228515625, -715.5897827148438, -692.921142578125, -670.2525634765625, -647.5839233398438, -624.915283203125, -602.2467041015625, -579.5780639648438, -556.909423828125, -534.2408447265625, -511.5722351074219, -488.90362548828125, -466.2349853515625, -443.5663757324219, -420.89776611328125, -398.2291259765625, -375.5605163574219, -352.89190673828125, -330.2232971191406, -307.5546875, -284.88604736328125, -262.2174377441406, -239.548828125, -216.8802032470703, -194.21157836914062, -171.54290771484375, -148.87429809570312, -126.20567321777344, -103.53705596923828, -80.86843872070312, -58.19982147216797, -35.53120422363281, -12.862579345703125, 9.8060302734375, 32.474647521972656, 55.14326477050781, 77.81188201904297, 100.48049926757812, 123.14911651611328, 145.81773376464844, 168.48635864257812, 191.15496826171875, 213.82357788085938, 236.49220275878906, 259.16082763671875, 281.8294372558594, 304.498046875, 327.16668701171875, 349.8352966308594, 372.50390625, 395.1725158691406, 417.84112548828125, 440.509765625, 463.1783752441406, 485.84698486328125, 508.515625, 531.1842041015625, 553.8528442382812]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 7.0, 8.0, 3.0, 7.0, 5.0, 7.0, 14.0, 13.0, 17.0, 14.0, 19.0, 24.0, 29.0, 30.0, 29.0, 43.0, 31.0, 35.0, 41.0, 41.0, 36.0, 36.0, 30.0, 40.0, 42.0, 44.0, 35.0, 36.0, 26.0, 27.0, 32.0, 28.0, 30.0, 21.0, 25.0, 13.0, 19.0, 13.0, 12.0, 9.0, 5.0, 5.0, 6.0, 7.0, 4.0, 0.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 2.0], "bins": [-166.53012084960938, -161.3583221435547, -156.1865234375, -151.01470947265625, -145.84291076660156, -140.67111206054688, -135.4993133544922, -130.3275146484375, -125.15570831298828, -119.9839096069336, -114.81210327148438, -109.64030456542969, -104.468505859375, -99.29669952392578, -94.1249008178711, -88.95309448242188, -83.78129577636719, -78.6094970703125, -73.43769073486328, -68.2658920288086, -63.09408950805664, -57.92228698730469, -52.75048828125, -47.57868576049805, -42.406883239746094, -37.23508071899414, -32.06327819824219, -26.8914794921875, -21.719676971435547, -16.547874450683594, -11.376073837280273, -6.204273223876953, -1.032470703125, 4.139330863952637, 9.311132431030273, 14.48293399810791, 19.654735565185547, 24.8265380859375, 29.99833869934082, 35.17013931274414, 40.341941833496094, 45.51374435424805, 50.685546875, 55.85734558105469, 61.02914810180664, 66.2009506225586, 71.37274932861328, 76.5445556640625, 81.71635437011719, 86.88815307617188, 92.0599594116211, 97.23175811767578, 102.403564453125, 107.57536315917969, 112.74716186523438, 117.91896057128906, 123.09076690673828, 128.2625732421875, 133.4343719482422, 138.60617065429688, 143.77796936035156, 148.94976806640625, 154.12158203125, 159.2933807373047, 164.46517944335938]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 4.0, 13.0, 8.0, 10.0, 19.0, 33.0, 27.0, 54.0, 99.0, 137.0, 220.0, 429.0, 814.0, 1630.0, 3887.0, 10224.0, 33816.0, 167324.0, 3676555.0, 237146.0, 41520.0, 12041.0, 4305.0, 1865.0, 902.0, 471.0, 257.0, 140.0, 99.0, 69.0, 52.0, 36.0, 24.0, 13.0, 8.0, 8.0, 6.0, 6.0, 3.0, 2.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-125.375, -121.5263671875, -117.677734375, -113.8291015625, -109.98046875, -106.1318359375, -102.283203125, -98.4345703125, -94.5859375, -90.7373046875, -86.888671875, -83.0400390625, -79.19140625, -75.3427734375, -71.494140625, -67.6455078125, -63.796875, -59.9482421875, -56.099609375, -52.2509765625, -48.40234375, -44.5537109375, -40.705078125, -36.8564453125, -33.0078125, -29.1591796875, -25.310546875, -21.4619140625, -17.61328125, -13.7646484375, -9.916015625, -6.0673828125, -2.21875, 1.6298828125, 5.478515625, 9.3271484375, 13.17578125, 17.0244140625, 20.873046875, 24.7216796875, 28.5703125, 32.4189453125, 36.267578125, 40.1162109375, 43.96484375, 47.8134765625, 51.662109375, 55.5107421875, 59.359375, 63.2080078125, 67.056640625, 70.9052734375, 74.75390625, 78.6025390625, 82.451171875, 86.2998046875, 90.1484375, 93.9970703125, 97.845703125, 101.6943359375, 105.54296875, 109.3916015625, 113.240234375, 117.0888671875, 120.9375]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 6.0, 9.0, 10.0, 12.0, 12.0, 14.0, 24.0, 23.0, 21.0, 41.0, 36.0, 54.0, 50.0, 53.0, 71.0, 59.0, 53.0, 59.0, 54.0, 52.0, 50.0, 50.0, 36.0, 35.0, 30.0, 24.0, 13.0, 15.0, 13.0, 10.0, 6.0, 4.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.796875, -9.39306640625, -8.9892578125, -8.58544921875, -8.181640625, -7.77783203125, -7.3740234375, -6.97021484375, -6.56640625, -6.16259765625, -5.7587890625, -5.35498046875, -4.951171875, -4.54736328125, -4.1435546875, -3.73974609375, -3.3359375, -2.93212890625, -2.5283203125, -2.12451171875, -1.720703125, -1.31689453125, -0.9130859375, -0.50927734375, -0.10546875, 0.29833984375, 0.7021484375, 1.10595703125, 1.509765625, 1.91357421875, 2.3173828125, 2.72119140625, 3.125, 3.52880859375, 3.9326171875, 4.33642578125, 4.740234375, 5.14404296875, 5.5478515625, 5.95166015625, 6.35546875, 6.75927734375, 7.1630859375, 7.56689453125, 7.970703125, 8.37451171875, 8.7783203125, 9.18212890625, 9.5859375, 9.98974609375, 10.3935546875, 10.79736328125, 11.201171875, 11.60498046875, 12.0087890625, 12.41259765625, 12.81640625, 13.22021484375, 13.6240234375, 14.02783203125, 14.431640625, 14.83544921875, 15.2392578125, 15.64306640625, 16.046875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 9.0, 14.0, 19.0, 32.0, 57.0, 85.0, 121.0, 205.0, 355.0, 649.0, 1143.0, 2085.0, 4112.0, 8601.0, 18427.0, 44306.0, 134230.0, 888950.0, 2804416.0, 186476.0, 57118.0, 22269.0, 10186.0, 4766.0, 2510.0, 1359.0, 727.0, 440.0, 245.0, 141.0, 81.0, 58.0, 44.0, 19.0, 12.0, 10.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.6875, -51.7783203125, -49.869140625, -47.9599609375, -46.05078125, -44.1416015625, -42.232421875, -40.3232421875, -38.4140625, -36.5048828125, -34.595703125, -32.6865234375, -30.77734375, -28.8681640625, -26.958984375, -25.0498046875, -23.140625, -21.2314453125, -19.322265625, -17.4130859375, -15.50390625, -13.5947265625, -11.685546875, -9.7763671875, -7.8671875, -5.9580078125, -4.048828125, -2.1396484375, -0.23046875, 1.6787109375, 3.587890625, 5.4970703125, 7.40625, 9.3154296875, 11.224609375, 13.1337890625, 15.04296875, 16.9521484375, 18.861328125, 20.7705078125, 22.6796875, 24.5888671875, 26.498046875, 28.4072265625, 30.31640625, 32.2255859375, 34.134765625, 36.0439453125, 37.953125, 39.8623046875, 41.771484375, 43.6806640625, 45.58984375, 47.4990234375, 49.408203125, 51.3173828125, 53.2265625, 55.1357421875, 57.044921875, 58.9541015625, 60.86328125, 62.7724609375, 64.681640625, 66.5908203125, 68.5]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 5.0, 5.0, 2.0, 11.0, 8.0, 8.0, 10.0, 18.0, 21.0, 25.0, 25.0, 41.0, 61.0, 79.0, 125.0, 216.0, 390.0, 1680.0, 575.0, 272.0, 145.0, 101.0, 50.0, 48.0, 37.0, 23.0, 18.0, 16.0, 19.0, 8.0, 8.0, 9.0, 6.0, 3.0, 5.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-23.75, -22.949951171875, -22.14990234375, -21.349853515625, -20.5498046875, -19.749755859375, -18.94970703125, -18.149658203125, -17.349609375, -16.549560546875, -15.74951171875, -14.949462890625, -14.1494140625, -13.349365234375, -12.54931640625, -11.749267578125, -10.94921875, -10.149169921875, -9.34912109375, -8.549072265625, -7.7490234375, -6.948974609375, -6.14892578125, -5.348876953125, -4.548828125, -3.748779296875, -2.94873046875, -2.148681640625, -1.3486328125, -0.548583984375, 0.25146484375, 1.051513671875, 1.8515625, 2.651611328125, 3.45166015625, 4.251708984375, 5.0517578125, 5.851806640625, 6.65185546875, 7.451904296875, 8.251953125, 9.052001953125, 9.85205078125, 10.652099609375, 11.4521484375, 12.252197265625, 13.05224609375, 13.852294921875, 14.65234375, 15.452392578125, 16.25244140625, 17.052490234375, 17.8525390625, 18.652587890625, 19.45263671875, 20.252685546875, 21.052734375, 21.852783203125, 22.65283203125, 23.452880859375, 24.2529296875, 25.052978515625, 25.85302734375, 26.653076171875, 27.453125]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 12.0, 11.0, 19.0, 33.0, 70.0, 131.0, 149.0, 163.0, 172.0, 100.0, 69.0, 35.0, 13.0, 14.0, 3.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-343.56982421875, -336.17041015625, -328.7710266113281, -321.3716125488281, -313.97222900390625, -306.57281494140625, -299.17340087890625, -291.7740173339844, -284.3746032714844, -276.9751892089844, -269.5758056640625, -262.1763916015625, -254.77699279785156, -247.37759399414062, -239.97817993164062, -232.5787811279297, -225.17938232421875, -217.7799835205078, -210.38058471679688, -202.98117065429688, -195.58177185058594, -188.182373046875, -180.782958984375, -173.38356018066406, -165.98416137695312, -158.5847625732422, -151.18536376953125, -143.78594970703125, -136.3865509033203, -128.98715209960938, -121.5877456665039, -114.18833923339844, -106.7889404296875, -99.38954162597656, -91.9901351928711, -84.59072875976562, -77.19132995605469, -69.79193115234375, -62.39252471923828, -54.99312210083008, -47.593719482421875, -40.19431686401367, -32.79491424560547, -25.395511627197266, -17.996109008789062, -10.59670639038086, -3.1973037719726562, 4.202098846435547, 11.60150146484375, 19.000904083251953, 26.400306701660156, 33.79970932006836, 41.19911193847656, 48.598514556884766, 55.99791717529297, 63.39731979370117, 70.79672241210938, 78.19612121582031, 85.59552764892578, 92.99493408203125, 100.39433288574219, 107.79373168945312, 115.1931381225586, 122.59254455566406, 129.991943359375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 0.0, 1.0, 3.0, 5.0, 6.0, 9.0, 17.0, 15.0, 14.0, 18.0, 28.0, 23.0, 24.0, 31.0, 40.0, 27.0, 39.0, 42.0, 44.0, 38.0, 47.0, 51.0, 45.0, 41.0, 35.0, 40.0, 40.0, 37.0, 26.0, 29.0, 29.0, 35.0, 23.0, 23.0, 15.0, 14.0, 13.0, 2.0, 10.0, 7.0, 5.0, 5.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-83.47816467285156, -80.70133209228516, -77.92449951171875, -75.14766693115234, -72.37083435058594, -69.59400939941406, -66.81717681884766, -64.04034423828125, -61.263511657714844, -58.48667907714844, -55.70984649658203, -52.93301773071289, -50.156185150146484, -47.37935256958008, -44.60252380371094, -41.82569122314453, -39.048858642578125, -36.27202606201172, -33.49519348144531, -30.718364715576172, -27.941532135009766, -25.16469955444336, -22.387868881225586, -19.611038208007812, -16.834205627441406, -14.057374000549316, -11.280542373657227, -8.503710746765137, -5.726879119873047, -2.950047492980957, -0.1732158660888672, 2.6036148071289062, 5.380455017089844, 8.157286643981934, 10.934118270874023, 13.710949897766113, 16.487781524658203, 19.26461410522461, 22.041444778442383, 24.818275451660156, 27.595108032226562, 30.37194061279297, 33.148773193359375, 35.925601959228516, 38.70243453979492, 41.47926712036133, 44.25609588623047, 47.032928466796875, 49.80976104736328, 52.58659362792969, 55.363426208496094, 58.140254974365234, 60.91708755493164, 63.69392013549805, 66.47074890136719, 69.2475814819336, 72.0244140625, 74.8012466430664, 77.57807922363281, 80.35491180419922, 83.13174438476562, 85.9085693359375, 88.6854019165039, 91.46223449707031, 94.23906707763672]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 6.0, 6.0, 7.0, 10.0, 11.0, 16.0, 18.0, 36.0, 71.0, 76.0, 137.0, 202.0, 363.0, 666.0, 1440.0, 3881.0, 12204.0, 46152.0, 187579.0, 533488.0, 194376.0, 47930.0, 12758.0, 3972.0, 1534.0, 694.0, 339.0, 215.0, 103.0, 75.0, 62.0, 45.0, 16.0, 21.0, 15.0, 12.0, 12.0, 3.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-101.75, -98.7138671875, -95.677734375, -92.6416015625, -89.60546875, -86.5693359375, -83.533203125, -80.4970703125, -77.4609375, -74.4248046875, -71.388671875, -68.3525390625, -65.31640625, -62.2802734375, -59.244140625, -56.2080078125, -53.171875, -50.1357421875, -47.099609375, -44.0634765625, -41.02734375, -37.9912109375, -34.955078125, -31.9189453125, -28.8828125, -25.8466796875, -22.810546875, -19.7744140625, -16.73828125, -13.7021484375, -10.666015625, -7.6298828125, -4.59375, -1.5576171875, 1.478515625, 4.5146484375, 7.55078125, 10.5869140625, 13.623046875, 16.6591796875, 19.6953125, 22.7314453125, 25.767578125, 28.8037109375, 31.83984375, 34.8759765625, 37.912109375, 40.9482421875, 43.984375, 47.0205078125, 50.056640625, 53.0927734375, 56.12890625, 59.1650390625, 62.201171875, 65.2373046875, 68.2734375, 71.3095703125, 74.345703125, 77.3818359375, 80.41796875, 83.4541015625, 86.490234375, 89.5263671875, 92.5625]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 8.0, 6.0, 9.0, 10.0, 11.0, 11.0, 16.0, 25.0, 33.0, 36.0, 32.0, 40.0, 49.0, 52.0, 65.0, 47.0, 53.0, 61.0, 41.0, 69.0, 49.0, 46.0, 44.0, 36.0, 40.0, 19.0, 28.0, 11.0, 15.0, 12.0, 10.0, 7.0, 4.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.765625, -9.355712890625, -8.94580078125, -8.535888671875, -8.1259765625, -7.716064453125, -7.30615234375, -6.896240234375, -6.486328125, -6.076416015625, -5.66650390625, -5.256591796875, -4.8466796875, -4.436767578125, -4.02685546875, -3.616943359375, -3.20703125, -2.797119140625, -2.38720703125, -1.977294921875, -1.5673828125, -1.157470703125, -0.74755859375, -0.337646484375, 0.072265625, 0.482177734375, 0.89208984375, 1.302001953125, 1.7119140625, 2.121826171875, 2.53173828125, 2.941650390625, 3.3515625, 3.761474609375, 4.17138671875, 4.581298828125, 4.9912109375, 5.401123046875, 5.81103515625, 6.220947265625, 6.630859375, 7.040771484375, 7.45068359375, 7.860595703125, 8.2705078125, 8.680419921875, 9.09033203125, 9.500244140625, 9.91015625, 10.320068359375, 10.72998046875, 11.139892578125, 11.5498046875, 11.959716796875, 12.36962890625, 12.779541015625, 13.189453125, 13.599365234375, 14.00927734375, 14.419189453125, 14.8291015625, 15.239013671875, 15.64892578125, 16.058837890625, 16.46875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 8.0, 3.0, 12.0, 12.0, 28.0, 37.0, 46.0, 51.0, 100.0, 110.0, 137.0, 174.0, 316.0, 450.0, 700.0, 1269.0, 2858.0, 7523.0, 23610.0, 78446.0, 273456.0, 450735.0, 143987.0, 42637.0, 12734.0, 4573.0, 1857.0, 927.0, 552.0, 331.0, 251.0, 192.0, 95.0, 89.0, 67.0, 59.0, 25.0, 32.0, 17.0, 14.0, 15.0, 13.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-58.25, -56.3857421875, -54.521484375, -52.6572265625, -50.79296875, -48.9287109375, -47.064453125, -45.2001953125, -43.3359375, -41.4716796875, -39.607421875, -37.7431640625, -35.87890625, -34.0146484375, -32.150390625, -30.2861328125, -28.421875, -26.5576171875, -24.693359375, -22.8291015625, -20.96484375, -19.1005859375, -17.236328125, -15.3720703125, -13.5078125, -11.6435546875, -9.779296875, -7.9150390625, -6.05078125, -4.1865234375, -2.322265625, -0.4580078125, 1.40625, 3.2705078125, 5.134765625, 6.9990234375, 8.86328125, 10.7275390625, 12.591796875, 14.4560546875, 16.3203125, 18.1845703125, 20.048828125, 21.9130859375, 23.77734375, 25.6416015625, 27.505859375, 29.3701171875, 31.234375, 33.0986328125, 34.962890625, 36.8271484375, 38.69140625, 40.5556640625, 42.419921875, 44.2841796875, 46.1484375, 48.0126953125, 49.876953125, 51.7412109375, 53.60546875, 55.4697265625, 57.333984375, 59.1982421875, 61.0625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 0.0, 6.0, 6.0, 10.0, 10.0, 23.0, 20.0, 14.0, 19.0, 17.0, 28.0, 41.0, 33.0, 38.0, 39.0, 45.0, 43.0, 47.0, 60.0, 51.0, 39.0, 58.0, 43.0, 37.0, 37.0, 31.0, 38.0, 23.0, 28.0, 21.0, 19.0, 18.0, 8.0, 12.0, 14.0, 5.0, 4.0, 8.0, 3.0, 3.0, 2.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.0, -44.46484375, -42.9296875, -41.39453125, -39.859375, -38.32421875, -36.7890625, -35.25390625, -33.71875, -32.18359375, -30.6484375, -29.11328125, -27.578125, -26.04296875, -24.5078125, -22.97265625, -21.4375, -19.90234375, -18.3671875, -16.83203125, -15.296875, -13.76171875, -12.2265625, -10.69140625, -9.15625, -7.62109375, -6.0859375, -4.55078125, -3.015625, -1.48046875, 0.0546875, 1.58984375, 3.125, 4.66015625, 6.1953125, 7.73046875, 9.265625, 10.80078125, 12.3359375, 13.87109375, 15.40625, 16.94140625, 18.4765625, 20.01171875, 21.546875, 23.08203125, 24.6171875, 26.15234375, 27.6875, 29.22265625, 30.7578125, 32.29296875, 33.828125, 35.36328125, 36.8984375, 38.43359375, 39.96875, 41.50390625, 43.0390625, 44.57421875, 46.109375, 47.64453125, 49.1796875, 50.71484375, 52.25]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 4.0, 4.0, 10.0, 23.0, 16.0, 23.0, 33.0, 73.0, 94.0, 142.0, 233.0, 405.0, 792.0, 1753.0, 4483.0, 14950.0, 71540.0, 506048.0, 376111.0, 52851.0, 11925.0, 3812.0, 1525.0, 716.0, 384.0, 209.0, 121.0, 81.0, 53.0, 36.0, 32.0, 19.0, 14.0, 14.0, 8.0, 5.0, 7.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-41.0625, -39.81494140625, -38.5673828125, -37.31982421875, -36.072265625, -34.82470703125, -33.5771484375, -32.32958984375, -31.08203125, -29.83447265625, -28.5869140625, -27.33935546875, -26.091796875, -24.84423828125, -23.5966796875, -22.34912109375, -21.1015625, -19.85400390625, -18.6064453125, -17.35888671875, -16.111328125, -14.86376953125, -13.6162109375, -12.36865234375, -11.12109375, -9.87353515625, -8.6259765625, -7.37841796875, -6.130859375, -4.88330078125, -3.6357421875, -2.38818359375, -1.140625, 0.10693359375, 1.3544921875, 2.60205078125, 3.849609375, 5.09716796875, 6.3447265625, 7.59228515625, 8.83984375, 10.08740234375, 11.3349609375, 12.58251953125, 13.830078125, 15.07763671875, 16.3251953125, 17.57275390625, 18.8203125, 20.06787109375, 21.3154296875, 22.56298828125, 23.810546875, 25.05810546875, 26.3056640625, 27.55322265625, 28.80078125, 30.04833984375, 31.2958984375, 32.54345703125, 33.791015625, 35.03857421875, 36.2861328125, 37.53369140625, 38.78125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 5.0, 3.0, 11.0, 16.0, 22.0, 35.0, 50.0, 79.0, 158.0, 200.0, 166.0, 83.0, 61.0, 37.0, 35.0, 9.0, 13.0, 3.0, 9.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007717132568359375, -0.007426202297210693, -0.007135272026062012, -0.00684434175491333, -0.0065534114837646484, -0.006262481212615967, -0.005971550941467285, -0.0056806206703186035, -0.005389690399169922, -0.00509876012802124, -0.004807829856872559, -0.004516899585723877, -0.004225969314575195, -0.003935039043426514, -0.003644108772277832, -0.0033531785011291504, -0.0030622482299804688, -0.002771317958831787, -0.0024803876876831055, -0.002189457416534424, -0.0018985271453857422, -0.0016075968742370605, -0.001316666603088379, -0.0010257363319396973, -0.0007348060607910156, -0.000443875789642334, -0.00015294551849365234, 0.0001379847526550293, 0.00042891502380371094, 0.0007198452949523926, 0.0010107755661010742, 0.0013017058372497559, 0.0015926361083984375, 0.0018835663795471191, 0.0021744966506958008, 0.0024654269218444824, 0.002756357192993164, 0.0030472874641418457, 0.0033382177352905273, 0.003629148006439209, 0.003920078277587891, 0.004211008548736572, 0.004501938819885254, 0.0047928690910339355, 0.005083799362182617, 0.005374729633331299, 0.0056656599044799805, 0.005956590175628662, 0.006247520446777344, 0.006538450717926025, 0.006829380989074707, 0.007120311260223389, 0.00741124153137207, 0.007702171802520752, 0.007993102073669434, 0.008284032344818115, 0.008574962615966797, 0.008865892887115479, 0.00915682315826416, 0.009447753429412842, 0.009738683700561523, 0.010029613971710205, 0.010320544242858887, 0.010611474514007568, 0.01090240478515625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 6.0, 5.0, 15.0, 13.0, 29.0, 57.0, 116.0, 226.0, 443.0, 1085.0, 3105.0, 13801.0, 144948.0, 790031.0, 81012.0, 9619.0, 2397.0, 926.0, 338.0, 178.0, 109.0, 38.0, 29.0, 13.0, 7.0, 5.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.125, -70.08740234375, -68.0498046875, -66.01220703125, -63.974609375, -61.93701171875, -59.8994140625, -57.86181640625, -55.82421875, -53.78662109375, -51.7490234375, -49.71142578125, -47.673828125, -45.63623046875, -43.5986328125, -41.56103515625, -39.5234375, -37.48583984375, -35.4482421875, -33.41064453125, -31.373046875, -29.33544921875, -27.2978515625, -25.26025390625, -23.22265625, -21.18505859375, -19.1474609375, -17.10986328125, -15.072265625, -13.03466796875, -10.9970703125, -8.95947265625, -6.921875, -4.88427734375, -2.8466796875, -0.80908203125, 1.228515625, 3.26611328125, 5.3037109375, 7.34130859375, 9.37890625, 11.41650390625, 13.4541015625, 15.49169921875, 17.529296875, 19.56689453125, 21.6044921875, 23.64208984375, 25.6796875, 27.71728515625, 29.7548828125, 31.79248046875, 33.830078125, 35.86767578125, 37.9052734375, 39.94287109375, 41.98046875, 44.01806640625, 46.0556640625, 48.09326171875, 50.130859375, 52.16845703125, 54.2060546875, 56.24365234375, 58.28125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 3.0, 3.0, 4.0, 9.0, 6.0, 13.0, 20.0, 31.0, 48.0, 85.0, 112.0, 147.0, 159.0, 126.0, 76.0, 64.0, 33.0, 27.0, 17.0, 11.0, 11.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-68.0, -66.584716796875, -65.16943359375, -63.754150390625, -62.3388671875, -60.923583984375, -59.50830078125, -58.093017578125, -56.677734375, -55.262451171875, -53.84716796875, -52.431884765625, -51.0166015625, -49.601318359375, -48.18603515625, -46.770751953125, -45.35546875, -43.940185546875, -42.52490234375, -41.109619140625, -39.6943359375, -38.279052734375, -36.86376953125, -35.448486328125, -34.033203125, -32.617919921875, -31.20263671875, -29.787353515625, -28.3720703125, -26.956787109375, -25.54150390625, -24.126220703125, -22.7109375, -21.295654296875, -19.88037109375, -18.465087890625, -17.0498046875, -15.634521484375, -14.21923828125, -12.803955078125, -11.388671875, -9.973388671875, -8.55810546875, -7.142822265625, -5.7275390625, -4.312255859375, -2.89697265625, -1.481689453125, -0.06640625, 1.348876953125, 2.76416015625, 4.179443359375, 5.5947265625, 7.010009765625, 8.42529296875, 9.840576171875, 11.255859375, 12.671142578125, 14.08642578125, 15.501708984375, 16.9169921875, 18.332275390625, 19.74755859375, 21.162841796875, 22.578125]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 9.0, 4.0, 10.0, 32.0, 56.0, 78.0, 120.0, 142.0, 139.0, 119.0, 109.0, 67.0, 53.0, 23.0, 23.0, 8.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-708.301025390625, -691.5404663085938, -674.7799682617188, -658.0194091796875, -641.2589111328125, -624.4983520507812, -607.73779296875, -590.977294921875, -574.2167358398438, -557.4561767578125, -540.6956787109375, -523.9351196289062, -507.1745910644531, -490.4140625, -473.6535339355469, -456.89300537109375, -440.1324768066406, -423.3719482421875, -406.6114196777344, -389.85089111328125, -373.09033203125, -356.3298034667969, -339.56927490234375, -322.8087463378906, -306.0482177734375, -289.2876892089844, -272.52716064453125, -255.76661682128906, -239.00607299804688, -222.24554443359375, -205.48501586914062, -188.7244873046875, -171.96389770507812, -155.203369140625, -138.4428253173828, -121.68229675292969, -104.92176055908203, -88.16122436523438, -71.40069580078125, -54.640159606933594, -37.87962341308594, -21.119089126586914, -4.358554840087891, 12.4019775390625, 29.162513732910156, 45.92304992675781, 62.68357849121094, 79.4441146850586, 96.20465087890625, 112.9651870727539, 129.72572326660156, 146.4862518310547, 163.24679565429688, 180.00732421875, 196.76785278320312, 213.52838134765625, 230.28892517089844, 247.04945373535156, 263.80999755859375, 280.5705261230469, 297.3310546875, 314.09161376953125, 330.85211181640625, 347.6126708984375, 364.3731994628906]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 5.0, 7.0, 6.0, 5.0, 6.0, 8.0, 12.0, 7.0, 13.0, 27.0, 25.0, 23.0, 21.0, 17.0, 37.0, 38.0, 31.0, 29.0, 41.0, 43.0, 37.0, 43.0, 50.0, 41.0, 46.0, 32.0, 40.0, 51.0, 34.0, 43.0, 24.0, 29.0, 30.0, 14.0, 15.0, 16.0, 8.0, 10.0, 12.0, 8.0, 3.0, 7.0, 2.0, 5.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-236.30807495117188, -228.4667510986328, -220.62542724609375, -212.78408813476562, -204.94276428222656, -197.1014404296875, -189.26011657714844, -181.41879272460938, -173.57745361328125, -165.7361297607422, -157.89480590820312, -150.053466796875, -142.21214294433594, -134.37081909179688, -126.52949523925781, -118.68817138671875, -110.84684753417969, -103.00552368164062, -95.16419219970703, -87.32286834716797, -79.48153686523438, -71.64021301269531, -63.79888916015625, -55.95756149291992, -48.116233825683594, -40.274906158447266, -32.43357849121094, -24.592254638671875, -16.750926971435547, -8.909599304199219, -1.0682754516601562, 6.773052215576172, 14.6143798828125, 22.455707550048828, 30.297033309936523, 38.13835906982422, 45.97968673706055, 53.821014404296875, 61.66233825683594, 69.503662109375, 77.3449935913086, 85.18631744384766, 93.02764892578125, 100.86897277832031, 108.71029663085938, 116.55162811279297, 124.39295196533203, 132.23428344726562, 140.0756072998047, 147.91693115234375, 155.7582550048828, 163.59957885742188, 171.44091796875, 179.28224182128906, 187.12356567382812, 194.9648895263672, 202.80621337890625, 210.6475372314453, 218.48886108398438, 226.3302001953125, 234.17152404785156, 242.01284790039062, 249.8541717529297, 257.69549560546875, 265.5368347167969]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 2.0, 8.0, 3.0, 6.0, 8.0, 13.0, 13.0, 31.0, 30.0, 45.0, 102.0, 152.0, 212.0, 388.0, 757.0, 1526.0, 3788.0, 10600.0, 36987.0, 186378.0, 3402576.0, 459325.0, 64516.0, 16661.0, 5505.0, 2258.0, 1020.0, 565.0, 297.0, 175.0, 110.0, 61.0, 37.0, 45.0, 24.0, 22.0, 15.0, 6.0, 2.0, 4.0, 6.0, 5.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-109.3125, -106.068359375, -102.82421875, -99.580078125, -96.3359375, -93.091796875, -89.84765625, -86.603515625, -83.359375, -80.115234375, -76.87109375, -73.626953125, -70.3828125, -67.138671875, -63.89453125, -60.650390625, -57.40625, -54.162109375, -50.91796875, -47.673828125, -44.4296875, -41.185546875, -37.94140625, -34.697265625, -31.453125, -28.208984375, -24.96484375, -21.720703125, -18.4765625, -15.232421875, -11.98828125, -8.744140625, -5.5, -2.255859375, 0.98828125, 4.232421875, 7.4765625, 10.720703125, 13.96484375, 17.208984375, 20.453125, 23.697265625, 26.94140625, 30.185546875, 33.4296875, 36.673828125, 39.91796875, 43.162109375, 46.40625, 49.650390625, 52.89453125, 56.138671875, 59.3828125, 62.626953125, 65.87109375, 69.115234375, 72.359375, 75.603515625, 78.84765625, 82.091796875, 85.3359375, 88.580078125, 91.82421875, 95.068359375, 98.3125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 3.0, 3.0, 4.0, 4.0, 9.0, 8.0, 12.0, 19.0, 13.0, 16.0, 23.0, 25.0, 29.0, 38.0, 52.0, 52.0, 38.0, 56.0, 52.0, 48.0, 46.0, 74.0, 56.0, 56.0, 52.0, 35.0, 27.0, 39.0, 38.0, 17.0, 13.0, 13.0, 6.0, 8.0, 11.0, 5.0, 5.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.1015625, -10.685791015625, -10.27001953125, -9.854248046875, -9.4384765625, -9.022705078125, -8.60693359375, -8.191162109375, -7.775390625, -7.359619140625, -6.94384765625, -6.528076171875, -6.1123046875, -5.696533203125, -5.28076171875, -4.864990234375, -4.44921875, -4.033447265625, -3.61767578125, -3.201904296875, -2.7861328125, -2.370361328125, -1.95458984375, -1.538818359375, -1.123046875, -0.707275390625, -0.29150390625, 0.124267578125, 0.5400390625, 0.955810546875, 1.37158203125, 1.787353515625, 2.203125, 2.618896484375, 3.03466796875, 3.450439453125, 3.8662109375, 4.281982421875, 4.69775390625, 5.113525390625, 5.529296875, 5.945068359375, 6.36083984375, 6.776611328125, 7.1923828125, 7.608154296875, 8.02392578125, 8.439697265625, 8.85546875, 9.271240234375, 9.68701171875, 10.102783203125, 10.5185546875, 10.934326171875, 11.35009765625, 11.765869140625, 12.181640625, 12.597412109375, 13.01318359375, 13.428955078125, 13.8447265625, 14.260498046875, 14.67626953125, 15.092041015625, 15.5078125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 6.0, 5.0, 13.0, 15.0, 20.0, 30.0, 50.0, 79.0, 90.0, 153.0, 213.0, 353.0, 584.0, 980.0, 1835.0, 3696.0, 8148.0, 20534.0, 61071.0, 235467.0, 2550557.0, 1075088.0, 160238.0, 45567.0, 15967.0, 6683.0, 3019.0, 1527.0, 912.0, 469.0, 309.0, 188.0, 136.0, 79.0, 72.0, 41.0, 33.0, 19.0, 10.0, 6.0, 5.0, 7.0, 7.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.0625, -51.224609375, -49.38671875, -47.548828125, -45.7109375, -43.873046875, -42.03515625, -40.197265625, -38.359375, -36.521484375, -34.68359375, -32.845703125, -31.0078125, -29.169921875, -27.33203125, -25.494140625, -23.65625, -21.818359375, -19.98046875, -18.142578125, -16.3046875, -14.466796875, -12.62890625, -10.791015625, -8.953125, -7.115234375, -5.27734375, -3.439453125, -1.6015625, 0.236328125, 2.07421875, 3.912109375, 5.75, 7.587890625, 9.42578125, 11.263671875, 13.1015625, 14.939453125, 16.77734375, 18.615234375, 20.453125, 22.291015625, 24.12890625, 25.966796875, 27.8046875, 29.642578125, 31.48046875, 33.318359375, 35.15625, 36.994140625, 38.83203125, 40.669921875, 42.5078125, 44.345703125, 46.18359375, 48.021484375, 49.859375, 51.697265625, 53.53515625, 55.373046875, 57.2109375, 59.048828125, 60.88671875, 62.724609375, 64.5625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 7.0, 5.0, 7.0, 12.0, 21.0, 34.0, 42.0, 60.0, 74.0, 107.0, 192.0, 308.0, 697.0, 1321.0, 462.0, 255.0, 158.0, 87.0, 60.0, 48.0, 34.0, 19.0, 15.0, 16.0, 11.0, 8.0, 2.0, 5.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-47.34375, -46.250244140625, -45.15673828125, -44.063232421875, -42.9697265625, -41.876220703125, -40.78271484375, -39.689208984375, -38.595703125, -37.502197265625, -36.40869140625, -35.315185546875, -34.2216796875, -33.128173828125, -32.03466796875, -30.941162109375, -29.84765625, -28.754150390625, -27.66064453125, -26.567138671875, -25.4736328125, -24.380126953125, -23.28662109375, -22.193115234375, -21.099609375, -20.006103515625, -18.91259765625, -17.819091796875, -16.7255859375, -15.632080078125, -14.53857421875, -13.445068359375, -12.3515625, -11.258056640625, -10.16455078125, -9.071044921875, -7.9775390625, -6.884033203125, -5.79052734375, -4.697021484375, -3.603515625, -2.510009765625, -1.41650390625, -0.322998046875, 0.7705078125, 1.864013671875, 2.95751953125, 4.051025390625, 5.14453125, 6.238037109375, 7.33154296875, 8.425048828125, 9.5185546875, 10.612060546875, 11.70556640625, 12.799072265625, 13.892578125, 14.986083984375, 16.07958984375, 17.173095703125, 18.2666015625, 19.360107421875, 20.45361328125, 21.547119140625, 22.640625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 7.0, 12.0, 12.0, 37.0, 41.0, 84.0, 109.0, 167.0, 159.0, 126.0, 95.0, 53.0, 38.0, 27.0, 11.0, 7.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-399.27655029296875, -389.57904052734375, -379.88153076171875, -370.1840515136719, -360.4865417480469, -350.7890319824219, -341.0915222167969, -331.39404296875, -321.696533203125, -311.9990234375, -302.301513671875, -292.6040344238281, -282.9065246582031, -273.2090148925781, -263.5115051269531, -253.8140106201172, -244.1165008544922, -234.4189910888672, -224.72149658203125, -215.02398681640625, -205.3264923095703, -195.6289825439453, -185.93148803710938, -176.23397827148438, -166.53646850585938, -156.83895874023438, -147.14146423339844, -137.44395446777344, -127.7464599609375, -118.0489501953125, -108.35144805908203, -98.65394592285156, -88.95643615722656, -79.2589340209961, -69.56143188476562, -59.86392593383789, -50.16642379760742, -40.46892166137695, -30.77141571044922, -21.07391357421875, -11.376411437988281, -1.678908348083496, 8.018594741821289, 17.71609878540039, 27.41360092163086, 37.11110305786133, 46.80860900878906, 56.50611114501953, 66.20361328125, 75.90111541748047, 85.59861755371094, 95.29612731933594, 104.99362182617188, 114.69113159179688, 124.38863372802734, 134.0861358642578, 143.78363037109375, 153.48114013671875, 163.1786346435547, 172.8761444091797, 182.57363891601562, 192.27114868164062, 201.96865844726562, 211.66615295410156, 221.36366271972656]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 7.0, 9.0, 11.0, 7.0, 11.0, 11.0, 21.0, 27.0, 20.0, 32.0, 44.0, 36.0, 39.0, 38.0, 42.0, 45.0, 41.0, 41.0, 55.0, 41.0, 53.0, 62.0, 51.0, 35.0, 36.0, 24.0, 33.0, 18.0, 19.0, 24.0, 10.0, 18.0, 5.0, 12.0, 3.0, 2.0, 4.0, 9.0, 3.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-130.43902587890625, -126.33580780029297, -122.23258209228516, -118.12936401367188, -114.02613830566406, -109.92292022705078, -105.8197021484375, -101.71647644042969, -97.61325073242188, -93.5100326538086, -89.40680694580078, -85.3035888671875, -81.20036315917969, -77.0971450805664, -72.99392700195312, -68.89070129394531, -64.78748321533203, -60.684261322021484, -56.58103942871094, -52.477821350097656, -48.374595642089844, -44.27137756347656, -40.168155670166016, -36.06493377685547, -31.961711883544922, -27.858489990234375, -23.755268096923828, -19.652048110961914, -15.548826217651367, -11.44560432434082, -7.342384338378906, -3.2391624450683594, 0.8640594482421875, 4.967280864715576, 9.070502281188965, 13.173723220825195, 17.276945114135742, 21.38016700744629, 25.483386993408203, 29.58660888671875, 33.6898307800293, 37.793052673339844, 41.89627456665039, 45.99949645996094, 50.10271453857422, 54.20594024658203, 58.30915832519531, 62.41238021850586, 66.5156021118164, 70.61882019042969, 74.7220458984375, 78.82526397705078, 82.9284896850586, 87.03170776367188, 91.13493347167969, 95.23815155029297, 99.34136962890625, 103.44458770751953, 107.54781341552734, 111.65103149414062, 115.75425720214844, 119.85747528076172, 123.960693359375, 128.0639190673828, 132.16714477539062]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 5.0, 6.0, 7.0, 11.0, 14.0, 16.0, 27.0, 21.0, 66.0, 94.0, 124.0, 236.0, 320.0, 577.0, 1102.0, 2573.0, 6488.0, 18211.0, 59781.0, 200771.0, 407529.0, 241080.0, 73454.0, 22336.0, 7711.0, 2985.0, 1331.0, 700.0, 338.0, 209.0, 134.0, 84.0, 62.0, 46.0, 28.0, 17.0, 20.0, 11.0, 5.0, 8.0, 9.0, 2.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-80.9375, -78.6630859375, -76.388671875, -74.1142578125, -71.83984375, -69.5654296875, -67.291015625, -65.0166015625, -62.7421875, -60.4677734375, -58.193359375, -55.9189453125, -53.64453125, -51.3701171875, -49.095703125, -46.8212890625, -44.546875, -42.2724609375, -39.998046875, -37.7236328125, -35.44921875, -33.1748046875, -30.900390625, -28.6259765625, -26.3515625, -24.0771484375, -21.802734375, -19.5283203125, -17.25390625, -14.9794921875, -12.705078125, -10.4306640625, -8.15625, -5.8818359375, -3.607421875, -1.3330078125, 0.94140625, 3.2158203125, 5.490234375, 7.7646484375, 10.0390625, 12.3134765625, 14.587890625, 16.8623046875, 19.13671875, 21.4111328125, 23.685546875, 25.9599609375, 28.234375, 30.5087890625, 32.783203125, 35.0576171875, 37.33203125, 39.6064453125, 41.880859375, 44.1552734375, 46.4296875, 48.7041015625, 50.978515625, 53.2529296875, 55.52734375, 57.8017578125, 60.076171875, 62.3505859375, 64.625]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 2.0, 3.0, 4.0, 3.0, 7.0, 8.0, 7.0, 8.0, 11.0, 15.0, 21.0, 20.0, 37.0, 27.0, 36.0, 46.0, 43.0, 50.0, 62.0, 49.0, 50.0, 59.0, 51.0, 57.0, 58.0, 33.0, 47.0, 44.0, 25.0, 31.0, 19.0, 17.0, 15.0, 9.0, 8.0, 8.0, 5.0, 3.0, 3.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.453125, -10.0146484375, -9.576171875, -9.1376953125, -8.69921875, -8.2607421875, -7.822265625, -7.3837890625, -6.9453125, -6.5068359375, -6.068359375, -5.6298828125, -5.19140625, -4.7529296875, -4.314453125, -3.8759765625, -3.4375, -2.9990234375, -2.560546875, -2.1220703125, -1.68359375, -1.2451171875, -0.806640625, -0.3681640625, 0.0703125, 0.5087890625, 0.947265625, 1.3857421875, 1.82421875, 2.2626953125, 2.701171875, 3.1396484375, 3.578125, 4.0166015625, 4.455078125, 4.8935546875, 5.33203125, 5.7705078125, 6.208984375, 6.6474609375, 7.0859375, 7.5244140625, 7.962890625, 8.4013671875, 8.83984375, 9.2783203125, 9.716796875, 10.1552734375, 10.59375, 11.0322265625, 11.470703125, 11.9091796875, 12.34765625, 12.7861328125, 13.224609375, 13.6630859375, 14.1015625, 14.5400390625, 14.978515625, 15.4169921875, 15.85546875, 16.2939453125, 16.732421875, 17.1708984375, 17.609375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 6.0, 6.0, 6.0, 7.0, 8.0, 11.0, 21.0, 19.0, 25.0, 43.0, 40.0, 81.0, 105.0, 130.0, 246.0, 311.0, 491.0, 739.0, 1424.0, 2911.0, 7377.0, 23383.0, 82152.0, 290311.0, 425137.0, 151113.0, 40832.0, 12404.0, 4449.0, 1906.0, 1034.0, 602.0, 355.0, 245.0, 163.0, 117.0, 80.0, 89.0, 50.0, 32.0, 31.0, 24.0, 12.0, 14.0, 4.0, 4.0, 1.0, 6.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-65.1875, -63.1650390625, -61.142578125, -59.1201171875, -57.09765625, -55.0751953125, -53.052734375, -51.0302734375, -49.0078125, -46.9853515625, -44.962890625, -42.9404296875, -40.91796875, -38.8955078125, -36.873046875, -34.8505859375, -32.828125, -30.8056640625, -28.783203125, -26.7607421875, -24.73828125, -22.7158203125, -20.693359375, -18.6708984375, -16.6484375, -14.6259765625, -12.603515625, -10.5810546875, -8.55859375, -6.5361328125, -4.513671875, -2.4912109375, -0.46875, 1.5537109375, 3.576171875, 5.5986328125, 7.62109375, 9.6435546875, 11.666015625, 13.6884765625, 15.7109375, 17.7333984375, 19.755859375, 21.7783203125, 23.80078125, 25.8232421875, 27.845703125, 29.8681640625, 31.890625, 33.9130859375, 35.935546875, 37.9580078125, 39.98046875, 42.0029296875, 44.025390625, 46.0478515625, 48.0703125, 50.0927734375, 52.115234375, 54.1376953125, 56.16015625, 58.1826171875, 60.205078125, 62.2275390625, 64.25]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 7.0, 4.0, 3.0, 6.0, 6.0, 12.0, 8.0, 11.0, 20.0, 13.0, 22.0, 25.0, 23.0, 32.0, 30.0, 37.0, 26.0, 41.0, 38.0, 34.0, 39.0, 37.0, 43.0, 40.0, 45.0, 43.0, 39.0, 28.0, 36.0, 29.0, 28.0, 27.0, 27.0, 18.0, 17.0, 12.0, 23.0, 13.0, 13.0, 13.0, 9.0, 6.0, 7.0, 0.0, 4.0, 4.0, 3.0, 2.0, 3.0, 0.0, 3.0, 0.0, 1.0], "bins": [-51.9375, -50.376953125, -48.81640625, -47.255859375, -45.6953125, -44.134765625, -42.57421875, -41.013671875, -39.453125, -37.892578125, -36.33203125, -34.771484375, -33.2109375, -31.650390625, -30.08984375, -28.529296875, -26.96875, -25.408203125, -23.84765625, -22.287109375, -20.7265625, -19.166015625, -17.60546875, -16.044921875, -14.484375, -12.923828125, -11.36328125, -9.802734375, -8.2421875, -6.681640625, -5.12109375, -3.560546875, -2.0, -0.439453125, 1.12109375, 2.681640625, 4.2421875, 5.802734375, 7.36328125, 8.923828125, 10.484375, 12.044921875, 13.60546875, 15.166015625, 16.7265625, 18.287109375, 19.84765625, 21.408203125, 22.96875, 24.529296875, 26.08984375, 27.650390625, 29.2109375, 30.771484375, 32.33203125, 33.892578125, 35.453125, 37.013671875, 38.57421875, 40.134765625, 41.6953125, 43.255859375, 44.81640625, 46.376953125, 47.9375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 6.0, 7.0, 13.0, 14.0, 21.0, 27.0, 47.0, 103.0, 134.0, 248.0, 421.0, 777.0, 1410.0, 3036.0, 7161.0, 20018.0, 64567.0, 217923.0, 420413.0, 214842.0, 64269.0, 19735.0, 7078.0, 3089.0, 1413.0, 744.0, 426.0, 236.0, 133.0, 80.0, 46.0, 34.0, 25.0, 14.0, 8.0, 12.0, 7.0, 6.0, 0.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.984375, -27.173095703125, -26.36181640625, -25.550537109375, -24.7392578125, -23.927978515625, -23.11669921875, -22.305419921875, -21.494140625, -20.682861328125, -19.87158203125, -19.060302734375, -18.2490234375, -17.437744140625, -16.62646484375, -15.815185546875, -15.00390625, -14.192626953125, -13.38134765625, -12.570068359375, -11.7587890625, -10.947509765625, -10.13623046875, -9.324951171875, -8.513671875, -7.702392578125, -6.89111328125, -6.079833984375, -5.2685546875, -4.457275390625, -3.64599609375, -2.834716796875, -2.0234375, -1.212158203125, -0.40087890625, 0.410400390625, 1.2216796875, 2.032958984375, 2.84423828125, 3.655517578125, 4.466796875, 5.278076171875, 6.08935546875, 6.900634765625, 7.7119140625, 8.523193359375, 9.33447265625, 10.145751953125, 10.95703125, 11.768310546875, 12.57958984375, 13.390869140625, 14.2021484375, 15.013427734375, 15.82470703125, 16.635986328125, 17.447265625, 18.258544921875, 19.06982421875, 19.881103515625, 20.6923828125, 21.503662109375, 22.31494140625, 23.126220703125, 23.9375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 6.0, 7.0, 9.0, 11.0, 18.0, 16.0, 17.0, 31.0, 42.0, 41.0, 40.0, 50.0, 53.0, 62.0, 49.0, 53.0, 62.0, 58.0, 58.0, 52.0, 44.0, 34.0, 32.0, 31.0, 23.0, 13.0, 26.0, 11.0, 9.0, 6.0, 7.0, 7.0, 7.0, 2.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002956390380859375, -0.002844691276550293, -0.002732992172241211, -0.002621293067932129, -0.002509593963623047, -0.002397894859313965, -0.002286195755004883, -0.0021744966506958008, -0.0020627975463867188, -0.0019510984420776367, -0.0018393993377685547, -0.0017277002334594727, -0.0016160011291503906, -0.0015043020248413086, -0.0013926029205322266, -0.0012809038162231445, -0.0011692047119140625, -0.0010575056076049805, -0.0009458065032958984, -0.0008341073989868164, -0.0007224082946777344, -0.0006107091903686523, -0.0004990100860595703, -0.0003873109817504883, -0.00027561187744140625, -0.00016391277313232422, -5.221366882324219e-05, 5.9485435485839844e-05, 0.00017118453979492188, 0.0002828836441040039, 0.00039458274841308594, 0.000506281852722168, 0.00061798095703125, 0.000729680061340332, 0.0008413791656494141, 0.0009530782699584961, 0.0010647773742675781, 0.0011764764785766602, 0.0012881755828857422, 0.0013998746871948242, 0.0015115737915039062, 0.0016232728958129883, 0.0017349720001220703, 0.0018466711044311523, 0.0019583702087402344, 0.0020700693130493164, 0.0021817684173583984, 0.0022934675216674805, 0.0024051666259765625, 0.0025168657302856445, 0.0026285648345947266, 0.0027402639389038086, 0.0028519630432128906, 0.0029636621475219727, 0.0030753612518310547, 0.0031870603561401367, 0.0032987594604492188, 0.0034104585647583008, 0.003522157669067383, 0.003633856773376465, 0.003745555877685547, 0.003857254981994629, 0.003968954086303711, 0.004080653190612793, 0.004192352294921875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 3.0, 5.0, 5.0, 5.0, 8.0, 10.0, 21.0, 34.0, 35.0, 55.0, 76.0, 100.0, 134.0, 235.0, 375.0, 617.0, 1181.0, 2451.0, 6214.0, 17586.0, 63160.0, 242701.0, 456752.0, 185504.0, 47549.0, 14027.0, 5056.0, 2066.0, 1011.0, 559.0, 336.0, 200.0, 148.0, 110.0, 57.0, 43.0, 35.0, 36.0, 14.0, 10.0, 7.0, 7.0, 7.0, 4.0, 6.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.484375, -29.571533203125, -28.65869140625, -27.745849609375, -26.8330078125, -25.920166015625, -25.00732421875, -24.094482421875, -23.181640625, -22.268798828125, -21.35595703125, -20.443115234375, -19.5302734375, -18.617431640625, -17.70458984375, -16.791748046875, -15.87890625, -14.966064453125, -14.05322265625, -13.140380859375, -12.2275390625, -11.314697265625, -10.40185546875, -9.489013671875, -8.576171875, -7.663330078125, -6.75048828125, -5.837646484375, -4.9248046875, -4.011962890625, -3.09912109375, -2.186279296875, -1.2734375, -0.360595703125, 0.55224609375, 1.465087890625, 2.3779296875, 3.290771484375, 4.20361328125, 5.116455078125, 6.029296875, 6.942138671875, 7.85498046875, 8.767822265625, 9.6806640625, 10.593505859375, 11.50634765625, 12.419189453125, 13.33203125, 14.244873046875, 15.15771484375, 16.070556640625, 16.9833984375, 17.896240234375, 18.80908203125, 19.721923828125, 20.634765625, 21.547607421875, 22.46044921875, 23.373291015625, 24.2861328125, 25.198974609375, 26.11181640625, 27.024658203125, 27.9375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 4.0, 4.0, 5.0, 3.0, 6.0, 6.0, 9.0, 15.0, 16.0, 19.0, 22.0, 23.0, 28.0, 32.0, 42.0, 42.0, 49.0, 62.0, 48.0, 68.0, 66.0, 62.0, 39.0, 42.0, 47.0, 38.0, 37.0, 19.0, 23.0, 26.0, 22.0, 12.0, 16.0, 11.0, 9.0, 7.0, 8.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 5.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.53125, -19.85107421875, -19.1708984375, -18.49072265625, -17.810546875, -17.13037109375, -16.4501953125, -15.77001953125, -15.08984375, -14.40966796875, -13.7294921875, -13.04931640625, -12.369140625, -11.68896484375, -11.0087890625, -10.32861328125, -9.6484375, -8.96826171875, -8.2880859375, -7.60791015625, -6.927734375, -6.24755859375, -5.5673828125, -4.88720703125, -4.20703125, -3.52685546875, -2.8466796875, -2.16650390625, -1.486328125, -0.80615234375, -0.1259765625, 0.55419921875, 1.234375, 1.91455078125, 2.5947265625, 3.27490234375, 3.955078125, 4.63525390625, 5.3154296875, 5.99560546875, 6.67578125, 7.35595703125, 8.0361328125, 8.71630859375, 9.396484375, 10.07666015625, 10.7568359375, 11.43701171875, 12.1171875, 12.79736328125, 13.4775390625, 14.15771484375, 14.837890625, 15.51806640625, 16.1982421875, 16.87841796875, 17.55859375, 18.23876953125, 18.9189453125, 19.59912109375, 20.279296875, 20.95947265625, 21.6396484375, 22.31982421875, 23.0]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 6.0, 1.0, 3.0, 11.0, 17.0, 48.0, 53.0, 83.0, 154.0, 148.0, 172.0, 133.0, 62.0, 46.0, 36.0, 16.0, 13.0, 5.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-614.4017944335938, -594.3441772460938, -574.28662109375, -554.22900390625, -534.17138671875, -514.1138305664062, -494.05621337890625, -473.9986267089844, -453.9410400390625, -433.8834533691406, -413.8258361816406, -393.76824951171875, -373.7106628417969, -353.653076171875, -333.595458984375, -313.5378723144531, -293.4802551269531, -273.42266845703125, -253.3650665283203, -233.30746459960938, -213.2498779296875, -193.19227600097656, -173.13467407226562, -153.07708740234375, -133.0194854736328, -112.9618911743164, -92.904296875, -72.84669494628906, -52.789100646972656, -32.73150634765625, -12.673904418945312, 7.3836822509765625, 27.4412841796875, 47.498878479003906, 67.55647277832031, 87.61407470703125, 107.67166900634766, 127.72926330566406, 147.786865234375, 167.84445190429688, 187.9020538330078, 207.95965576171875, 228.01724243164062, 248.07484436035156, 268.1324462890625, 288.1900329589844, 308.24761962890625, 328.30523681640625, 348.3628234863281, 368.42041015625, 388.47802734375, 408.5356140136719, 428.59320068359375, 448.65081787109375, 468.7084045410156, 488.7659912109375, 508.8236083984375, 528.8812255859375, 548.9387817382812, 568.9963989257812, 589.0540161132812, 609.111572265625, 629.169189453125, 649.226806640625, 669.2843627929688]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 5.0, 7.0, 4.0, 12.0, 14.0, 8.0, 19.0, 17.0, 12.0, 39.0, 31.0, 34.0, 41.0, 38.0, 33.0, 40.0, 37.0, 45.0, 30.0, 36.0, 48.0, 46.0, 50.0, 37.0, 47.0, 43.0, 30.0, 32.0, 28.0, 26.0, 17.0, 8.0, 15.0, 12.0, 12.0, 11.0, 11.0, 6.0, 5.0, 4.0, 4.0, 4.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-294.7973937988281, -286.0057678222656, -277.2141418457031, -268.4225158691406, -259.6308898925781, -250.83926391601562, -242.0476531982422, -233.2560272216797, -224.4644012451172, -215.6727752685547, -206.8811492919922, -198.0895233154297, -189.29791259765625, -180.50628662109375, -171.71466064453125, -162.92303466796875, -154.13140869140625, -145.33978271484375, -136.54815673828125, -127.75653839111328, -118.96491241455078, -110.17328643798828, -101.38166809082031, -92.59004211425781, -83.79841613769531, -75.00679016113281, -66.21516418457031, -57.423545837402344, -48.631919860839844, -39.840293884277344, -31.04867172241211, -22.257049560546875, -13.46539306640625, -4.673768997192383, 4.117855072021484, 12.909479141235352, 21.70110321044922, 30.49272918701172, 39.28435134887695, 48.07597351074219, 56.86759948730469, 65.65922546386719, 74.45085144042969, 83.24246978759766, 92.03409576416016, 100.82572174072266, 109.61734008789062, 118.40896606445312, 127.20059204101562, 135.99221801757812, 144.78384399414062, 153.57546997070312, 162.36709594726562, 171.15872192382812, 179.95033264160156, 188.74195861816406, 197.53358459472656, 206.32521057128906, 215.11683654785156, 223.90846252441406, 232.7000732421875, 241.49169921875, 250.2833251953125, 259.074951171875, 267.8665771484375]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 4.0, 6.0, 7.0, 12.0, 17.0, 30.0, 48.0, 98.0, 156.0, 296.0, 568.0, 1147.0, 3307.0, 18149.0, 4086182.0, 74239.0, 6545.0, 1804.0, 809.0, 385.0, 163.0, 102.0, 58.0, 55.0, 31.0, 14.0, 9.0, 10.0, 6.0, 5.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-202.625, -195.57421875, -188.5234375, -181.47265625, -174.421875, -167.37109375, -160.3203125, -153.26953125, -146.21875, -139.16796875, -132.1171875, -125.06640625, -118.015625, -110.96484375, -103.9140625, -96.86328125, -89.8125, -82.76171875, -75.7109375, -68.66015625, -61.609375, -54.55859375, -47.5078125, -40.45703125, -33.40625, -26.35546875, -19.3046875, -12.25390625, -5.203125, 1.84765625, 8.8984375, 15.94921875, 23.0, 30.05078125, 37.1015625, 44.15234375, 51.203125, 58.25390625, 65.3046875, 72.35546875, 79.40625, 86.45703125, 93.5078125, 100.55859375, 107.609375, 114.66015625, 121.7109375, 128.76171875, 135.8125, 142.86328125, 149.9140625, 156.96484375, 164.015625, 171.06640625, 178.1171875, 185.16796875, 192.21875, 199.26953125, 206.3203125, 213.37109375, 220.421875, 227.47265625, 234.5234375, 241.57421875, 248.625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 7.0, 3.0, 7.0, 6.0, 9.0, 14.0, 12.0, 21.0, 16.0, 27.0, 41.0, 38.0, 37.0, 41.0, 42.0, 44.0, 48.0, 50.0, 61.0, 60.0, 63.0, 57.0, 40.0, 41.0, 47.0, 37.0, 25.0, 19.0, 12.0, 22.0, 14.0, 15.0, 5.0, 4.0, 3.0, 4.0, 2.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.546875, -12.085205078125, -11.62353515625, -11.161865234375, -10.7001953125, -10.238525390625, -9.77685546875, -9.315185546875, -8.853515625, -8.391845703125, -7.93017578125, -7.468505859375, -7.0068359375, -6.545166015625, -6.08349609375, -5.621826171875, -5.16015625, -4.698486328125, -4.23681640625, -3.775146484375, -3.3134765625, -2.851806640625, -2.39013671875, -1.928466796875, -1.466796875, -1.005126953125, -0.54345703125, -0.081787109375, 0.3798828125, 0.841552734375, 1.30322265625, 1.764892578125, 2.2265625, 2.688232421875, 3.14990234375, 3.611572265625, 4.0732421875, 4.534912109375, 4.99658203125, 5.458251953125, 5.919921875, 6.381591796875, 6.84326171875, 7.304931640625, 7.7666015625, 8.228271484375, 8.68994140625, 9.151611328125, 9.61328125, 10.074951171875, 10.53662109375, 10.998291015625, 11.4599609375, 11.921630859375, 12.38330078125, 12.844970703125, 13.306640625, 13.768310546875, 14.22998046875, 14.691650390625, 15.1533203125, 15.614990234375, 16.07666015625, 16.538330078125, 17.0]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 3.0, 7.0, 16.0, 13.0, 23.0, 21.0, 37.0, 48.0, 59.0, 102.0, 157.0, 230.0, 392.0, 712.0, 1092.0, 2220.0, 5357.0, 17117.0, 131744.0, 3966147.0, 50199.0, 10499.0, 3873.0, 1727.0, 978.0, 580.0, 317.0, 185.0, 136.0, 99.0, 62.0, 39.0, 32.0, 11.0, 17.0, 7.0, 8.0, 3.0, 4.0, 0.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-112.8125, -109.6181640625, -106.423828125, -103.2294921875, -100.03515625, -96.8408203125, -93.646484375, -90.4521484375, -87.2578125, -84.0634765625, -80.869140625, -77.6748046875, -74.48046875, -71.2861328125, -68.091796875, -64.8974609375, -61.703125, -58.5087890625, -55.314453125, -52.1201171875, -48.92578125, -45.7314453125, -42.537109375, -39.3427734375, -36.1484375, -32.9541015625, -29.759765625, -26.5654296875, -23.37109375, -20.1767578125, -16.982421875, -13.7880859375, -10.59375, -7.3994140625, -4.205078125, -1.0107421875, 2.18359375, 5.3779296875, 8.572265625, 11.7666015625, 14.9609375, 18.1552734375, 21.349609375, 24.5439453125, 27.73828125, 30.9326171875, 34.126953125, 37.3212890625, 40.515625, 43.7099609375, 46.904296875, 50.0986328125, 53.29296875, 56.4873046875, 59.681640625, 62.8759765625, 66.0703125, 69.2646484375, 72.458984375, 75.6533203125, 78.84765625, 82.0419921875, 85.236328125, 88.4306640625, 91.625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 4.0, 3.0, 10.0, 21.0, 25.0, 43.0, 100.0, 288.0, 3262.0, 174.0, 63.0, 24.0, 14.0, 15.0, 5.0, 8.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-23.703125, -23.067626953125, -22.43212890625, -21.796630859375, -21.1611328125, -20.525634765625, -19.89013671875, -19.254638671875, -18.619140625, -17.983642578125, -17.34814453125, -16.712646484375, -16.0771484375, -15.441650390625, -14.80615234375, -14.170654296875, -13.53515625, -12.899658203125, -12.26416015625, -11.628662109375, -10.9931640625, -10.357666015625, -9.72216796875, -9.086669921875, -8.451171875, -7.815673828125, -7.18017578125, -6.544677734375, -5.9091796875, -5.273681640625, -4.63818359375, -4.002685546875, -3.3671875, -2.731689453125, -2.09619140625, -1.460693359375, -0.8251953125, -0.189697265625, 0.44580078125, 1.081298828125, 1.716796875, 2.352294921875, 2.98779296875, 3.623291015625, 4.2587890625, 4.894287109375, 5.52978515625, 6.165283203125, 6.80078125, 7.436279296875, 8.07177734375, 8.707275390625, 9.3427734375, 9.978271484375, 10.61376953125, 11.249267578125, 11.884765625, 12.520263671875, 13.15576171875, 13.791259765625, 14.4267578125, 15.062255859375, 15.69775390625, 16.333251953125, 16.96875]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 4.0, 13.0, 14.0, 33.0, 32.0, 57.0, 58.0, 81.0, 105.0, 133.0, 102.0, 93.0, 84.0, 62.0, 43.0, 21.0, 19.0, 16.0, 7.0, 7.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.64203643798828, -61.530479431152344, -59.418922424316406, -57.30736541748047, -55.19580841064453, -53.084251403808594, -50.972694396972656, -48.86113739013672, -46.74958038330078, -44.638023376464844, -42.526466369628906, -40.41490936279297, -38.30335235595703, -36.191795349121094, -34.080238342285156, -31.96868133544922, -29.85712432861328, -27.745567321777344, -25.634010314941406, -23.52245330810547, -21.41089630126953, -19.299339294433594, -17.187782287597656, -15.076225280761719, -12.964668273925781, -10.853111267089844, -8.741554260253906, -6.629997253417969, -4.518440246582031, -2.4068832397460938, -0.29532623291015625, 1.8162307739257812, 3.9277801513671875, 6.039337158203125, 8.150894165039062, 10.262451171875, 12.374008178710938, 14.485565185546875, 16.597122192382812, 18.70867919921875, 20.820236206054688, 22.931793212890625, 25.043350219726562, 27.1549072265625, 29.266464233398438, 31.378021240234375, 33.48957824707031, 35.60113525390625, 37.71269226074219, 39.824249267578125, 41.93580627441406, 44.04736328125, 46.15892028808594, 48.270477294921875, 50.38203430175781, 52.49359130859375, 54.60514831542969, 56.716705322265625, 58.82826232910156, 60.9398193359375, 63.05137634277344, 65.16293334960938, 67.27449035644531, 69.38604736328125, 71.49760437011719]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 5.0, 3.0, 5.0, 10.0, 7.0, 9.0, 4.0, 10.0, 19.0, 15.0, 22.0, 24.0, 29.0, 27.0, 29.0, 27.0, 31.0, 51.0, 41.0, 54.0, 59.0, 58.0, 42.0, 41.0, 38.0, 38.0, 36.0, 35.0, 35.0, 29.0, 26.0, 20.0, 22.0, 15.0, 16.0, 20.0, 10.0, 11.0, 8.0, 4.0, 6.0, 7.0, 4.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-36.5850715637207, -35.49740219116211, -34.40972900390625, -33.322059631347656, -32.23439025878906, -31.146717071533203, -30.05904769897461, -28.971376419067383, -27.883705139160156, -26.79603385925293, -25.708362579345703, -24.62069320678711, -23.533021926879883, -22.445350646972656, -21.357681274414062, -20.270009994506836, -19.18233871459961, -18.094667434692383, -17.006996154785156, -15.919326782226562, -14.831655502319336, -13.74398422241211, -12.6563138961792, -11.568643569946289, -10.480972290039062, -9.393301010131836, -8.305630683898926, -7.217959880828857, -6.130289077758789, -5.042618274688721, -3.9549474716186523, -2.867276668548584, -1.77960205078125, -0.6919312477111816, 0.3957395553588867, 1.483410358428955, 2.5710811614990234, 3.658751964569092, 4.74642276763916, 5.8340935707092285, 6.921764373779297, 8.009435653686523, 9.097105979919434, 10.184776306152344, 11.27244758605957, 12.360118865966797, 13.447789192199707, 14.535459518432617, 15.623130798339844, 16.71080207824707, 17.798473358154297, 18.88614273071289, 19.973814010620117, 21.061485290527344, 22.149154663085938, 23.236825942993164, 24.32449722290039, 25.412168502807617, 26.499839782714844, 27.587509155273438, 28.675180435180664, 29.76285171508789, 30.850521087646484, 31.93819236755371, 33.02586364746094]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 6.0, 10.0, 9.0, 10.0, 17.0, 31.0, 38.0, 67.0, 93.0, 163.0, 228.0, 392.0, 822.0, 1602.0, 3762.0, 9365.0, 25503.0, 71721.0, 190532.0, 348573.0, 243277.0, 95801.0, 34591.0, 12687.0, 4898.0, 2060.0, 997.0, 524.0, 273.0, 180.0, 119.0, 76.0, 43.0, 27.0, 21.0, 11.0, 9.0, 9.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-59.9375, -58.20751953125, -56.4775390625, -54.74755859375, -53.017578125, -51.28759765625, -49.5576171875, -47.82763671875, -46.09765625, -44.36767578125, -42.6376953125, -40.90771484375, -39.177734375, -37.44775390625, -35.7177734375, -33.98779296875, -32.2578125, -30.52783203125, -28.7978515625, -27.06787109375, -25.337890625, -23.60791015625, -21.8779296875, -20.14794921875, -18.41796875, -16.68798828125, -14.9580078125, -13.22802734375, -11.498046875, -9.76806640625, -8.0380859375, -6.30810546875, -4.578125, -2.84814453125, -1.1181640625, 0.61181640625, 2.341796875, 4.07177734375, 5.8017578125, 7.53173828125, 9.26171875, 10.99169921875, 12.7216796875, 14.45166015625, 16.181640625, 17.91162109375, 19.6416015625, 21.37158203125, 23.1015625, 24.83154296875, 26.5615234375, 28.29150390625, 30.021484375, 31.75146484375, 33.4814453125, 35.21142578125, 36.94140625, 38.67138671875, 40.4013671875, 42.13134765625, 43.861328125, 45.59130859375, 47.3212890625, 49.05126953125, 50.78125]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 5.0, 4.0, 3.0, 9.0, 5.0, 7.0, 13.0, 20.0, 24.0, 14.0, 22.0, 27.0, 33.0, 33.0, 41.0, 32.0, 40.0, 49.0, 55.0, 51.0, 60.0, 55.0, 48.0, 36.0, 54.0, 50.0, 34.0, 35.0, 31.0, 24.0, 16.0, 14.0, 9.0, 14.0, 8.0, 5.0, 7.0, 6.0, 4.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.9453125, -12.4676513671875, -11.989990234375, -11.5123291015625, -11.03466796875, -10.5570068359375, -10.079345703125, -9.6016845703125, -9.1240234375, -8.6463623046875, -8.168701171875, -7.6910400390625, -7.21337890625, -6.7357177734375, -6.258056640625, -5.7803955078125, -5.302734375, -4.8250732421875, -4.347412109375, -3.8697509765625, -3.39208984375, -2.9144287109375, -2.436767578125, -1.9591064453125, -1.4814453125, -1.0037841796875, -0.526123046875, -0.0484619140625, 0.42919921875, 0.9068603515625, 1.384521484375, 1.8621826171875, 2.33984375, 2.8175048828125, 3.295166015625, 3.7728271484375, 4.25048828125, 4.7281494140625, 5.205810546875, 5.6834716796875, 6.1611328125, 6.6387939453125, 7.116455078125, 7.5941162109375, 8.07177734375, 8.5494384765625, 9.027099609375, 9.5047607421875, 9.982421875, 10.4600830078125, 10.937744140625, 11.4154052734375, 11.89306640625, 12.3707275390625, 12.848388671875, 13.3260498046875, 13.8037109375, 14.2813720703125, 14.759033203125, 15.2366943359375, 15.71435546875, 16.1920166015625, 16.669677734375, 17.1473388671875, 17.625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 5.0, 5.0, 10.0, 11.0, 13.0, 21.0, 21.0, 28.0, 35.0, 46.0, 67.0, 95.0, 117.0, 177.0, 219.0, 281.0, 368.0, 594.0, 963.0, 1612.0, 3123.0, 6941.0, 19039.0, 53093.0, 153035.0, 374738.0, 275705.0, 99917.0, 34515.0, 12408.0, 5114.0, 2329.0, 1246.0, 739.0, 507.0, 327.0, 255.0, 235.0, 136.0, 127.0, 91.0, 71.0, 54.0, 36.0, 21.0, 24.0, 19.0, 5.0, 6.0, 8.0, 1.0, 3.0, 3.0, 4.0, 1.0, 3.0], "bins": [-49.34375, -47.8837890625, -46.423828125, -44.9638671875, -43.50390625, -42.0439453125, -40.583984375, -39.1240234375, -37.6640625, -36.2041015625, -34.744140625, -33.2841796875, -31.82421875, -30.3642578125, -28.904296875, -27.4443359375, -25.984375, -24.5244140625, -23.064453125, -21.6044921875, -20.14453125, -18.6845703125, -17.224609375, -15.7646484375, -14.3046875, -12.8447265625, -11.384765625, -9.9248046875, -8.46484375, -7.0048828125, -5.544921875, -4.0849609375, -2.625, -1.1650390625, 0.294921875, 1.7548828125, 3.21484375, 4.6748046875, 6.134765625, 7.5947265625, 9.0546875, 10.5146484375, 11.974609375, 13.4345703125, 14.89453125, 16.3544921875, 17.814453125, 19.2744140625, 20.734375, 22.1943359375, 23.654296875, 25.1142578125, 26.57421875, 28.0341796875, 29.494140625, 30.9541015625, 32.4140625, 33.8740234375, 35.333984375, 36.7939453125, 38.25390625, 39.7138671875, 41.173828125, 42.6337890625, 44.09375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 1.0, 3.0, 5.0, 4.0, 8.0, 7.0, 8.0, 13.0, 10.0, 13.0, 13.0, 9.0, 20.0, 21.0, 30.0, 26.0, 34.0, 30.0, 40.0, 35.0, 25.0, 32.0, 29.0, 37.0, 41.0, 44.0, 36.0, 37.0, 34.0, 35.0, 28.0, 20.0, 31.0, 31.0, 23.0, 21.0, 24.0, 22.0, 17.0, 23.0, 16.0, 15.0, 10.0, 5.0, 8.0, 9.0, 3.0, 4.0, 4.0, 3.0, 2.0, 6.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-52.03125, -50.40380859375, -48.7763671875, -47.14892578125, -45.521484375, -43.89404296875, -42.2666015625, -40.63916015625, -39.01171875, -37.38427734375, -35.7568359375, -34.12939453125, -32.501953125, -30.87451171875, -29.2470703125, -27.61962890625, -25.9921875, -24.36474609375, -22.7373046875, -21.10986328125, -19.482421875, -17.85498046875, -16.2275390625, -14.60009765625, -12.97265625, -11.34521484375, -9.7177734375, -8.09033203125, -6.462890625, -4.83544921875, -3.2080078125, -1.58056640625, 0.046875, 1.67431640625, 3.3017578125, 4.92919921875, 6.556640625, 8.18408203125, 9.8115234375, 11.43896484375, 13.06640625, 14.69384765625, 16.3212890625, 17.94873046875, 19.576171875, 21.20361328125, 22.8310546875, 24.45849609375, 26.0859375, 27.71337890625, 29.3408203125, 30.96826171875, 32.595703125, 34.22314453125, 35.8505859375, 37.47802734375, 39.10546875, 40.73291015625, 42.3603515625, 43.98779296875, 45.615234375, 47.24267578125, 48.8701171875, 50.49755859375, 52.125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 7.0, 7.0, 3.0, 2.0, 10.0, 10.0, 13.0, 27.0, 38.0, 47.0, 57.0, 107.0, 149.0, 238.0, 419.0, 715.0, 1321.0, 2767.0, 6402.0, 17974.0, 63972.0, 265515.0, 484956.0, 147132.0, 36528.0, 11342.0, 4240.0, 2043.0, 1018.0, 569.0, 296.0, 210.0, 141.0, 86.0, 53.0, 34.0, 37.0, 26.0, 17.0, 11.0, 4.0, 5.0, 5.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-26.765625, -25.936767578125, -25.10791015625, -24.279052734375, -23.4501953125, -22.621337890625, -21.79248046875, -20.963623046875, -20.134765625, -19.305908203125, -18.47705078125, -17.648193359375, -16.8193359375, -15.990478515625, -15.16162109375, -14.332763671875, -13.50390625, -12.675048828125, -11.84619140625, -11.017333984375, -10.1884765625, -9.359619140625, -8.53076171875, -7.701904296875, -6.873046875, -6.044189453125, -5.21533203125, -4.386474609375, -3.5576171875, -2.728759765625, -1.89990234375, -1.071044921875, -0.2421875, 0.586669921875, 1.41552734375, 2.244384765625, 3.0732421875, 3.902099609375, 4.73095703125, 5.559814453125, 6.388671875, 7.217529296875, 8.04638671875, 8.875244140625, 9.7041015625, 10.532958984375, 11.36181640625, 12.190673828125, 13.01953125, 13.848388671875, 14.67724609375, 15.506103515625, 16.3349609375, 17.163818359375, 17.99267578125, 18.821533203125, 19.650390625, 20.479248046875, 21.30810546875, 22.136962890625, 22.9658203125, 23.794677734375, 24.62353515625, 25.452392578125, 26.28125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 8.0, 10.0, 13.0, 19.0, 38.0, 52.0, 83.0, 120.0, 163.0, 148.0, 121.0, 80.0, 61.0, 34.0, 24.0, 12.0, 6.0, 7.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00685882568359375, -0.0066378116607666016, -0.006416797637939453, -0.006195783615112305, -0.005974769592285156, -0.005753755569458008, -0.005532741546630859, -0.005311727523803711, -0.0050907135009765625, -0.004869699478149414, -0.004648685455322266, -0.004427671432495117, -0.004206657409667969, -0.00398564338684082, -0.003764629364013672, -0.0035436153411865234, -0.003322601318359375, -0.0031015872955322266, -0.002880573272705078, -0.0026595592498779297, -0.0024385452270507812, -0.002217531204223633, -0.0019965171813964844, -0.001775503158569336, -0.0015544891357421875, -0.001333475112915039, -0.0011124610900878906, -0.0008914470672607422, -0.0006704330444335938, -0.0004494190216064453, -0.00022840499877929688, -7.3909759521484375e-06, 0.000213623046875, 0.00043463706970214844, 0.0006556510925292969, 0.0008766651153564453, 0.0010976791381835938, 0.0013186931610107422, 0.0015397071838378906, 0.001760721206665039, 0.0019817352294921875, 0.002202749252319336, 0.0024237632751464844, 0.002644777297973633, 0.0028657913208007812, 0.0030868053436279297, 0.003307819366455078, 0.0035288333892822266, 0.003749847412109375, 0.0039708614349365234, 0.004191875457763672, 0.00441288948059082, 0.004633903503417969, 0.004854917526245117, 0.005075931549072266, 0.005296945571899414, 0.0055179595947265625, 0.005738973617553711, 0.005959987640380859, 0.006181001663208008, 0.006402015686035156, 0.006623029708862305, 0.006844043731689453, 0.0070650577545166016, 0.00728607177734375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 4.0, 5.0, 4.0, 12.0, 12.0, 32.0, 47.0, 65.0, 133.0, 191.0, 364.0, 799.0, 1785.0, 5458.0, 25847.0, 249870.0, 668868.0, 77915.0, 11681.0, 3074.0, 1164.0, 557.0, 265.0, 150.0, 105.0, 58.0, 34.0, 18.0, 14.0, 13.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-49.34375, -47.8603515625, -46.376953125, -44.8935546875, -43.41015625, -41.9267578125, -40.443359375, -38.9599609375, -37.4765625, -35.9931640625, -34.509765625, -33.0263671875, -31.54296875, -30.0595703125, -28.576171875, -27.0927734375, -25.609375, -24.1259765625, -22.642578125, -21.1591796875, -19.67578125, -18.1923828125, -16.708984375, -15.2255859375, -13.7421875, -12.2587890625, -10.775390625, -9.2919921875, -7.80859375, -6.3251953125, -4.841796875, -3.3583984375, -1.875, -0.3916015625, 1.091796875, 2.5751953125, 4.05859375, 5.5419921875, 7.025390625, 8.5087890625, 9.9921875, 11.4755859375, 12.958984375, 14.4423828125, 15.92578125, 17.4091796875, 18.892578125, 20.3759765625, 21.859375, 23.3427734375, 24.826171875, 26.3095703125, 27.79296875, 29.2763671875, 30.759765625, 32.2431640625, 33.7265625, 35.2099609375, 36.693359375, 38.1767578125, 39.66015625, 41.1435546875, 42.626953125, 44.1103515625, 45.59375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 4.0, 1.0, 1.0, 4.0, 6.0, 7.0, 9.0, 5.0, 10.0, 8.0, 13.0, 21.0, 23.0, 23.0, 46.0, 59.0, 47.0, 80.0, 75.0, 85.0, 85.0, 87.0, 65.0, 58.0, 41.0, 34.0, 23.0, 23.0, 14.0, 12.0, 11.0, 5.0, 5.0, 8.0, 6.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.5625, -30.628662109375, -29.69482421875, -28.760986328125, -27.8271484375, -26.893310546875, -25.95947265625, -25.025634765625, -24.091796875, -23.157958984375, -22.22412109375, -21.290283203125, -20.3564453125, -19.422607421875, -18.48876953125, -17.554931640625, -16.62109375, -15.687255859375, -14.75341796875, -13.819580078125, -12.8857421875, -11.951904296875, -11.01806640625, -10.084228515625, -9.150390625, -8.216552734375, -7.28271484375, -6.348876953125, -5.4150390625, -4.481201171875, -3.54736328125, -2.613525390625, -1.6796875, -0.745849609375, 0.18798828125, 1.121826171875, 2.0556640625, 2.989501953125, 3.92333984375, 4.857177734375, 5.791015625, 6.724853515625, 7.65869140625, 8.592529296875, 9.5263671875, 10.460205078125, 11.39404296875, 12.327880859375, 13.26171875, 14.195556640625, 15.12939453125, 16.063232421875, 16.9970703125, 17.930908203125, 18.86474609375, 19.798583984375, 20.732421875, 21.666259765625, 22.60009765625, 23.533935546875, 24.4677734375, 25.401611328125, 26.33544921875, 27.269287109375, 28.203125]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 11.0, 18.0, 40.0, 124.0, 225.0, 253.0, 184.0, 93.0, 40.0, 11.0, 7.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-927.5210571289062, -892.4483642578125, -857.3756103515625, -822.3028564453125, -787.2301635742188, -752.157470703125, -717.084716796875, -682.011962890625, -646.9392700195312, -611.8665771484375, -576.7938232421875, -541.7210693359375, -506.64837646484375, -471.5756530761719, -436.5029296875, -401.4302062988281, -366.35748291015625, -331.2847595214844, -296.2120361328125, -261.1393127441406, -226.06658935546875, -190.99386596679688, -155.921142578125, -120.84841918945312, -85.77569580078125, -50.702972412109375, -15.6302490234375, 19.442474365234375, 54.51519775390625, 89.58792114257812, 124.66064453125, 159.73336791992188, 194.8060302734375, 229.87875366210938, 264.95147705078125, 300.0242004394531, 335.096923828125, 370.1696472167969, 405.24237060546875, 440.3150939941406, 475.3878173828125, 510.4605407714844, 545.5332641601562, 580.60595703125, 615.6787109375, 650.75146484375, 685.8241577148438, 720.8968505859375, 755.9696044921875, 791.0423583984375, 826.1150512695312, 861.187744140625, 896.260498046875, 931.333251953125, 966.4059448242188, 1001.4786376953125, 1036.5513916015625, 1071.6241455078125, 1106.69677734375, 1141.76953125, 1176.84228515625, 1211.9150390625, 1246.98779296875, 1282.0604248046875, 1317.1331787109375]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 5.0, 0.0, 7.0, 6.0, 14.0, 14.0, 17.0, 18.0, 17.0, 14.0, 22.0, 27.0, 29.0, 31.0, 35.0, 38.0, 36.0, 31.0, 44.0, 58.0, 63.0, 45.0, 42.0, 35.0, 59.0, 51.0, 44.0, 26.0, 27.0, 25.0, 17.0, 20.0, 19.0, 13.0, 11.0, 8.0, 11.0, 5.0, 6.0, 5.0, 5.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-339.6788330078125, -329.2286376953125, -318.7784423828125, -308.3282165527344, -297.8780212402344, -287.4278259277344, -276.9776306152344, -266.5274353027344, -256.07720947265625, -245.62701416015625, -235.1768035888672, -224.7266082763672, -214.27639770507812, -203.82620239257812, -193.37600708007812, -182.92581176757812, -172.47561645507812, -162.02542114257812, -151.57521057128906, -141.12501525878906, -130.6748046875, -120.224609375, -109.7744140625, -99.32421112060547, -88.87400817871094, -78.4238052368164, -67.97360229492188, -57.523406982421875, -47.073204040527344, -36.62300109863281, -26.172801971435547, -15.722602844238281, -5.27239990234375, 5.177801132202148, 15.628002166748047, 26.078203201293945, 36.528404235839844, 46.978607177734375, 57.42880630493164, 67.8790054321289, 78.32920837402344, 88.77941131591797, 99.2296142578125, 109.6798095703125, 120.13001251220703, 130.58021545410156, 141.03041076660156, 151.48062133789062, 161.93081665039062, 172.38101196289062, 182.8312225341797, 193.2814178466797, 203.73162841796875, 214.18182373046875, 224.63201904296875, 235.08221435546875, 245.5324249267578, 255.9826202392578, 266.4328308105469, 276.8830261230469, 287.3332214355469, 297.783447265625, 308.233642578125, 318.683837890625, 329.134033203125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 7.0, 5.0, 12.0, 25.0, 30.0, 58.0, 106.0, 188.0, 492.0, 1811.0, 9583.0, 230764.0, 3935103.0, 12721.0, 2278.0, 613.0, 224.0, 114.0, 63.0, 37.0, 19.0, 8.0, 6.0, 3.0, 6.0, 5.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-166.875, -161.134765625, -155.39453125, -149.654296875, -143.9140625, -138.173828125, -132.43359375, -126.693359375, -120.953125, -115.212890625, -109.47265625, -103.732421875, -97.9921875, -92.251953125, -86.51171875, -80.771484375, -75.03125, -69.291015625, -63.55078125, -57.810546875, -52.0703125, -46.330078125, -40.58984375, -34.849609375, -29.109375, -23.369140625, -17.62890625, -11.888671875, -6.1484375, -0.408203125, 5.33203125, 11.072265625, 16.8125, 22.552734375, 28.29296875, 34.033203125, 39.7734375, 45.513671875, 51.25390625, 56.994140625, 62.734375, 68.474609375, 74.21484375, 79.955078125, 85.6953125, 91.435546875, 97.17578125, 102.916015625, 108.65625, 114.396484375, 120.13671875, 125.876953125, 131.6171875, 137.357421875, 143.09765625, 148.837890625, 154.578125, 160.318359375, 166.05859375, 171.798828125, 177.5390625, 183.279296875, 189.01953125, 194.759765625, 200.5]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 5.0, 9.0, 3.0, 7.0, 9.0, 14.0, 12.0, 16.0, 20.0, 22.0, 27.0, 28.0, 43.0, 35.0, 45.0, 48.0, 53.0, 60.0, 42.0, 54.0, 50.0, 48.0, 48.0, 47.0, 45.0, 39.0, 33.0, 22.0, 25.0, 27.0, 17.0, 12.0, 6.0, 8.0, 9.0, 6.0, 3.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.7578125, -14.2510986328125, -13.744384765625, -13.2376708984375, -12.73095703125, -12.2242431640625, -11.717529296875, -11.2108154296875, -10.7041015625, -10.1973876953125, -9.690673828125, -9.1839599609375, -8.67724609375, -8.1705322265625, -7.663818359375, -7.1571044921875, -6.650390625, -6.1436767578125, -5.636962890625, -5.1302490234375, -4.62353515625, -4.1168212890625, -3.610107421875, -3.1033935546875, -2.5966796875, -2.0899658203125, -1.583251953125, -1.0765380859375, -0.56982421875, -0.0631103515625, 0.443603515625, 0.9503173828125, 1.45703125, 1.9637451171875, 2.470458984375, 2.9771728515625, 3.48388671875, 3.9906005859375, 4.497314453125, 5.0040283203125, 5.5107421875, 6.0174560546875, 6.524169921875, 7.0308837890625, 7.53759765625, 8.0443115234375, 8.551025390625, 9.0577392578125, 9.564453125, 10.0711669921875, 10.577880859375, 11.0845947265625, 11.59130859375, 12.0980224609375, 12.604736328125, 13.1114501953125, 13.6181640625, 14.1248779296875, 14.631591796875, 15.1383056640625, 15.64501953125, 16.1517333984375, 16.658447265625, 17.1651611328125, 17.671875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [4.0, 1.0, 5.0, 3.0, 1.0, 4.0, 6.0, 6.0, 17.0, 16.0, 19.0, 30.0, 43.0, 57.0, 66.0, 98.0, 156.0, 174.0, 281.0, 373.0, 503.0, 791.0, 1202.0, 1784.0, 2762.0, 4507.0, 7988.0, 15524.0, 37854.0, 146286.0, 3755257.0, 144818.0, 37586.0, 15455.0, 7846.0, 4339.0, 2707.0, 1814.0, 1227.0, 813.0, 523.0, 374.0, 241.0, 215.0, 139.0, 84.0, 73.0, 54.0, 36.0, 41.0, 18.0, 25.0, 24.0, 8.0, 8.0, 5.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-42.1875, -40.80419921875, -39.4208984375, -38.03759765625, -36.654296875, -35.27099609375, -33.8876953125, -32.50439453125, -31.12109375, -29.73779296875, -28.3544921875, -26.97119140625, -25.587890625, -24.20458984375, -22.8212890625, -21.43798828125, -20.0546875, -18.67138671875, -17.2880859375, -15.90478515625, -14.521484375, -13.13818359375, -11.7548828125, -10.37158203125, -8.98828125, -7.60498046875, -6.2216796875, -4.83837890625, -3.455078125, -2.07177734375, -0.6884765625, 0.69482421875, 2.078125, 3.46142578125, 4.8447265625, 6.22802734375, 7.611328125, 8.99462890625, 10.3779296875, 11.76123046875, 13.14453125, 14.52783203125, 15.9111328125, 17.29443359375, 18.677734375, 20.06103515625, 21.4443359375, 22.82763671875, 24.2109375, 25.59423828125, 26.9775390625, 28.36083984375, 29.744140625, 31.12744140625, 32.5107421875, 33.89404296875, 35.27734375, 36.66064453125, 38.0439453125, 39.42724609375, 40.810546875, 42.19384765625, 43.5771484375, 44.96044921875, 46.34375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 1.0, 3.0, 5.0, 8.0, 7.0, 8.0, 24.0, 32.0, 42.0, 58.0, 166.0, 2757.0, 580.0, 135.0, 74.0, 33.0, 33.0, 21.0, 12.0, 8.0, 12.0, 14.0, 4.0, 6.0, 5.0, 6.0, 1.0, 0.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.8515625, -13.417724609375, -12.98388671875, -12.550048828125, -12.1162109375, -11.682373046875, -11.24853515625, -10.814697265625, -10.380859375, -9.947021484375, -9.51318359375, -9.079345703125, -8.6455078125, -8.211669921875, -7.77783203125, -7.343994140625, -6.91015625, -6.476318359375, -6.04248046875, -5.608642578125, -5.1748046875, -4.740966796875, -4.30712890625, -3.873291015625, -3.439453125, -3.005615234375, -2.57177734375, -2.137939453125, -1.7041015625, -1.270263671875, -0.83642578125, -0.402587890625, 0.03125, 0.465087890625, 0.89892578125, 1.332763671875, 1.7666015625, 2.200439453125, 2.63427734375, 3.068115234375, 3.501953125, 3.935791015625, 4.36962890625, 4.803466796875, 5.2373046875, 5.671142578125, 6.10498046875, 6.538818359375, 6.97265625, 7.406494140625, 7.84033203125, 8.274169921875, 8.7080078125, 9.141845703125, 9.57568359375, 10.009521484375, 10.443359375, 10.877197265625, 11.31103515625, 11.744873046875, 12.1787109375, 12.612548828125, 13.04638671875, 13.480224609375, 13.9140625]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 5.0, 5.0, 3.0, 13.0, 11.0, 24.0, 33.0, 65.0, 72.0, 93.0, 99.0, 128.0, 113.0, 74.0, 78.0, 59.0, 39.0, 33.0, 19.0, 11.0, 5.0, 7.0, 4.0, 4.0, 2.0, 4.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.242706298828125, -53.68707275390625, -51.13143539428711, -48.575801849365234, -46.020164489746094, -43.46453094482422, -40.908897399902344, -38.35326385498047, -35.79762649536133, -33.24199295043945, -30.686355590820312, -28.130722045898438, -25.57508659362793, -23.019451141357422, -20.463817596435547, -17.90818214416504, -15.352546691894531, -12.796911239624023, -10.241276741027832, -7.685641765594482, -5.130006790161133, -2.574371337890625, -0.018736839294433594, 2.536897659301758, 5.092533111572266, 7.648168087005615, 10.203803062438965, 12.759437561035156, 15.315073013305664, 17.870708465576172, 20.426342010498047, 22.981977462768555, 25.537612915039062, 28.09324836730957, 30.648883819580078, 33.20451736450195, 35.760154724121094, 38.31578826904297, 40.871421813964844, 43.42705535888672, 45.98269271850586, 48.538326263427734, 51.093963623046875, 53.64959716796875, 56.205230712890625, 58.760868072509766, 61.31650161743164, 63.87213897705078, 66.42777252197266, 68.98340606689453, 71.5390396118164, 74.09468078613281, 76.65031433105469, 79.20594787597656, 81.76158142089844, 84.31721496582031, 86.87284851074219, 89.42848205566406, 91.98411560058594, 94.53975677490234, 97.09539031982422, 99.6510238647461, 102.20665740966797, 104.76229095458984, 107.31793212890625]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 7.0, 4.0, 10.0, 10.0, 14.0, 15.0, 19.0, 24.0, 21.0, 23.0, 40.0, 36.0, 34.0, 31.0, 36.0, 38.0, 28.0, 30.0, 41.0, 37.0, 38.0, 41.0, 36.0, 38.0, 39.0, 36.0, 28.0, 36.0, 32.0, 27.0, 21.0, 21.0, 17.0, 15.0, 18.0, 12.0, 10.0, 5.0, 3.0, 8.0, 2.0, 3.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-38.32070541381836, -37.068180084228516, -35.81565475463867, -34.56312561035156, -33.31060028076172, -32.058074951171875, -30.80554962158203, -29.553022384643555, -28.300495147705078, -27.047969818115234, -25.795442581176758, -24.542917251586914, -23.290390014648438, -22.037864685058594, -20.78533935546875, -19.532812118530273, -18.28028678894043, -17.027761459350586, -15.77523422241211, -14.522708892822266, -13.270181655883789, -12.017656326293945, -10.765130043029785, -9.512603759765625, -8.260077476501465, -7.007551193237305, -5.7550249099731445, -4.502499103546143, -3.2499728202819824, -1.9974465370178223, -0.7449207305908203, 0.5076055526733398, 1.7601318359375, 3.01265811920166, 4.26518440246582, 5.517710208892822, 6.770236492156982, 8.022762298583984, 9.275288581848145, 10.527814865112305, 11.780341148376465, 13.032867431640625, 14.285393714904785, 15.537919998168945, 16.79044532775879, 18.042972564697266, 19.29549789428711, 20.548023223876953, 21.80055046081543, 23.053075790405273, 24.30560302734375, 25.558128356933594, 26.81065559387207, 28.063180923461914, 29.31570816040039, 30.568233489990234, 31.820758819580078, 33.07328414916992, 34.325809478759766, 35.578338623046875, 36.83086395263672, 38.08338928222656, 39.335914611816406, 40.58843994140625, 41.84096908569336]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 6.0, 6.0, 6.0, 2.0, 9.0, 10.0, 25.0, 32.0, 42.0, 59.0, 101.0, 166.0, 285.0, 497.0, 924.0, 1927.0, 4163.0, 9613.0, 25535.0, 69676.0, 190384.0, 338799.0, 248888.0, 98783.0, 35308.0, 12871.0, 5384.0, 2445.0, 1216.0, 567.0, 334.0, 165.0, 114.0, 59.0, 47.0, 39.0, 31.0, 14.0, 12.0, 6.0, 6.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.65625, -42.1845703125, -40.712890625, -39.2412109375, -37.76953125, -36.2978515625, -34.826171875, -33.3544921875, -31.8828125, -30.4111328125, -28.939453125, -27.4677734375, -25.99609375, -24.5244140625, -23.052734375, -21.5810546875, -20.109375, -18.6376953125, -17.166015625, -15.6943359375, -14.22265625, -12.7509765625, -11.279296875, -9.8076171875, -8.3359375, -6.8642578125, -5.392578125, -3.9208984375, -2.44921875, -0.9775390625, 0.494140625, 1.9658203125, 3.4375, 4.9091796875, 6.380859375, 7.8525390625, 9.32421875, 10.7958984375, 12.267578125, 13.7392578125, 15.2109375, 16.6826171875, 18.154296875, 19.6259765625, 21.09765625, 22.5693359375, 24.041015625, 25.5126953125, 26.984375, 28.4560546875, 29.927734375, 31.3994140625, 32.87109375, 34.3427734375, 35.814453125, 37.2861328125, 38.7578125, 40.2294921875, 41.701171875, 43.1728515625, 44.64453125, 46.1162109375, 47.587890625, 49.0595703125, 50.53125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 8.0, 5.0, 5.0, 6.0, 8.0, 11.0, 9.0, 12.0, 23.0, 22.0, 26.0, 32.0, 32.0, 40.0, 45.0, 44.0, 50.0, 48.0, 49.0, 56.0, 56.0, 35.0, 41.0, 40.0, 55.0, 42.0, 34.0, 30.0, 25.0, 28.0, 13.0, 9.0, 10.0, 9.0, 11.0, 9.0, 8.0, 5.0, 3.0, 4.0, 1.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.3046875, -14.7872314453125, -14.269775390625, -13.7523193359375, -13.23486328125, -12.7174072265625, -12.199951171875, -11.6824951171875, -11.1650390625, -10.6475830078125, -10.130126953125, -9.6126708984375, -9.09521484375, -8.5777587890625, -8.060302734375, -7.5428466796875, -7.025390625, -6.5079345703125, -5.990478515625, -5.4730224609375, -4.95556640625, -4.4381103515625, -3.920654296875, -3.4031982421875, -2.8857421875, -2.3682861328125, -1.850830078125, -1.3333740234375, -0.81591796875, -0.2984619140625, 0.218994140625, 0.7364501953125, 1.25390625, 1.7713623046875, 2.288818359375, 2.8062744140625, 3.32373046875, 3.8411865234375, 4.358642578125, 4.8760986328125, 5.3935546875, 5.9110107421875, 6.428466796875, 6.9459228515625, 7.46337890625, 7.9808349609375, 8.498291015625, 9.0157470703125, 9.533203125, 10.0506591796875, 10.568115234375, 11.0855712890625, 11.60302734375, 12.1204833984375, 12.637939453125, 13.1553955078125, 13.6728515625, 14.1903076171875, 14.707763671875, 15.2252197265625, 15.74267578125, 16.2601318359375, 16.777587890625, 17.2950439453125, 17.8125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 4.0, 4.0, 2.0, 9.0, 11.0, 18.0, 19.0, 23.0, 32.0, 47.0, 68.0, 112.0, 116.0, 155.0, 222.0, 292.0, 444.0, 646.0, 937.0, 1565.0, 2975.0, 7065.0, 21924.0, 84508.0, 336573.0, 425987.0, 117560.0, 29469.0, 8975.0, 3619.0, 1781.0, 980.0, 687.0, 458.0, 324.0, 263.0, 173.0, 130.0, 84.0, 68.0, 56.0, 46.0, 29.0, 26.0, 21.0, 18.0, 5.0, 7.0, 7.0, 5.0, 5.0, 3.0, 1.0, 2.0, 1.0], "bins": [-57.71875, -56.02685546875, -54.3349609375, -52.64306640625, -50.951171875, -49.25927734375, -47.5673828125, -45.87548828125, -44.18359375, -42.49169921875, -40.7998046875, -39.10791015625, -37.416015625, -35.72412109375, -34.0322265625, -32.34033203125, -30.6484375, -28.95654296875, -27.2646484375, -25.57275390625, -23.880859375, -22.18896484375, -20.4970703125, -18.80517578125, -17.11328125, -15.42138671875, -13.7294921875, -12.03759765625, -10.345703125, -8.65380859375, -6.9619140625, -5.27001953125, -3.578125, -1.88623046875, -0.1943359375, 1.49755859375, 3.189453125, 4.88134765625, 6.5732421875, 8.26513671875, 9.95703125, 11.64892578125, 13.3408203125, 15.03271484375, 16.724609375, 18.41650390625, 20.1083984375, 21.80029296875, 23.4921875, 25.18408203125, 26.8759765625, 28.56787109375, 30.259765625, 31.95166015625, 33.6435546875, 35.33544921875, 37.02734375, 38.71923828125, 40.4111328125, 42.10302734375, 43.794921875, 45.48681640625, 47.1787109375, 48.87060546875, 50.5625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 2.0, 3.0, 6.0, 10.0, 8.0, 15.0, 13.0, 17.0, 26.0, 27.0, 29.0, 22.0, 34.0, 46.0, 35.0, 53.0, 49.0, 41.0, 54.0, 49.0, 28.0, 42.0, 60.0, 47.0, 51.0, 25.0, 33.0, 25.0, 26.0, 24.0, 19.0, 13.0, 23.0, 10.0, 12.0, 7.0, 2.0, 10.0, 3.0, 6.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-74.1875, -71.953125, -69.71875, -67.484375, -65.25, -63.015625, -60.78125, -58.546875, -56.3125, -54.078125, -51.84375, -49.609375, -47.375, -45.140625, -42.90625, -40.671875, -38.4375, -36.203125, -33.96875, -31.734375, -29.5, -27.265625, -25.03125, -22.796875, -20.5625, -18.328125, -16.09375, -13.859375, -11.625, -9.390625, -7.15625, -4.921875, -2.6875, -0.453125, 1.78125, 4.015625, 6.25, 8.484375, 10.71875, 12.953125, 15.1875, 17.421875, 19.65625, 21.890625, 24.125, 26.359375, 28.59375, 30.828125, 33.0625, 35.296875, 37.53125, 39.765625, 42.0, 44.234375, 46.46875, 48.703125, 50.9375, 53.171875, 55.40625, 57.640625, 59.875, 62.109375, 64.34375, 66.578125, 68.8125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 4.0, 7.0, 11.0, 11.0, 22.0, 21.0, 56.0, 60.0, 86.0, 145.0, 222.0, 368.0, 575.0, 1029.0, 2002.0, 4395.0, 12061.0, 46392.0, 244882.0, 557161.0, 135381.0, 28356.0, 8300.0, 3312.0, 1487.0, 863.0, 493.0, 278.0, 181.0, 117.0, 81.0, 49.0, 32.0, 33.0, 17.0, 13.0, 11.0, 7.0, 6.0, 7.0, 7.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.921875, -25.094482421875, -24.26708984375, -23.439697265625, -22.6123046875, -21.784912109375, -20.95751953125, -20.130126953125, -19.302734375, -18.475341796875, -17.64794921875, -16.820556640625, -15.9931640625, -15.165771484375, -14.33837890625, -13.510986328125, -12.68359375, -11.856201171875, -11.02880859375, -10.201416015625, -9.3740234375, -8.546630859375, -7.71923828125, -6.891845703125, -6.064453125, -5.237060546875, -4.40966796875, -3.582275390625, -2.7548828125, -1.927490234375, -1.10009765625, -0.272705078125, 0.5546875, 1.382080078125, 2.20947265625, 3.036865234375, 3.8642578125, 4.691650390625, 5.51904296875, 6.346435546875, 7.173828125, 8.001220703125, 8.82861328125, 9.656005859375, 10.4833984375, 11.310791015625, 12.13818359375, 12.965576171875, 13.79296875, 14.620361328125, 15.44775390625, 16.275146484375, 17.1025390625, 17.929931640625, 18.75732421875, 19.584716796875, 20.412109375, 21.239501953125, 22.06689453125, 22.894287109375, 23.7216796875, 24.549072265625, 25.37646484375, 26.203857421875, 27.03125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 4.0, 4.0, 7.0, 4.0, 5.0, 9.0, 10.0, 13.0, 18.0, 21.0, 29.0, 29.0, 37.0, 49.0, 54.0, 56.0, 71.0, 94.0, 85.0, 67.0, 60.0, 51.0, 42.0, 33.0, 27.0, 28.0, 17.0, 19.0, 11.0, 6.0, 8.0, 3.0, 7.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.003204345703125, -0.003092348575592041, -0.002980351448059082, -0.002868354320526123, -0.002756357192993164, -0.002644360065460205, -0.002532362937927246, -0.002420365810394287, -0.002308368682861328, -0.002196371555328369, -0.00208437442779541, -0.001972377300262451, -0.0018603801727294922, -0.0017483830451965332, -0.0016363859176635742, -0.0015243887901306152, -0.0014123916625976562, -0.0013003945350646973, -0.0011883974075317383, -0.0010764002799987793, -0.0009644031524658203, -0.0008524060249328613, -0.0007404088973999023, -0.0006284117698669434, -0.0005164146423339844, -0.0004044175148010254, -0.0002924203872680664, -0.00018042325973510742, -6.842613220214844e-05, 4.357099533081055e-05, 0.00015556812286376953, 0.0002675652503967285, 0.0003795623779296875, 0.0004915595054626465, 0.0006035566329956055, 0.0007155537605285645, 0.0008275508880615234, 0.0009395480155944824, 0.0010515451431274414, 0.0011635422706604004, 0.0012755393981933594, 0.0013875365257263184, 0.0014995336532592773, 0.0016115307807922363, 0.0017235279083251953, 0.0018355250358581543, 0.0019475221633911133, 0.0020595192909240723, 0.0021715164184570312, 0.0022835135459899902, 0.0023955106735229492, 0.002507507801055908, 0.002619504928588867, 0.002731502056121826, 0.002843499183654785, 0.002955496311187744, 0.003067493438720703, 0.003179490566253662, 0.003291487693786621, 0.00340348482131958, 0.003515481948852539, 0.003627479076385498, 0.003739476203918457, 0.003851473331451416, 0.003963470458984375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 4.0, 5.0, 9.0, 9.0, 17.0, 24.0, 42.0, 58.0, 102.0, 195.0, 361.0, 781.0, 1999.0, 6420.0, 41046.0, 576527.0, 384960.0, 27773.0, 5079.0, 1664.0, 741.0, 335.0, 155.0, 105.0, 49.0, 29.0, 19.0, 15.0, 7.0, 8.0, 3.0, 8.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-47.75, -46.38232421875, -45.0146484375, -43.64697265625, -42.279296875, -40.91162109375, -39.5439453125, -38.17626953125, -36.80859375, -35.44091796875, -34.0732421875, -32.70556640625, -31.337890625, -29.97021484375, -28.6025390625, -27.23486328125, -25.8671875, -24.49951171875, -23.1318359375, -21.76416015625, -20.396484375, -19.02880859375, -17.6611328125, -16.29345703125, -14.92578125, -13.55810546875, -12.1904296875, -10.82275390625, -9.455078125, -8.08740234375, -6.7197265625, -5.35205078125, -3.984375, -2.61669921875, -1.2490234375, 0.11865234375, 1.486328125, 2.85400390625, 4.2216796875, 5.58935546875, 6.95703125, 8.32470703125, 9.6923828125, 11.06005859375, 12.427734375, 13.79541015625, 15.1630859375, 16.53076171875, 17.8984375, 19.26611328125, 20.6337890625, 22.00146484375, 23.369140625, 24.73681640625, 26.1044921875, 27.47216796875, 28.83984375, 30.20751953125, 31.5751953125, 32.94287109375, 34.310546875, 35.67822265625, 37.0458984375, 38.41357421875, 39.78125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 11.0, 5.0, 7.0, 4.0, 18.0, 17.0, 26.0, 39.0, 62.0, 66.0, 93.0, 88.0, 115.0, 97.0, 84.0, 68.0, 54.0, 38.0, 27.0, 17.0, 23.0, 15.0, 10.0, 12.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.984375, -30.976318359375, -29.96826171875, -28.960205078125, -27.9521484375, -26.944091796875, -25.93603515625, -24.927978515625, -23.919921875, -22.911865234375, -21.90380859375, -20.895751953125, -19.8876953125, -18.879638671875, -17.87158203125, -16.863525390625, -15.85546875, -14.847412109375, -13.83935546875, -12.831298828125, -11.8232421875, -10.815185546875, -9.80712890625, -8.799072265625, -7.791015625, -6.782958984375, -5.77490234375, -4.766845703125, -3.7587890625, -2.750732421875, -1.74267578125, -0.734619140625, 0.2734375, 1.281494140625, 2.28955078125, 3.297607421875, 4.3056640625, 5.313720703125, 6.32177734375, 7.329833984375, 8.337890625, 9.345947265625, 10.35400390625, 11.362060546875, 12.3701171875, 13.378173828125, 14.38623046875, 15.394287109375, 16.40234375, 17.410400390625, 18.41845703125, 19.426513671875, 20.4345703125, 21.442626953125, 22.45068359375, 23.458740234375, 24.466796875, 25.474853515625, 26.48291015625, 27.490966796875, 28.4990234375, 29.507080078125, 30.51513671875, 31.523193359375, 32.53125]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 8.0, 8.0, 35.0, 83.0, 114.0, 208.0, 207.0, 152.0, 101.0, 38.0, 32.0, 4.0, 10.0, 4.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-259.57855224609375, -233.72531127929688, -207.87208557128906, -182.01885986328125, -156.16561889648438, -130.3123779296875, -104.45915222167969, -78.60592651367188, -52.752685546875, -26.899452209472656, -1.0462188720703125, 24.80701446533203, 50.660247802734375, 76.51348876953125, 102.36671447753906, 128.21994018554688, 154.07318115234375, 179.92642211914062, 205.77964782714844, 231.63287353515625, 257.4861145019531, 283.33935546875, 309.19256591796875, 335.0458068847656, 360.8990478515625, 386.7522888183594, 412.60552978515625, 438.458740234375, 464.3119812011719, 490.16522216796875, 516.0184326171875, 541.8717041015625, 567.724853515625, 593.5780639648438, 619.4313354492188, 645.2845458984375, 671.1378173828125, 696.9910278320312, 722.84423828125, 748.697509765625, 774.5507202148438, 800.4039306640625, 826.2572021484375, 852.1104125976562, 877.963623046875, 903.81689453125, 929.6701049804688, 955.5233154296875, 981.3765869140625, 1007.2297973632812, 1033.0830078125, 1058.936279296875, 1084.78955078125, 1110.642822265625, 1136.4959716796875, 1162.3492431640625, 1188.202392578125, 1214.0556640625, 1239.9088134765625, 1265.7620849609375, 1291.6153564453125, 1317.468505859375, 1343.32177734375, 1369.175048828125, 1395.0283203125]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 6.0, 2.0, 7.0, 7.0, 7.0, 11.0, 15.0, 16.0, 13.0, 17.0, 16.0, 12.0, 29.0, 22.0, 26.0, 43.0, 28.0, 35.0, 48.0, 42.0, 34.0, 40.0, 42.0, 50.0, 44.0, 23.0, 43.0, 38.0, 37.0, 30.0, 35.0, 21.0, 26.0, 23.0, 19.0, 20.0, 8.0, 9.0, 10.0, 8.0, 5.0, 8.0, 6.0, 6.0, 1.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 5.0, 1.0, 0.0, 0.0, 1.0], "bins": [-272.5573425292969, -263.57769775390625, -254.59808349609375, -245.6184539794922, -236.63882446289062, -227.65919494628906, -218.6795654296875, -209.69993591308594, -200.72030639648438, -191.7406768798828, -182.76104736328125, -173.7814178466797, -164.80178833007812, -155.82215881347656, -146.842529296875, -137.86289978027344, -128.88327026367188, -119.90364074707031, -110.92401123046875, -101.94438171386719, -92.96475219726562, -83.98512268066406, -75.0054931640625, -66.02586364746094, -57.046234130859375, -48.06660461425781, -39.08697509765625, -30.107345581054688, -21.127716064453125, -12.148086547851562, -3.16845703125, 5.8111724853515625, 14.790802001953125, 23.770431518554688, 32.75006103515625, 41.72969055175781, 50.709320068359375, 59.68894958496094, 68.6685791015625, 77.64820861816406, 86.62783813476562, 95.60746765136719, 104.58709716796875, 113.56672668457031, 122.54635620117188, 131.52598571777344, 140.505615234375, 149.48524475097656, 158.46487426757812, 167.4445037841797, 176.42413330078125, 185.4037628173828, 194.38339233398438, 203.36302185058594, 212.3426513671875, 221.32228088378906, 230.30191040039062, 239.2815399169922, 248.26116943359375, 257.24078369140625, 266.2204284667969, 275.2000732421875, 284.1796875, 293.1593017578125, 302.1389465332031]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 2.0, 2.0, 0.0, 8.0, 8.0, 5.0, 9.0, 14.0, 22.0, 42.0, 57.0, 79.0, 126.0, 192.0, 308.0, 551.0, 1148.0, 2889.0, 7971.0, 36371.0, 4096517.0, 34724.0, 7878.0, 2758.0, 1205.0, 553.0, 313.0, 169.0, 111.0, 78.0, 58.0, 42.0, 20.0, 16.0, 13.0, 9.0, 10.0, 7.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-124.3125, -120.2353515625, -116.158203125, -112.0810546875, -108.00390625, -103.9267578125, -99.849609375, -95.7724609375, -91.6953125, -87.6181640625, -83.541015625, -79.4638671875, -75.38671875, -71.3095703125, -67.232421875, -63.1552734375, -59.078125, -55.0009765625, -50.923828125, -46.8466796875, -42.76953125, -38.6923828125, -34.615234375, -30.5380859375, -26.4609375, -22.3837890625, -18.306640625, -14.2294921875, -10.15234375, -6.0751953125, -1.998046875, 2.0791015625, 6.15625, 10.2333984375, 14.310546875, 18.3876953125, 22.46484375, 26.5419921875, 30.619140625, 34.6962890625, 38.7734375, 42.8505859375, 46.927734375, 51.0048828125, 55.08203125, 59.1591796875, 63.236328125, 67.3134765625, 71.390625, 75.4677734375, 79.544921875, 83.6220703125, 87.69921875, 91.7763671875, 95.853515625, 99.9306640625, 104.0078125, 108.0849609375, 112.162109375, 116.2392578125, 120.31640625, 124.3935546875, 128.470703125, 132.5478515625, 136.625]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 6.0, 3.0, 6.0, 8.0, 5.0, 7.0, 14.0, 12.0, 16.0, 27.0, 32.0, 35.0, 43.0, 49.0, 42.0, 39.0, 60.0, 52.0, 64.0, 59.0, 52.0, 47.0, 72.0, 30.0, 34.0, 23.0, 31.0, 26.0, 21.0, 18.0, 10.0, 15.0, 11.0, 9.0, 4.0, 7.0, 3.0, 2.0, 4.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.09375, -19.4970703125, -18.900390625, -18.3037109375, -17.70703125, -17.1103515625, -16.513671875, -15.9169921875, -15.3203125, -14.7236328125, -14.126953125, -13.5302734375, -12.93359375, -12.3369140625, -11.740234375, -11.1435546875, -10.546875, -9.9501953125, -9.353515625, -8.7568359375, -8.16015625, -7.5634765625, -6.966796875, -6.3701171875, -5.7734375, -5.1767578125, -4.580078125, -3.9833984375, -3.38671875, -2.7900390625, -2.193359375, -1.5966796875, -1.0, -0.4033203125, 0.193359375, 0.7900390625, 1.38671875, 1.9833984375, 2.580078125, 3.1767578125, 3.7734375, 4.3701171875, 4.966796875, 5.5634765625, 6.16015625, 6.7568359375, 7.353515625, 7.9501953125, 8.546875, 9.1435546875, 9.740234375, 10.3369140625, 10.93359375, 11.5302734375, 12.126953125, 12.7236328125, 13.3203125, 13.9169921875, 14.513671875, 15.1103515625, 15.70703125, 16.3037109375, 16.900390625, 17.4970703125, 18.09375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 9.0, 13.0, 20.0, 15.0, 28.0, 18.0, 29.0, 31.0, 45.0, 48.0, 67.0, 107.0, 180.0, 346.0, 803.0, 2255.0, 7594.0, 48189.0, 4098783.0, 26967.0, 5455.0, 1765.0, 658.0, 277.0, 164.0, 105.0, 48.0, 40.0, 43.0, 43.0, 28.0, 22.0, 17.0, 19.0, 11.0, 10.0, 8.0, 11.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-142.625, -138.080078125, -133.53515625, -128.990234375, -124.4453125, -119.900390625, -115.35546875, -110.810546875, -106.265625, -101.720703125, -97.17578125, -92.630859375, -88.0859375, -83.541015625, -78.99609375, -74.451171875, -69.90625, -65.361328125, -60.81640625, -56.271484375, -51.7265625, -47.181640625, -42.63671875, -38.091796875, -33.546875, -29.001953125, -24.45703125, -19.912109375, -15.3671875, -10.822265625, -6.27734375, -1.732421875, 2.8125, 7.357421875, 11.90234375, 16.447265625, 20.9921875, 25.537109375, 30.08203125, 34.626953125, 39.171875, 43.716796875, 48.26171875, 52.806640625, 57.3515625, 61.896484375, 66.44140625, 70.986328125, 75.53125, 80.076171875, 84.62109375, 89.166015625, 93.7109375, 98.255859375, 102.80078125, 107.345703125, 111.890625, 116.435546875, 120.98046875, 125.525390625, 130.0703125, 134.615234375, 139.16015625, 143.705078125, 148.25]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 5.0, 7.0, 7.0, 8.0, 13.0, 28.0, 68.0, 3608.0, 259.0, 37.0, 14.0, 9.0, 6.0, 5.0, 5.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.9375, -35.8134765625, -34.689453125, -33.5654296875, -32.44140625, -31.3173828125, -30.193359375, -29.0693359375, -27.9453125, -26.8212890625, -25.697265625, -24.5732421875, -23.44921875, -22.3251953125, -21.201171875, -20.0771484375, -18.953125, -17.8291015625, -16.705078125, -15.5810546875, -14.45703125, -13.3330078125, -12.208984375, -11.0849609375, -9.9609375, -8.8369140625, -7.712890625, -6.5888671875, -5.46484375, -4.3408203125, -3.216796875, -2.0927734375, -0.96875, 0.1552734375, 1.279296875, 2.4033203125, 3.52734375, 4.6513671875, 5.775390625, 6.8994140625, 8.0234375, 9.1474609375, 10.271484375, 11.3955078125, 12.51953125, 13.6435546875, 14.767578125, 15.8916015625, 17.015625, 18.1396484375, 19.263671875, 20.3876953125, 21.51171875, 22.6357421875, 23.759765625, 24.8837890625, 26.0078125, 27.1318359375, 28.255859375, 29.3798828125, 30.50390625, 31.6279296875, 32.751953125, 33.8759765625, 35.0]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 5.0, 5.0, 12.0, 44.0, 72.0, 178.0, 274.0, 228.0, 102.0, 51.0, 26.0, 8.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-118.46912384033203, -113.3116683959961, -108.15421295166016, -102.99675750732422, -97.83930206298828, -92.68184661865234, -87.52439880371094, -82.366943359375, -77.20948791503906, -72.05203247070312, -66.89457702636719, -61.73712158203125, -56.57966613769531, -51.422210693359375, -46.2647590637207, -41.107303619384766, -35.94984436035156, -30.792388916015625, -25.634933471679688, -20.477479934692383, -15.320024490356445, -10.162569046020508, -5.005115509033203, 0.15233993530273438, 5.309795379638672, 10.46725082397461, 15.62470531463623, 20.78215980529785, 25.93961524963379, 31.097070693969727, 36.25452423095703, 41.41197967529297, 46.569427490234375, 51.72688293457031, 56.88433837890625, 62.04179382324219, 67.19924926757812, 72.35670471191406, 77.51416015625, 82.67161560058594, 87.82907104492188, 92.98652648925781, 98.14398193359375, 103.30143737792969, 108.45889282226562, 113.61634826660156, 118.7738037109375, 123.93125915527344, 129.08871459960938, 134.2461700439453, 139.40362548828125, 144.5610809326172, 149.71853637695312, 154.87599182128906, 160.033447265625, 165.19090270996094, 170.3483428955078, 175.50579833984375, 180.6632537841797, 185.82070922851562, 190.97816467285156, 196.1356201171875, 201.29307556152344, 206.45053100585938, 211.6079864501953]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 1.0, 3.0, 5.0, 7.0, 10.0, 10.0, 8.0, 13.0, 12.0, 15.0, 18.0, 20.0, 32.0, 31.0, 33.0, 33.0, 36.0, 34.0, 30.0, 34.0, 46.0, 34.0, 41.0, 46.0, 30.0, 35.0, 36.0, 45.0, 39.0, 26.0, 32.0, 26.0, 24.0, 26.0, 29.0, 13.0, 17.0, 16.0, 15.0, 13.0, 4.0, 7.0, 8.0, 4.0, 6.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-40.481239318847656, -39.245887756347656, -38.01053237915039, -36.77518081665039, -35.539825439453125, -34.304473876953125, -33.06911849975586, -31.83376693725586, -30.598411560058594, -29.36305809020996, -28.127704620361328, -26.892351150512695, -25.656997680664062, -24.42164421081543, -23.186290740966797, -21.950939178466797, -20.715585708618164, -19.48023223876953, -18.2448787689209, -17.009525299072266, -15.774171829223633, -14.538818359375, -13.303465843200684, -12.06811237335205, -10.832758903503418, -9.597405433654785, -8.362051963806152, -7.126698970794678, -5.891345500946045, -4.655992031097412, -3.4206390380859375, -2.1852855682373047, -0.9499320983886719, 0.2854212522506714, 1.5207746028900146, 2.7561278343200684, 3.991481304168701, 5.226834774017334, 6.462187767028809, 7.697541236877441, 8.932894706726074, 10.168248176574707, 11.40360164642334, 12.638954162597656, 13.874307632446289, 15.109661102294922, 16.345014572143555, 17.580368041992188, 18.81572151184082, 20.051074981689453, 21.286428451538086, 22.52178192138672, 23.75713539123535, 24.992488861083984, 26.227840423583984, 27.46319580078125, 28.69854736328125, 29.933900833129883, 31.169254302978516, 32.404605865478516, 33.63996124267578, 34.87531280517578, 36.11066818237305, 37.34601974487305, 38.58137512207031]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 1.0, 5.0, 5.0, 4.0, 12.0, 9.0, 15.0, 18.0, 27.0, 36.0, 48.0, 85.0, 110.0, 156.0, 234.0, 391.0, 648.0, 1121.0, 2286.0, 4813.0, 10972.0, 27369.0, 69740.0, 173911.0, 319887.0, 251223.0, 111116.0, 43261.0, 17017.0, 7080.0, 3108.0, 1583.0, 809.0, 486.0, 344.0, 187.0, 133.0, 90.0, 50.0, 44.0, 29.0, 29.0, 18.0, 12.0, 7.0, 10.0, 5.0, 5.0, 4.0, 2.0, 2.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-42.75, -41.4033203125, -40.056640625, -38.7099609375, -37.36328125, -36.0166015625, -34.669921875, -33.3232421875, -31.9765625, -30.6298828125, -29.283203125, -27.9365234375, -26.58984375, -25.2431640625, -23.896484375, -22.5498046875, -21.203125, -19.8564453125, -18.509765625, -17.1630859375, -15.81640625, -14.4697265625, -13.123046875, -11.7763671875, -10.4296875, -9.0830078125, -7.736328125, -6.3896484375, -5.04296875, -3.6962890625, -2.349609375, -1.0029296875, 0.34375, 1.6904296875, 3.037109375, 4.3837890625, 5.73046875, 7.0771484375, 8.423828125, 9.7705078125, 11.1171875, 12.4638671875, 13.810546875, 15.1572265625, 16.50390625, 17.8505859375, 19.197265625, 20.5439453125, 21.890625, 23.2373046875, 24.583984375, 25.9306640625, 27.27734375, 28.6240234375, 29.970703125, 31.3173828125, 32.6640625, 34.0107421875, 35.357421875, 36.7041015625, 38.05078125, 39.3974609375, 40.744140625, 42.0908203125, 43.4375]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 6.0, 7.0, 3.0, 5.0, 9.0, 4.0, 14.0, 15.0, 18.0, 14.0, 30.0, 36.0, 35.0, 34.0, 43.0, 34.0, 36.0, 47.0, 45.0, 67.0, 50.0, 73.0, 52.0, 44.0, 29.0, 39.0, 25.0, 33.0, 29.0, 22.0, 16.0, 13.0, 13.0, 17.0, 10.0, 6.0, 9.0, 6.0, 3.0, 4.0, 0.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-19.53125, -18.93896484375, -18.3466796875, -17.75439453125, -17.162109375, -16.56982421875, -15.9775390625, -15.38525390625, -14.79296875, -14.20068359375, -13.6083984375, -13.01611328125, -12.423828125, -11.83154296875, -11.2392578125, -10.64697265625, -10.0546875, -9.46240234375, -8.8701171875, -8.27783203125, -7.685546875, -7.09326171875, -6.5009765625, -5.90869140625, -5.31640625, -4.72412109375, -4.1318359375, -3.53955078125, -2.947265625, -2.35498046875, -1.7626953125, -1.17041015625, -0.578125, 0.01416015625, 0.6064453125, 1.19873046875, 1.791015625, 2.38330078125, 2.9755859375, 3.56787109375, 4.16015625, 4.75244140625, 5.3447265625, 5.93701171875, 6.529296875, 7.12158203125, 7.7138671875, 8.30615234375, 8.8984375, 9.49072265625, 10.0830078125, 10.67529296875, 11.267578125, 11.85986328125, 12.4521484375, 13.04443359375, 13.63671875, 14.22900390625, 14.8212890625, 15.41357421875, 16.005859375, 16.59814453125, 17.1904296875, 17.78271484375, 18.375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 6.0, 9.0, 8.0, 14.0, 17.0, 23.0, 33.0, 54.0, 61.0, 96.0, 118.0, 173.0, 250.0, 405.0, 549.0, 949.0, 1542.0, 3724.0, 13276.0, 77720.0, 522283.0, 359805.0, 51097.0, 9656.0, 2943.0, 1369.0, 773.0, 504.0, 334.0, 212.0, 165.0, 99.0, 76.0, 56.0, 46.0, 28.0, 23.0, 15.0, 15.0, 7.0, 11.0, 6.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-72.125, -69.7900390625, -67.455078125, -65.1201171875, -62.78515625, -60.4501953125, -58.115234375, -55.7802734375, -53.4453125, -51.1103515625, -48.775390625, -46.4404296875, -44.10546875, -41.7705078125, -39.435546875, -37.1005859375, -34.765625, -32.4306640625, -30.095703125, -27.7607421875, -25.42578125, -23.0908203125, -20.755859375, -18.4208984375, -16.0859375, -13.7509765625, -11.416015625, -9.0810546875, -6.74609375, -4.4111328125, -2.076171875, 0.2587890625, 2.59375, 4.9287109375, 7.263671875, 9.5986328125, 11.93359375, 14.2685546875, 16.603515625, 18.9384765625, 21.2734375, 23.6083984375, 25.943359375, 28.2783203125, 30.61328125, 32.9482421875, 35.283203125, 37.6181640625, 39.953125, 42.2880859375, 44.623046875, 46.9580078125, 49.29296875, 51.6279296875, 53.962890625, 56.2978515625, 58.6328125, 60.9677734375, 63.302734375, 65.6376953125, 67.97265625, 70.3076171875, 72.642578125, 74.9775390625, 77.3125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 2.0, 1.0, 4.0, 13.0, 8.0, 10.0, 8.0, 15.0, 17.0, 13.0, 20.0, 32.0, 31.0, 26.0, 42.0, 41.0, 26.0, 31.0, 41.0, 52.0, 56.0, 49.0, 39.0, 49.0, 51.0, 47.0, 41.0, 36.0, 29.0, 26.0, 18.0, 17.0, 23.0, 18.0, 23.0, 13.0, 9.0, 11.0, 5.0, 3.0, 0.0, 6.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-86.0625, -83.4873046875, -80.912109375, -78.3369140625, -75.76171875, -73.1865234375, -70.611328125, -68.0361328125, -65.4609375, -62.8857421875, -60.310546875, -57.7353515625, -55.16015625, -52.5849609375, -50.009765625, -47.4345703125, -44.859375, -42.2841796875, -39.708984375, -37.1337890625, -34.55859375, -31.9833984375, -29.408203125, -26.8330078125, -24.2578125, -21.6826171875, -19.107421875, -16.5322265625, -13.95703125, -11.3818359375, -8.806640625, -6.2314453125, -3.65625, -1.0810546875, 1.494140625, 4.0693359375, 6.64453125, 9.2197265625, 11.794921875, 14.3701171875, 16.9453125, 19.5205078125, 22.095703125, 24.6708984375, 27.24609375, 29.8212890625, 32.396484375, 34.9716796875, 37.546875, 40.1220703125, 42.697265625, 45.2724609375, 47.84765625, 50.4228515625, 52.998046875, 55.5732421875, 58.1484375, 60.7236328125, 63.298828125, 65.8740234375, 68.44921875, 71.0244140625, 73.599609375, 76.1748046875, 78.75]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 6.0, 6.0, 7.0, 6.0, 5.0, 11.0, 18.0, 15.0, 16.0, 26.0, 17.0, 35.0, 36.0, 85.0, 86.0, 149.0, 204.0, 408.0, 917.0, 2940.0, 15225.0, 265928.0, 725751.0, 29529.0, 4531.0, 1296.0, 483.0, 265.0, 148.0, 106.0, 62.0, 58.0, 39.0, 32.0, 22.0, 17.0, 17.0, 13.0, 16.0, 10.0, 5.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0], "bins": [-74.8125, -72.6220703125, -70.431640625, -68.2412109375, -66.05078125, -63.8603515625, -61.669921875, -59.4794921875, -57.2890625, -55.0986328125, -52.908203125, -50.7177734375, -48.52734375, -46.3369140625, -44.146484375, -41.9560546875, -39.765625, -37.5751953125, -35.384765625, -33.1943359375, -31.00390625, -28.8134765625, -26.623046875, -24.4326171875, -22.2421875, -20.0517578125, -17.861328125, -15.6708984375, -13.48046875, -11.2900390625, -9.099609375, -6.9091796875, -4.71875, -2.5283203125, -0.337890625, 1.8525390625, 4.04296875, 6.2333984375, 8.423828125, 10.6142578125, 12.8046875, 14.9951171875, 17.185546875, 19.3759765625, 21.56640625, 23.7568359375, 25.947265625, 28.1376953125, 30.328125, 32.5185546875, 34.708984375, 36.8994140625, 39.08984375, 41.2802734375, 43.470703125, 45.6611328125, 47.8515625, 50.0419921875, 52.232421875, 54.4228515625, 56.61328125, 58.8037109375, 60.994140625, 63.1845703125, 65.375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 3.0, 6.0, 4.0, 9.0, 13.0, 15.0, 34.0, 35.0, 69.0, 123.0, 159.0, 156.0, 132.0, 80.0, 59.0, 35.0, 19.0, 19.0, 12.0, 3.0, 6.0, 6.0, 5.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00930023193359375, -0.009020805358886719, -0.008741378784179688, -0.008461952209472656, -0.008182525634765625, -0.007903099060058594, -0.0076236724853515625, -0.007344245910644531, -0.0070648193359375, -0.006785392761230469, -0.0065059661865234375, -0.006226539611816406, -0.005947113037109375, -0.005667686462402344, -0.0053882598876953125, -0.005108833312988281, -0.00482940673828125, -0.004549980163574219, -0.0042705535888671875, -0.003991127014160156, -0.003711700439453125, -0.0034322738647460938, -0.0031528472900390625, -0.0028734207153320312, -0.002593994140625, -0.0023145675659179688, -0.0020351409912109375, -0.0017557144165039062, -0.001476287841796875, -0.0011968612670898438, -0.0009174346923828125, -0.0006380081176757812, -0.00035858154296875, -7.915496826171875e-05, 0.0002002716064453125, 0.00047969818115234375, 0.000759124755859375, 0.0010385513305664062, 0.0013179779052734375, 0.0015974044799804688, 0.0018768310546875, 0.0021562576293945312, 0.0024356842041015625, 0.0027151107788085938, 0.002994537353515625, 0.0032739639282226562, 0.0035533905029296875, 0.0038328170776367188, 0.00411224365234375, 0.004391670227050781, 0.0046710968017578125, 0.004950523376464844, 0.005229949951171875, 0.005509376525878906, 0.0057888031005859375, 0.006068229675292969, 0.00634765625, 0.006627082824707031, 0.0069065093994140625, 0.007185935974121094, 0.007465362548828125, 0.007744789123535156, 0.008024215698242188, 0.008303642272949219, 0.00858306884765625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 11.0, 8.0, 9.0, 18.0, 26.0, 39.0, 38.0, 55.0, 64.0, 136.0, 239.0, 463.0, 1039.0, 2624.0, 9700.0, 71910.0, 842647.0, 102289.0, 11890.0, 3077.0, 1102.0, 500.0, 251.0, 149.0, 84.0, 54.0, 45.0, 22.0, 19.0, 11.0, 9.0, 9.0, 3.0, 2.0, 5.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-70.75, -68.5771484375, -66.404296875, -64.2314453125, -62.05859375, -59.8857421875, -57.712890625, -55.5400390625, -53.3671875, -51.1943359375, -49.021484375, -46.8486328125, -44.67578125, -42.5029296875, -40.330078125, -38.1572265625, -35.984375, -33.8115234375, -31.638671875, -29.4658203125, -27.29296875, -25.1201171875, -22.947265625, -20.7744140625, -18.6015625, -16.4287109375, -14.255859375, -12.0830078125, -9.91015625, -7.7373046875, -5.564453125, -3.3916015625, -1.21875, 0.9541015625, 3.126953125, 5.2998046875, 7.47265625, 9.6455078125, 11.818359375, 13.9912109375, 16.1640625, 18.3369140625, 20.509765625, 22.6826171875, 24.85546875, 27.0283203125, 29.201171875, 31.3740234375, 33.546875, 35.7197265625, 37.892578125, 40.0654296875, 42.23828125, 44.4111328125, 46.583984375, 48.7568359375, 50.9296875, 53.1025390625, 55.275390625, 57.4482421875, 59.62109375, 61.7939453125, 63.966796875, 66.1396484375, 68.3125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 8.0, 9.0, 12.0, 7.0, 20.0, 23.0, 29.0, 45.0, 52.0, 73.0, 76.0, 129.0, 120.0, 99.0, 75.0, 59.0, 50.0, 34.0, 24.0, 5.0, 14.0, 7.0, 5.0, 3.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.75, -34.19873046875, -32.6474609375, -31.09619140625, -29.544921875, -27.99365234375, -26.4423828125, -24.89111328125, -23.33984375, -21.78857421875, -20.2373046875, -18.68603515625, -17.134765625, -15.58349609375, -14.0322265625, -12.48095703125, -10.9296875, -9.37841796875, -7.8271484375, -6.27587890625, -4.724609375, -3.17333984375, -1.6220703125, -0.07080078125, 1.48046875, 3.03173828125, 4.5830078125, 6.13427734375, 7.685546875, 9.23681640625, 10.7880859375, 12.33935546875, 13.890625, 15.44189453125, 16.9931640625, 18.54443359375, 20.095703125, 21.64697265625, 23.1982421875, 24.74951171875, 26.30078125, 27.85205078125, 29.4033203125, 30.95458984375, 32.505859375, 34.05712890625, 35.6083984375, 37.15966796875, 38.7109375, 40.26220703125, 41.8134765625, 43.36474609375, 44.916015625, 46.46728515625, 48.0185546875, 49.56982421875, 51.12109375, 52.67236328125, 54.2236328125, 55.77490234375, 57.326171875, 58.87744140625, 60.4287109375, 61.97998046875, 63.53125]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 9.0, 27.0, 91.0, 199.0, 315.0, 216.0, 92.0, 37.0, 6.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-855.9484252929688, -816.4798583984375, -777.01123046875, -737.5426635742188, -698.0740966796875, -658.60546875, -619.1369018554688, -579.6683349609375, -540.19970703125, -500.7311096191406, -461.26251220703125, -421.7939453125, -382.3253479003906, -342.85675048828125, -303.38818359375, -263.9195861816406, -224.45098876953125, -184.98239135742188, -145.51380920410156, -106.04521942138672, -66.57662963867188, -27.1080322265625, 12.360549926757812, 51.829132080078125, 91.2977294921875, 130.76632690429688, 170.2349090576172, 209.7034912109375, 249.17208862304688, 288.64068603515625, 328.1092529296875, 367.5778503417969, 407.0465087890625, 446.5151062011719, 485.98370361328125, 525.4522705078125, 564.9208984375, 604.3894653320312, 643.8580322265625, 683.32666015625, 722.7952270507812, 762.2637939453125, 801.732421875, 841.2009887695312, 880.6695556640625, 920.13818359375, 959.6067504882812, 999.0753173828125, 1038.5439453125, 1078.0125732421875, 1117.4810791015625, 1156.94970703125, 1196.4183349609375, 1235.886962890625, 1275.35546875, 1314.8240966796875, 1354.292724609375, 1393.7613525390625, 1433.2298583984375, 1472.698486328125, 1512.1671142578125, 1551.6357421875, 1591.104248046875, 1630.5728759765625, 1670.0413818359375]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 2.0, 8.0, 6.0, 8.0, 7.0, 6.0, 14.0, 11.0, 14.0, 16.0, 23.0, 25.0, 22.0, 34.0, 36.0, 28.0, 39.0, 37.0, 39.0, 48.0, 38.0, 41.0, 40.0, 65.0, 37.0, 46.0, 40.0, 41.0, 30.0, 33.0, 33.0, 19.0, 25.0, 12.0, 13.0, 12.0, 9.0, 13.0, 5.0, 5.0, 7.0, 4.0, 2.0, 0.0, 3.0, 2.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-381.6477355957031, -369.9373779296875, -358.2270202636719, -346.51666259765625, -334.80633544921875, -323.0959777832031, -311.3856201171875, -299.6752624511719, -287.96490478515625, -276.2545471191406, -264.544189453125, -252.83384704589844, -241.12350463867188, -229.41314697265625, -217.70278930664062, -205.992431640625, -194.2821044921875, -182.57174682617188, -170.8614044189453, -159.1510467529297, -147.44070434570312, -135.7303466796875, -124.01998901367188, -112.30963897705078, -100.59928894042969, -88.8889389038086, -77.1785888671875, -65.46823120117188, -53.75788116455078, -42.04753112792969, -30.337173461914062, -18.62682342529297, -6.91650390625, 4.793848037719727, 16.504199981689453, 28.214553833007812, 39.924903869628906, 51.63525390625, 63.345611572265625, 75.05596160888672, 86.76631164550781, 98.4766616821289, 110.18701171875, 121.89736938476562, 133.60772705078125, 145.3180694580078, 157.02842712402344, 168.73876953125, 180.44912719726562, 192.15948486328125, 203.8698272705078, 215.58018493652344, 227.29052734375, 239.00088500976562, 250.71124267578125, 262.4216003417969, 274.1319580078125, 285.8423156738281, 297.55267333984375, 309.26300048828125, 320.9733581542969, 332.6837158203125, 344.3940734863281, 356.10443115234375, 367.81475830078125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 0.0, 4.0, 1.0, 3.0, 5.0, 9.0, 12.0, 22.0, 39.0, 46.0, 86.0, 125.0, 241.0, 365.0, 771.0, 1657.0, 3946.0, 11590.0, 52905.0, 4039562.0, 62431.0, 12598.0, 4269.0, 1754.0, 803.0, 438.0, 221.0, 136.0, 83.0, 57.0, 37.0, 26.0, 13.0, 8.0, 7.0, 3.0, 6.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-86.0625, -83.244140625, -80.42578125, -77.607421875, -74.7890625, -71.970703125, -69.15234375, -66.333984375, -63.515625, -60.697265625, -57.87890625, -55.060546875, -52.2421875, -49.423828125, -46.60546875, -43.787109375, -40.96875, -38.150390625, -35.33203125, -32.513671875, -29.6953125, -26.876953125, -24.05859375, -21.240234375, -18.421875, -15.603515625, -12.78515625, -9.966796875, -7.1484375, -4.330078125, -1.51171875, 1.306640625, 4.125, 6.943359375, 9.76171875, 12.580078125, 15.3984375, 18.216796875, 21.03515625, 23.853515625, 26.671875, 29.490234375, 32.30859375, 35.126953125, 37.9453125, 40.763671875, 43.58203125, 46.400390625, 49.21875, 52.037109375, 54.85546875, 57.673828125, 60.4921875, 63.310546875, 66.12890625, 68.947265625, 71.765625, 74.583984375, 77.40234375, 80.220703125, 83.0390625, 85.857421875, 88.67578125, 91.494140625, 94.3125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 5.0, 3.0, 8.0, 6.0, 10.0, 17.0, 13.0, 20.0, 25.0, 27.0, 47.0, 59.0, 46.0, 45.0, 56.0, 59.0, 62.0, 66.0, 62.0, 65.0, 55.0, 43.0, 33.0, 33.0, 23.0, 24.0, 21.0, 15.0, 14.0, 8.0, 9.0, 6.0, 5.0, 3.0, 6.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.984375, -17.266845703125, -16.54931640625, -15.831787109375, -15.1142578125, -14.396728515625, -13.67919921875, -12.961669921875, -12.244140625, -11.526611328125, -10.80908203125, -10.091552734375, -9.3740234375, -8.656494140625, -7.93896484375, -7.221435546875, -6.50390625, -5.786376953125, -5.06884765625, -4.351318359375, -3.6337890625, -2.916259765625, -2.19873046875, -1.481201171875, -0.763671875, -0.046142578125, 0.67138671875, 1.388916015625, 2.1064453125, 2.823974609375, 3.54150390625, 4.259033203125, 4.9765625, 5.694091796875, 6.41162109375, 7.129150390625, 7.8466796875, 8.564208984375, 9.28173828125, 9.999267578125, 10.716796875, 11.434326171875, 12.15185546875, 12.869384765625, 13.5869140625, 14.304443359375, 15.02197265625, 15.739501953125, 16.45703125, 17.174560546875, 17.89208984375, 18.609619140625, 19.3271484375, 20.044677734375, 20.76220703125, 21.479736328125, 22.197265625, 22.914794921875, 23.63232421875, 24.349853515625, 25.0673828125, 25.784912109375, 26.50244140625, 27.219970703125, 27.9375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 5.0, 5.0, 7.0, 12.0, 17.0, 17.0, 22.0, 27.0, 41.0, 67.0, 76.0, 112.0, 170.0, 248.0, 334.0, 494.0, 697.0, 1196.0, 2048.0, 3968.0, 9200.0, 30140.0, 462443.0, 3626826.0, 35440.0, 10302.0, 4297.0, 2241.0, 1309.0, 814.0, 503.0, 350.0, 243.0, 176.0, 123.0, 82.0, 73.0, 50.0, 33.0, 23.0, 19.0, 11.0, 13.0, 4.0, 3.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-71.6875, -69.451171875, -67.21484375, -64.978515625, -62.7421875, -60.505859375, -58.26953125, -56.033203125, -53.796875, -51.560546875, -49.32421875, -47.087890625, -44.8515625, -42.615234375, -40.37890625, -38.142578125, -35.90625, -33.669921875, -31.43359375, -29.197265625, -26.9609375, -24.724609375, -22.48828125, -20.251953125, -18.015625, -15.779296875, -13.54296875, -11.306640625, -9.0703125, -6.833984375, -4.59765625, -2.361328125, -0.125, 2.111328125, 4.34765625, 6.583984375, 8.8203125, 11.056640625, 13.29296875, 15.529296875, 17.765625, 20.001953125, 22.23828125, 24.474609375, 26.7109375, 28.947265625, 31.18359375, 33.419921875, 35.65625, 37.892578125, 40.12890625, 42.365234375, 44.6015625, 46.837890625, 49.07421875, 51.310546875, 53.546875, 55.783203125, 58.01953125, 60.255859375, 62.4921875, 64.728515625, 66.96484375, 69.201171875, 71.4375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 6.0, 3.0, 4.0, 13.0, 12.0, 23.0, 38.0, 62.0, 233.0, 3353.0, 160.0, 76.0, 34.0, 13.0, 12.0, 6.0, 7.0, 6.0, 5.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-47.90625, -46.69140625, -45.4765625, -44.26171875, -43.046875, -41.83203125, -40.6171875, -39.40234375, -38.1875, -36.97265625, -35.7578125, -34.54296875, -33.328125, -32.11328125, -30.8984375, -29.68359375, -28.46875, -27.25390625, -26.0390625, -24.82421875, -23.609375, -22.39453125, -21.1796875, -19.96484375, -18.75, -17.53515625, -16.3203125, -15.10546875, -13.890625, -12.67578125, -11.4609375, -10.24609375, -9.03125, -7.81640625, -6.6015625, -5.38671875, -4.171875, -2.95703125, -1.7421875, -0.52734375, 0.6875, 1.90234375, 3.1171875, 4.33203125, 5.546875, 6.76171875, 7.9765625, 9.19140625, 10.40625, 11.62109375, 12.8359375, 14.05078125, 15.265625, 16.48046875, 17.6953125, 18.91015625, 20.125, 21.33984375, 22.5546875, 23.76953125, 24.984375, 26.19921875, 27.4140625, 28.62890625, 29.84375]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 6.0, 4.0, 7.0, 5.0, 15.0, 23.0, 59.0, 75.0, 151.0, 172.0, 161.0, 128.0, 80.0, 57.0, 25.0, 15.0, 7.0, 6.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-217.40093994140625, -212.0947265625, -206.7885284423828, -201.48233032226562, -196.17611694335938, -190.86990356445312, -185.56370544433594, -180.25750732421875, -174.9512939453125, -169.64508056640625, -164.33888244628906, -159.03268432617188, -153.72647094726562, -148.42025756835938, -143.1140594482422, -137.807861328125, -132.50164794921875, -127.19544219970703, -121.88923645019531, -116.5830307006836, -111.27682495117188, -105.97061920166016, -100.66441345214844, -95.35820770263672, -90.052001953125, -84.74579620361328, -79.43959045410156, -74.13338470458984, -68.82717895507812, -63.520973205566406, -58.21476745605469, -52.90856170654297, -47.60234069824219, -42.29613494873047, -36.98992919921875, -31.68372344970703, -26.377517700195312, -21.071311950683594, -15.765106201171875, -10.458900451660156, -5.1526947021484375, 0.15351104736328125, 5.459716796875, 10.765922546386719, 16.072128295898438, 21.378334045410156, 26.684539794921875, 31.990745544433594, 37.29695129394531, 42.60315704345703, 47.90936279296875, 53.21556854248047, 58.52177429199219, 63.827980041503906, 69.13418579101562, 74.44039154052734, 79.74659729003906, 85.05280303955078, 90.3590087890625, 95.66521453857422, 100.97142028808594, 106.27762603759766, 111.58383178710938, 116.8900375366211, 122.19624328613281]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 4.0, 4.0, 3.0, 9.0, 10.0, 12.0, 9.0, 12.0, 21.0, 16.0, 22.0, 29.0, 29.0, 26.0, 37.0, 31.0, 37.0, 34.0, 50.0, 34.0, 38.0, 49.0, 45.0, 49.0, 43.0, 39.0, 40.0, 32.0, 28.0, 30.0, 23.0, 26.0, 16.0, 13.0, 14.0, 16.0, 15.0, 11.0, 7.0, 10.0, 6.0, 7.0, 5.0, 5.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0], "bins": [-63.826290130615234, -61.83027648925781, -59.83426284790039, -57.83824920654297, -55.84223556518555, -53.846221923828125, -51.85021209716797, -49.85419845581055, -47.858184814453125, -45.8621711730957, -43.86615753173828, -41.87014389038086, -39.87413024902344, -37.87812042236328, -35.882102966308594, -33.88609313964844, -31.890077590942383, -29.89406394958496, -27.89805030822754, -25.90203857421875, -23.906024932861328, -21.910011291503906, -19.913997650146484, -17.917984008789062, -15.921971321105957, -13.925957679748535, -11.92994499206543, -9.933931350708008, -7.937918186187744, -5.9419050216674805, -3.9458913803100586, -1.9498786926269531, 0.04613494873046875, 2.0421481132507324, 4.038161277770996, 6.034174919128418, 8.030187606811523, 10.026201248168945, 12.022214889526367, 14.018227577209473, 16.014240264892578, 18.01025390625, 20.006267547607422, 22.002281188964844, 23.998292922973633, 25.994306564331055, 27.990320205688477, 29.986331939697266, 31.98234748840332, 33.97835922241211, 35.97437286376953, 37.97038650512695, 39.966400146484375, 41.9624137878418, 43.95842742919922, 45.95444107055664, 47.95045471191406, 49.946468353271484, 51.942481994628906, 53.93849563598633, 55.93450927734375, 57.930519104003906, 59.926536560058594, 61.92254638671875, 63.91856002807617]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 4.0, 5.0, 9.0, 11.0, 20.0, 28.0, 35.0, 58.0, 69.0, 121.0, 196.0, 340.0, 607.0, 1179.0, 2495.0, 5885.0, 15655.0, 46812.0, 149228.0, 391602.0, 289958.0, 95393.0, 30287.0, 10575.0, 4164.0, 1752.0, 867.0, 454.0, 249.0, 170.0, 128.0, 75.0, 45.0, 25.0, 18.0, 12.0, 7.0, 3.0, 5.0, 2.0, 8.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-70.8125, -68.7177734375, -66.623046875, -64.5283203125, -62.43359375, -60.3388671875, -58.244140625, -56.1494140625, -54.0546875, -51.9599609375, -49.865234375, -47.7705078125, -45.67578125, -43.5810546875, -41.486328125, -39.3916015625, -37.296875, -35.2021484375, -33.107421875, -31.0126953125, -28.91796875, -26.8232421875, -24.728515625, -22.6337890625, -20.5390625, -18.4443359375, -16.349609375, -14.2548828125, -12.16015625, -10.0654296875, -7.970703125, -5.8759765625, -3.78125, -1.6865234375, 0.408203125, 2.5029296875, 4.59765625, 6.6923828125, 8.787109375, 10.8818359375, 12.9765625, 15.0712890625, 17.166015625, 19.2607421875, 21.35546875, 23.4501953125, 25.544921875, 27.6396484375, 29.734375, 31.8291015625, 33.923828125, 36.0185546875, 38.11328125, 40.2080078125, 42.302734375, 44.3974609375, 46.4921875, 48.5869140625, 50.681640625, 52.7763671875, 54.87109375, 56.9658203125, 59.060546875, 61.1552734375, 63.25]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 4.0, 3.0, 11.0, 6.0, 16.0, 11.0, 16.0, 23.0, 25.0, 26.0, 33.0, 61.0, 42.0, 48.0, 46.0, 56.0, 66.0, 56.0, 58.0, 62.0, 43.0, 42.0, 50.0, 34.0, 25.0, 27.0, 22.0, 19.0, 15.0, 9.0, 13.0, 8.0, 4.0, 7.0, 6.0, 2.0, 3.0, 0.0, 2.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.921875, -18.205810546875, -17.48974609375, -16.773681640625, -16.0576171875, -15.341552734375, -14.62548828125, -13.909423828125, -13.193359375, -12.477294921875, -11.76123046875, -11.045166015625, -10.3291015625, -9.613037109375, -8.89697265625, -8.180908203125, -7.46484375, -6.748779296875, -6.03271484375, -5.316650390625, -4.6005859375, -3.884521484375, -3.16845703125, -2.452392578125, -1.736328125, -1.020263671875, -0.30419921875, 0.411865234375, 1.1279296875, 1.843994140625, 2.56005859375, 3.276123046875, 3.9921875, 4.708251953125, 5.42431640625, 6.140380859375, 6.8564453125, 7.572509765625, 8.28857421875, 9.004638671875, 9.720703125, 10.436767578125, 11.15283203125, 11.868896484375, 12.5849609375, 13.301025390625, 14.01708984375, 14.733154296875, 15.44921875, 16.165283203125, 16.88134765625, 17.597412109375, 18.3134765625, 19.029541015625, 19.74560546875, 20.461669921875, 21.177734375, 21.893798828125, 22.60986328125, 23.325927734375, 24.0419921875, 24.758056640625, 25.47412109375, 26.190185546875, 26.90625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 6.0, 5.0, 5.0, 11.0, 6.0, 12.0, 22.0, 23.0, 39.0, 74.0, 88.0, 187.0, 243.0, 422.0, 783.0, 1483.0, 4084.0, 17238.0, 151091.0, 730729.0, 120401.0, 14614.0, 3710.0, 1501.0, 705.0, 385.0, 234.0, 156.0, 103.0, 64.0, 32.0, 30.0, 20.0, 12.0, 8.0, 8.0, 5.0, 5.0, 1.0, 1.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-119.375, -115.806640625, -112.23828125, -108.669921875, -105.1015625, -101.533203125, -97.96484375, -94.396484375, -90.828125, -87.259765625, -83.69140625, -80.123046875, -76.5546875, -72.986328125, -69.41796875, -65.849609375, -62.28125, -58.712890625, -55.14453125, -51.576171875, -48.0078125, -44.439453125, -40.87109375, -37.302734375, -33.734375, -30.166015625, -26.59765625, -23.029296875, -19.4609375, -15.892578125, -12.32421875, -8.755859375, -5.1875, -1.619140625, 1.94921875, 5.517578125, 9.0859375, 12.654296875, 16.22265625, 19.791015625, 23.359375, 26.927734375, 30.49609375, 34.064453125, 37.6328125, 41.201171875, 44.76953125, 48.337890625, 51.90625, 55.474609375, 59.04296875, 62.611328125, 66.1796875, 69.748046875, 73.31640625, 76.884765625, 80.453125, 84.021484375, 87.58984375, 91.158203125, 94.7265625, 98.294921875, 101.86328125, 105.431640625, 109.0]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 9.0, 5.0, 6.0, 14.0, 21.0, 18.0, 23.0, 18.0, 33.0, 41.0, 41.0, 56.0, 54.0, 46.0, 51.0, 47.0, 71.0, 51.0, 56.0, 42.0, 46.0, 41.0, 47.0, 22.0, 26.0, 23.0, 31.0, 15.0, 7.0, 10.0, 9.0, 5.0, 8.0, 1.0, 3.0, 5.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-88.4375, -85.4072265625, -82.376953125, -79.3466796875, -76.31640625, -73.2861328125, -70.255859375, -67.2255859375, -64.1953125, -61.1650390625, -58.134765625, -55.1044921875, -52.07421875, -49.0439453125, -46.013671875, -42.9833984375, -39.953125, -36.9228515625, -33.892578125, -30.8623046875, -27.83203125, -24.8017578125, -21.771484375, -18.7412109375, -15.7109375, -12.6806640625, -9.650390625, -6.6201171875, -3.58984375, -0.5595703125, 2.470703125, 5.5009765625, 8.53125, 11.5615234375, 14.591796875, 17.6220703125, 20.65234375, 23.6826171875, 26.712890625, 29.7431640625, 32.7734375, 35.8037109375, 38.833984375, 41.8642578125, 44.89453125, 47.9248046875, 50.955078125, 53.9853515625, 57.015625, 60.0458984375, 63.076171875, 66.1064453125, 69.13671875, 72.1669921875, 75.197265625, 78.2275390625, 81.2578125, 84.2880859375, 87.318359375, 90.3486328125, 93.37890625, 96.4091796875, 99.439453125, 102.4697265625, 105.5]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 3.0, 4.0, 4.0, 3.0, 9.0, 13.0, 12.0, 14.0, 26.0, 21.0, 36.0, 42.0, 62.0, 109.0, 140.0, 287.0, 508.0, 993.0, 2525.0, 8341.0, 49811.0, 693336.0, 261697.0, 22065.0, 4852.0, 1755.0, 770.0, 411.0, 211.0, 139.0, 91.0, 74.0, 51.0, 28.0, 24.0, 27.0, 14.0, 10.0, 13.0, 7.0, 7.0, 5.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-45.65625, -44.220703125, -42.78515625, -41.349609375, -39.9140625, -38.478515625, -37.04296875, -35.607421875, -34.171875, -32.736328125, -31.30078125, -29.865234375, -28.4296875, -26.994140625, -25.55859375, -24.123046875, -22.6875, -21.251953125, -19.81640625, -18.380859375, -16.9453125, -15.509765625, -14.07421875, -12.638671875, -11.203125, -9.767578125, -8.33203125, -6.896484375, -5.4609375, -4.025390625, -2.58984375, -1.154296875, 0.28125, 1.716796875, 3.15234375, 4.587890625, 6.0234375, 7.458984375, 8.89453125, 10.330078125, 11.765625, 13.201171875, 14.63671875, 16.072265625, 17.5078125, 18.943359375, 20.37890625, 21.814453125, 23.25, 24.685546875, 26.12109375, 27.556640625, 28.9921875, 30.427734375, 31.86328125, 33.298828125, 34.734375, 36.169921875, 37.60546875, 39.041015625, 40.4765625, 41.912109375, 43.34765625, 44.783203125, 46.21875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 2.0, 4.0, 1.0, 2.0, 6.0, 2.0, 17.0, 16.0, 9.0, 14.0, 24.0, 40.0, 54.0, 53.0, 75.0, 70.0, 106.0, 111.0, 86.0, 69.0, 55.0, 36.0, 32.0, 24.0, 19.0, 13.0, 11.0, 13.0, 8.0, 7.0, 5.0, 2.0, 5.0, 5.0, 6.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005535125732421875, -0.005357980728149414, -0.005180835723876953, -0.005003690719604492, -0.004826545715332031, -0.00464940071105957, -0.004472255706787109, -0.0042951107025146484, -0.0041179656982421875, -0.0039408206939697266, -0.0037636756896972656, -0.0035865306854248047, -0.0034093856811523438, -0.003232240676879883, -0.003055095672607422, -0.002877950668334961, -0.0027008056640625, -0.002523660659790039, -0.002346515655517578, -0.002169370651245117, -0.0019922256469726562, -0.0018150806427001953, -0.0016379356384277344, -0.0014607906341552734, -0.0012836456298828125, -0.0011065006256103516, -0.0009293556213378906, -0.0007522106170654297, -0.0005750656127929688, -0.0003979206085205078, -0.00022077560424804688, -4.363059997558594e-05, 0.000133514404296875, 0.00031065940856933594, 0.0004878044128417969, 0.0006649494171142578, 0.0008420944213867188, 0.0010192394256591797, 0.0011963844299316406, 0.0013735294342041016, 0.0015506744384765625, 0.0017278194427490234, 0.0019049644470214844, 0.0020821094512939453, 0.0022592544555664062, 0.002436399459838867, 0.002613544464111328, 0.002790689468383789, 0.00296783447265625, 0.003144979476928711, 0.003322124481201172, 0.003499269485473633, 0.0036764144897460938, 0.0038535594940185547, 0.004030704498291016, 0.0042078495025634766, 0.0043849945068359375, 0.0045621395111083984, 0.004739284515380859, 0.00491642951965332, 0.005093574523925781, 0.005270719528198242, 0.005447864532470703, 0.005625009536743164, 0.005802154541015625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 2.0, 9.0, 4.0, 5.0, 8.0, 9.0, 18.0, 39.0, 34.0, 42.0, 80.0, 97.0, 144.0, 242.0, 398.0, 711.0, 1594.0, 4307.0, 15714.0, 124204.0, 782295.0, 97723.0, 13657.0, 3969.0, 1507.0, 680.0, 371.0, 208.0, 129.0, 105.0, 57.0, 47.0, 26.0, 35.0, 25.0, 16.0, 7.0, 12.0, 10.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 4.0, 0.0, 2.0, 1.0], "bins": [-52.59375, -51.1103515625, -49.626953125, -48.1435546875, -46.66015625, -45.1767578125, -43.693359375, -42.2099609375, -40.7265625, -39.2431640625, -37.759765625, -36.2763671875, -34.79296875, -33.3095703125, -31.826171875, -30.3427734375, -28.859375, -27.3759765625, -25.892578125, -24.4091796875, -22.92578125, -21.4423828125, -19.958984375, -18.4755859375, -16.9921875, -15.5087890625, -14.025390625, -12.5419921875, -11.05859375, -9.5751953125, -8.091796875, -6.6083984375, -5.125, -3.6416015625, -2.158203125, -0.6748046875, 0.80859375, 2.2919921875, 3.775390625, 5.2587890625, 6.7421875, 8.2255859375, 9.708984375, 11.1923828125, 12.67578125, 14.1591796875, 15.642578125, 17.1259765625, 18.609375, 20.0927734375, 21.576171875, 23.0595703125, 24.54296875, 26.0263671875, 27.509765625, 28.9931640625, 30.4765625, 31.9599609375, 33.443359375, 34.9267578125, 36.41015625, 37.8935546875, 39.376953125, 40.8603515625, 42.34375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 5.0, 1.0, 7.0, 7.0, 10.0, 6.0, 18.0, 25.0, 22.0, 54.0, 75.0, 98.0, 142.0, 134.0, 127.0, 82.0, 62.0, 32.0, 26.0, 14.0, 13.0, 7.0, 8.0, 6.0, 5.0, 4.0, 3.0, 0.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.40625, -41.80712890625, -40.2080078125, -38.60888671875, -37.009765625, -35.41064453125, -33.8115234375, -32.21240234375, -30.61328125, -29.01416015625, -27.4150390625, -25.81591796875, -24.216796875, -22.61767578125, -21.0185546875, -19.41943359375, -17.8203125, -16.22119140625, -14.6220703125, -13.02294921875, -11.423828125, -9.82470703125, -8.2255859375, -6.62646484375, -5.02734375, -3.42822265625, -1.8291015625, -0.22998046875, 1.369140625, 2.96826171875, 4.5673828125, 6.16650390625, 7.765625, 9.36474609375, 10.9638671875, 12.56298828125, 14.162109375, 15.76123046875, 17.3603515625, 18.95947265625, 20.55859375, 22.15771484375, 23.7568359375, 25.35595703125, 26.955078125, 28.55419921875, 30.1533203125, 31.75244140625, 33.3515625, 34.95068359375, 36.5498046875, 38.14892578125, 39.748046875, 41.34716796875, 42.9462890625, 44.54541015625, 46.14453125, 47.74365234375, 49.3427734375, 50.94189453125, 52.541015625, 54.14013671875, 55.7392578125, 57.33837890625, 58.9375]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 5.0, 16.0, 46.0, 95.0, 136.0, 230.0, 215.0, 137.0, 60.0, 23.0, 18.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-635.205322265625, -603.095703125, -570.986083984375, -538.87646484375, -506.7668762207031, -474.6572570800781, -442.54766845703125, -410.43804931640625, -378.32843017578125, -346.21881103515625, -314.10919189453125, -281.9996032714844, -249.88998413085938, -217.78036499023438, -185.67076110839844, -153.5611572265625, -121.4515380859375, -89.34192657470703, -57.23231506347656, -25.122703552246094, 6.986907958984375, 39.096527099609375, 71.20613098144531, 103.31573486328125, 135.42535400390625, 167.53497314453125, 199.6445770263672, 231.75418090820312, 263.8638000488281, 295.9734191894531, 328.0830078125, 360.192626953125, 392.3023681640625, 424.4119873046875, 456.5216064453125, 488.6311950683594, 520.7408447265625, 552.8504638671875, 584.9600219726562, 617.0696411132812, 649.1792602539062, 681.2888793945312, 713.3984985351562, 745.5081176757812, 777.61767578125, 809.727294921875, 841.8369140625, 873.946533203125, 906.05615234375, 938.165771484375, 970.275390625, 1002.385009765625, 1034.49462890625, 1066.604248046875, 1098.7138671875, 1130.823486328125, 1162.93310546875, 1195.042724609375, 1227.15234375, 1259.261962890625, 1291.37158203125, 1323.481201171875, 1355.5908203125, 1387.700439453125, 1419.8099365234375]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 6.0, 3.0, 8.0, 6.0, 8.0, 16.0, 16.0, 13.0, 18.0, 16.0, 24.0, 30.0, 29.0, 42.0, 50.0, 44.0, 56.0, 60.0, 62.0, 47.0, 57.0, 57.0, 42.0, 42.0, 35.0, 40.0, 41.0, 26.0, 24.0, 16.0, 19.0, 9.0, 14.0, 8.0, 8.0, 1.0, 8.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-464.69232177734375, -450.9377136230469, -437.1830749511719, -423.428466796875, -409.673828125, -395.9192199707031, -382.16461181640625, -368.40997314453125, -354.6553649902344, -340.9007568359375, -327.1461181640625, -313.3915100097656, -299.6368713378906, -285.88226318359375, -272.12762451171875, -258.3730163574219, -244.61839294433594, -230.86376953125, -217.10914611816406, -203.35452270507812, -189.59991455078125, -175.8452911376953, -162.09066772460938, -148.3360595703125, -134.5814208984375, -120.82679748535156, -107.07218170166016, -93.31755828857422, -79.56294250488281, -65.80831909179688, -52.05369567871094, -38.29907989501953, -24.544464111328125, -10.789843559265137, 2.9647769927978516, 16.719398498535156, 30.474018096923828, 44.2286376953125, 57.98326110839844, 71.73787689208984, 85.49250030517578, 99.24712371826172, 113.00173950195312, 126.75636291503906, 140.510986328125, 154.26559448242188, 168.02023315429688, 181.77484130859375, 195.5294647216797, 209.28408813476562, 223.03871154785156, 236.7933349609375, 250.54794311523438, 264.30255126953125, 278.05718994140625, 291.8117980957031, 305.5664367675781, 319.321044921875, 333.07568359375, 346.8302917480469, 360.5849304199219, 374.33953857421875, 388.09417724609375, 401.8487854003906, 415.6033935546875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 6.0, 2.0, 7.0, 5.0, 11.0, 21.0, 25.0, 38.0, 58.0, 80.0, 118.0, 225.0, 443.0, 965.0, 2295.0, 5939.0, 18274.0, 71135.0, 849220.0, 3071013.0, 131416.0, 28367.0, 8798.0, 3102.0, 1363.0, 603.0, 311.0, 167.0, 103.0, 54.0, 33.0, 21.0, 20.0, 17.0, 10.0, 6.0, 7.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.40625, -50.54638671875, -48.6865234375, -46.82666015625, -44.966796875, -43.10693359375, -41.2470703125, -39.38720703125, -37.52734375, -35.66748046875, -33.8076171875, -31.94775390625, -30.087890625, -28.22802734375, -26.3681640625, -24.50830078125, -22.6484375, -20.78857421875, -18.9287109375, -17.06884765625, -15.208984375, -13.34912109375, -11.4892578125, -9.62939453125, -7.76953125, -5.90966796875, -4.0498046875, -2.18994140625, -0.330078125, 1.52978515625, 3.3896484375, 5.24951171875, 7.109375, 8.96923828125, 10.8291015625, 12.68896484375, 14.548828125, 16.40869140625, 18.2685546875, 20.12841796875, 21.98828125, 23.84814453125, 25.7080078125, 27.56787109375, 29.427734375, 31.28759765625, 33.1474609375, 35.00732421875, 36.8671875, 38.72705078125, 40.5869140625, 42.44677734375, 44.306640625, 46.16650390625, 48.0263671875, 49.88623046875, 51.74609375, 53.60595703125, 55.4658203125, 57.32568359375, 59.185546875, 61.04541015625, 62.9052734375, 64.76513671875, 66.625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 4.0, 7.0, 5.0, 7.0, 8.0, 5.0, 13.0, 16.0, 18.0, 21.0, 29.0, 34.0, 36.0, 35.0, 45.0, 56.0, 50.0, 55.0, 43.0, 54.0, 64.0, 52.0, 50.0, 52.0, 43.0, 35.0, 32.0, 22.0, 22.0, 14.0, 11.0, 13.0, 13.0, 11.0, 7.0, 5.0, 6.0, 3.0, 4.0, 4.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.578125, -19.95703125, -19.3359375, -18.71484375, -18.09375, -17.47265625, -16.8515625, -16.23046875, -15.609375, -14.98828125, -14.3671875, -13.74609375, -13.125, -12.50390625, -11.8828125, -11.26171875, -10.640625, -10.01953125, -9.3984375, -8.77734375, -8.15625, -7.53515625, -6.9140625, -6.29296875, -5.671875, -5.05078125, -4.4296875, -3.80859375, -3.1875, -2.56640625, -1.9453125, -1.32421875, -0.703125, -0.08203125, 0.5390625, 1.16015625, 1.78125, 2.40234375, 3.0234375, 3.64453125, 4.265625, 4.88671875, 5.5078125, 6.12890625, 6.75, 7.37109375, 7.9921875, 8.61328125, 9.234375, 9.85546875, 10.4765625, 11.09765625, 11.71875, 12.33984375, 12.9609375, 13.58203125, 14.203125, 14.82421875, 15.4453125, 16.06640625, 16.6875, 17.30859375, 17.9296875, 18.55078125, 19.171875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 7.0, 3.0, 9.0, 10.0, 29.0, 31.0, 59.0, 96.0, 133.0, 303.0, 762.0, 2128.0, 7103.0, 30157.0, 235541.0, 3682107.0, 198499.0, 27616.0, 6396.0, 1958.0, 688.0, 304.0, 124.0, 79.0, 32.0, 30.0, 22.0, 18.0, 7.0, 7.0, 5.0, 6.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-97.75, -95.2734375, -92.796875, -90.3203125, -87.84375, -85.3671875, -82.890625, -80.4140625, -77.9375, -75.4609375, -72.984375, -70.5078125, -68.03125, -65.5546875, -63.078125, -60.6015625, -58.125, -55.6484375, -53.171875, -50.6953125, -48.21875, -45.7421875, -43.265625, -40.7890625, -38.3125, -35.8359375, -33.359375, -30.8828125, -28.40625, -25.9296875, -23.453125, -20.9765625, -18.5, -16.0234375, -13.546875, -11.0703125, -8.59375, -6.1171875, -3.640625, -1.1640625, 1.3125, 3.7890625, 6.265625, 8.7421875, 11.21875, 13.6953125, 16.171875, 18.6484375, 21.125, 23.6015625, 26.078125, 28.5546875, 31.03125, 33.5078125, 35.984375, 38.4609375, 40.9375, 43.4140625, 45.890625, 48.3671875, 50.84375, 53.3203125, 55.796875, 58.2734375, 60.75]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 9.0, 5.0, 11.0, 6.0, 12.0, 18.0, 23.0, 37.0, 40.0, 67.0, 98.0, 174.0, 392.0, 934.0, 1173.0, 518.0, 206.0, 104.0, 65.0, 55.0, 40.0, 26.0, 21.0, 12.0, 10.0, 5.0, 5.0, 3.0, 2.0, 6.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.625, -61.515625, -59.40625, -57.296875, -55.1875, -53.078125, -50.96875, -48.859375, -46.75, -44.640625, -42.53125, -40.421875, -38.3125, -36.203125, -34.09375, -31.984375, -29.875, -27.765625, -25.65625, -23.546875, -21.4375, -19.328125, -17.21875, -15.109375, -13.0, -10.890625, -8.78125, -6.671875, -4.5625, -2.453125, -0.34375, 1.765625, 3.875, 5.984375, 8.09375, 10.203125, 12.3125, 14.421875, 16.53125, 18.640625, 20.75, 22.859375, 24.96875, 27.078125, 29.1875, 31.296875, 33.40625, 35.515625, 37.625, 39.734375, 41.84375, 43.953125, 46.0625, 48.171875, 50.28125, 52.390625, 54.5, 56.609375, 58.71875, 60.828125, 62.9375, 65.046875, 67.15625, 69.265625, 71.375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 6.0, 5.0, 5.0, 23.0, 34.0, 59.0, 136.0, 211.0, 215.0, 148.0, 80.0, 36.0, 15.0, 7.0, 8.0, 6.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-595.4869384765625, -572.8504028320312, -550.2138061523438, -527.5772705078125, -504.94073486328125, -482.3041687011719, -459.6676025390625, -437.03106689453125, -414.3945007324219, -391.7579345703125, -369.12139892578125, -346.4848327636719, -323.8482666015625, -301.21173095703125, -278.5751647949219, -255.93861389160156, -233.30206298828125, -210.66551208496094, -188.02896118164062, -165.39239501953125, -142.75584411621094, -120.11929321289062, -97.48272705078125, -74.84617614746094, -52.209625244140625, -29.573070526123047, -6.936515808105469, 15.700042724609375, 38.33659362792969, 60.97314453125, 83.60971069335938, 106.24626159667969, 128.8828125, 151.5193634033203, 174.15591430664062, 196.79248046875, 219.4290313720703, 242.06558227539062, 264.7021484375, 287.33868408203125, 309.9752502441406, 332.61181640625, 355.24835205078125, 377.8849182128906, 400.521484375, 423.15802001953125, 445.7945861816406, 468.43115234375, 491.06768798828125, 513.7042236328125, 536.3408203125, 558.9773559570312, 581.6138916015625, 604.25048828125, 626.8870239257812, 649.5235595703125, 672.16015625, 694.7966918945312, 717.4332885742188, 740.06982421875, 762.7063598632812, 785.3428955078125, 807.9794921875, 830.6160278320312, 853.2525634765625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 6.0, 5.0, 5.0, 6.0, 2.0, 3.0, 9.0, 8.0, 13.0, 10.0, 13.0, 23.0, 36.0, 26.0, 37.0, 30.0, 38.0, 38.0, 42.0, 41.0, 44.0, 47.0, 43.0, 55.0, 59.0, 39.0, 34.0, 43.0, 27.0, 27.0, 30.0, 27.0, 26.0, 17.0, 24.0, 19.0, 14.0, 6.0, 8.0, 3.0, 9.0, 7.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-241.61831665039062, -234.143798828125, -226.66928100585938, -219.1947479248047, -211.72023010253906, -204.24571228027344, -196.77117919921875, -189.29666137695312, -181.8221435546875, -174.34762573242188, -166.87310791015625, -159.39857482910156, -151.92405700683594, -144.4495391845703, -136.97500610351562, -129.50048828125, -122.02597045898438, -114.55145263671875, -107.0769271850586, -99.60240173339844, -92.12788391113281, -84.65336608886719, -77.17884063720703, -69.70431518554688, -62.22979736328125, -54.75527572631836, -47.28075408935547, -39.80623245239258, -32.33171081542969, -24.857189178466797, -17.382667541503906, -9.908145904541016, -2.433624267578125, 5.040897369384766, 12.515419006347656, 19.989940643310547, 27.464462280273438, 34.93898391723633, 42.41350555419922, 49.88802719116211, 57.362548828125, 64.83706665039062, 72.31159210205078, 79.78611755371094, 87.26063537597656, 94.73515319824219, 102.20967864990234, 109.6842041015625, 117.15872192382812, 124.63323974609375, 132.10775756835938, 139.58229064941406, 147.0568084716797, 154.5313262939453, 162.005859375, 169.48037719726562, 176.95489501953125, 184.42941284179688, 191.9039306640625, 199.3784637451172, 206.8529815673828, 214.32749938964844, 221.80203247070312, 229.27655029296875, 236.75106811523438]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 6.0, 7.0, 14.0, 9.0, 13.0, 26.0, 37.0, 67.0, 105.0, 145.0, 252.0, 528.0, 1242.0, 3326.0, 10165.0, 37341.0, 159266.0, 515420.0, 242928.0, 55747.0, 14480.0, 4358.0, 1576.0, 677.0, 289.0, 205.0, 113.0, 68.0, 37.0, 30.0, 21.0, 14.0, 7.0, 11.0, 6.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-87.3125, -84.7919921875, -82.271484375, -79.7509765625, -77.23046875, -74.7099609375, -72.189453125, -69.6689453125, -67.1484375, -64.6279296875, -62.107421875, -59.5869140625, -57.06640625, -54.5458984375, -52.025390625, -49.5048828125, -46.984375, -44.4638671875, -41.943359375, -39.4228515625, -36.90234375, -34.3818359375, -31.861328125, -29.3408203125, -26.8203125, -24.2998046875, -21.779296875, -19.2587890625, -16.73828125, -14.2177734375, -11.697265625, -9.1767578125, -6.65625, -4.1357421875, -1.615234375, 0.9052734375, 3.42578125, 5.9462890625, 8.466796875, 10.9873046875, 13.5078125, 16.0283203125, 18.548828125, 21.0693359375, 23.58984375, 26.1103515625, 28.630859375, 31.1513671875, 33.671875, 36.1923828125, 38.712890625, 41.2333984375, 43.75390625, 46.2744140625, 48.794921875, 51.3154296875, 53.8359375, 56.3564453125, 58.876953125, 61.3974609375, 63.91796875, 66.4384765625, 68.958984375, 71.4794921875, 74.0]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 1.0, 6.0, 5.0, 6.0, 12.0, 9.0, 9.0, 12.0, 22.0, 21.0, 24.0, 21.0, 44.0, 32.0, 46.0, 44.0, 52.0, 48.0, 48.0, 52.0, 44.0, 62.0, 48.0, 41.0, 40.0, 44.0, 44.0, 37.0, 21.0, 21.0, 18.0, 9.0, 12.0, 11.0, 6.0, 7.0, 6.0, 8.0, 7.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.53125, -19.88623046875, -19.2412109375, -18.59619140625, -17.951171875, -17.30615234375, -16.6611328125, -16.01611328125, -15.37109375, -14.72607421875, -14.0810546875, -13.43603515625, -12.791015625, -12.14599609375, -11.5009765625, -10.85595703125, -10.2109375, -9.56591796875, -8.9208984375, -8.27587890625, -7.630859375, -6.98583984375, -6.3408203125, -5.69580078125, -5.05078125, -4.40576171875, -3.7607421875, -3.11572265625, -2.470703125, -1.82568359375, -1.1806640625, -0.53564453125, 0.109375, 0.75439453125, 1.3994140625, 2.04443359375, 2.689453125, 3.33447265625, 3.9794921875, 4.62451171875, 5.26953125, 5.91455078125, 6.5595703125, 7.20458984375, 7.849609375, 8.49462890625, 9.1396484375, 9.78466796875, 10.4296875, 11.07470703125, 11.7197265625, 12.36474609375, 13.009765625, 13.65478515625, 14.2998046875, 14.94482421875, 15.58984375, 16.23486328125, 16.8798828125, 17.52490234375, 18.169921875, 18.81494140625, 19.4599609375, 20.10498046875, 20.75]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 6.0, 6.0, 4.0, 14.0, 15.0, 12.0, 21.0, 30.0, 46.0, 77.0, 137.0, 185.0, 325.0, 645.0, 1346.0, 3486.0, 14443.0, 155117.0, 796631.0, 62618.0, 8664.0, 2379.0, 1062.0, 515.0, 293.0, 172.0, 115.0, 59.0, 51.0, 28.0, 21.0, 12.0, 6.0, 6.0, 3.0, 4.0, 4.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-142.375, -137.83203125, -133.2890625, -128.74609375, -124.203125, -119.66015625, -115.1171875, -110.57421875, -106.03125, -101.48828125, -96.9453125, -92.40234375, -87.859375, -83.31640625, -78.7734375, -74.23046875, -69.6875, -65.14453125, -60.6015625, -56.05859375, -51.515625, -46.97265625, -42.4296875, -37.88671875, -33.34375, -28.80078125, -24.2578125, -19.71484375, -15.171875, -10.62890625, -6.0859375, -1.54296875, 3.0, 7.54296875, 12.0859375, 16.62890625, 21.171875, 25.71484375, 30.2578125, 34.80078125, 39.34375, 43.88671875, 48.4296875, 52.97265625, 57.515625, 62.05859375, 66.6015625, 71.14453125, 75.6875, 80.23046875, 84.7734375, 89.31640625, 93.859375, 98.40234375, 102.9453125, 107.48828125, 112.03125, 116.57421875, 121.1171875, 125.66015625, 130.203125, 134.74609375, 139.2890625, 143.83203125, 148.375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 2.0, 3.0, 5.0, 2.0, 5.0, 4.0, 3.0, 4.0, 3.0, 11.0, 17.0, 16.0, 13.0, 23.0, 26.0, 43.0, 36.0, 44.0, 44.0, 52.0, 70.0, 49.0, 62.0, 57.0, 51.0, 59.0, 47.0, 42.0, 38.0, 32.0, 33.0, 16.0, 19.0, 16.0, 18.0, 14.0, 4.0, 7.0, 2.0, 3.0, 6.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-88.5, -85.2255859375, -81.951171875, -78.6767578125, -75.40234375, -72.1279296875, -68.853515625, -65.5791015625, -62.3046875, -59.0302734375, -55.755859375, -52.4814453125, -49.20703125, -45.9326171875, -42.658203125, -39.3837890625, -36.109375, -32.8349609375, -29.560546875, -26.2861328125, -23.01171875, -19.7373046875, -16.462890625, -13.1884765625, -9.9140625, -6.6396484375, -3.365234375, -0.0908203125, 3.18359375, 6.4580078125, 9.732421875, 13.0068359375, 16.28125, 19.5556640625, 22.830078125, 26.1044921875, 29.37890625, 32.6533203125, 35.927734375, 39.2021484375, 42.4765625, 45.7509765625, 49.025390625, 52.2998046875, 55.57421875, 58.8486328125, 62.123046875, 65.3974609375, 68.671875, 71.9462890625, 75.220703125, 78.4951171875, 81.76953125, 85.0439453125, 88.318359375, 91.5927734375, 94.8671875, 98.1416015625, 101.416015625, 104.6904296875, 107.96484375, 111.2392578125, 114.513671875, 117.7880859375, 121.0625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 2.0, 1.0, 4.0, 1.0, 7.0, 10.0, 9.0, 14.0, 21.0, 27.0, 34.0, 73.0, 68.0, 145.0, 246.0, 458.0, 972.0, 2776.0, 11089.0, 100926.0, 846185.0, 72069.0, 9140.0, 2346.0, 893.0, 408.0, 225.0, 136.0, 76.0, 56.0, 32.0, 22.0, 17.0, 13.0, 20.0, 10.0, 3.0, 6.0, 5.0, 4.0, 3.0, 0.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.65625, -50.9814453125, -49.306640625, -47.6318359375, -45.95703125, -44.2822265625, -42.607421875, -40.9326171875, -39.2578125, -37.5830078125, -35.908203125, -34.2333984375, -32.55859375, -30.8837890625, -29.208984375, -27.5341796875, -25.859375, -24.1845703125, -22.509765625, -20.8349609375, -19.16015625, -17.4853515625, -15.810546875, -14.1357421875, -12.4609375, -10.7861328125, -9.111328125, -7.4365234375, -5.76171875, -4.0869140625, -2.412109375, -0.7373046875, 0.9375, 2.6123046875, 4.287109375, 5.9619140625, 7.63671875, 9.3115234375, 10.986328125, 12.6611328125, 14.3359375, 16.0107421875, 17.685546875, 19.3603515625, 21.03515625, 22.7099609375, 24.384765625, 26.0595703125, 27.734375, 29.4091796875, 31.083984375, 32.7587890625, 34.43359375, 36.1083984375, 37.783203125, 39.4580078125, 41.1328125, 42.8076171875, 44.482421875, 46.1572265625, 47.83203125, 49.5068359375, 51.181640625, 52.8564453125, 54.53125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 8.0, 7.0, 5.0, 13.0, 17.0, 22.0, 39.0, 54.0, 99.0, 167.0, 204.0, 160.0, 87.0, 38.0, 29.0, 18.0, 16.0, 8.0, 6.0, 3.0, 5.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01345062255859375, -0.013058662414550781, -0.012666702270507812, -0.012274742126464844, -0.011882781982421875, -0.011490821838378906, -0.011098861694335938, -0.010706901550292969, -0.01031494140625, -0.009922981262207031, -0.009531021118164062, -0.009139060974121094, -0.008747100830078125, -0.008355140686035156, -0.007963180541992188, -0.007571220397949219, -0.00717926025390625, -0.006787300109863281, -0.0063953399658203125, -0.006003379821777344, -0.005611419677734375, -0.005219459533691406, -0.0048274993896484375, -0.004435539245605469, -0.0040435791015625, -0.0036516189575195312, -0.0032596588134765625, -0.0028676986694335938, -0.002475738525390625, -0.0020837783813476562, -0.0016918182373046875, -0.0012998580932617188, -0.00090789794921875, -0.0005159378051757812, -0.0001239776611328125, 0.00026798248291015625, 0.000659942626953125, 0.0010519027709960938, 0.0014438629150390625, 0.0018358230590820312, 0.002227783203125, 0.0026197433471679688, 0.0030117034912109375, 0.0034036636352539062, 0.003795623779296875, 0.004187583923339844, 0.0045795440673828125, 0.004971504211425781, 0.00536346435546875, 0.005755424499511719, 0.0061473846435546875, 0.006539344787597656, 0.006931304931640625, 0.007323265075683594, 0.0077152252197265625, 0.008107185363769531, 0.0084991455078125, 0.008891105651855469, 0.009283065795898438, 0.009675025939941406, 0.010066986083984375, 0.010458946228027344, 0.010850906372070312, 0.011242866516113281, 0.01163482666015625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 4.0, 5.0, 4.0, 8.0, 14.0, 14.0, 21.0, 32.0, 34.0, 66.0, 103.0, 171.0, 304.0, 623.0, 1541.0, 4856.0, 25991.0, 611010.0, 376625.0, 20390.0, 4115.0, 1361.0, 574.0, 275.0, 128.0, 77.0, 65.0, 48.0, 30.0, 15.0, 12.0, 9.0, 10.0, 8.0, 2.0, 6.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.15625, -47.39697265625, -45.6376953125, -43.87841796875, -42.119140625, -40.35986328125, -38.6005859375, -36.84130859375, -35.08203125, -33.32275390625, -31.5634765625, -29.80419921875, -28.044921875, -26.28564453125, -24.5263671875, -22.76708984375, -21.0078125, -19.24853515625, -17.4892578125, -15.72998046875, -13.970703125, -12.21142578125, -10.4521484375, -8.69287109375, -6.93359375, -5.17431640625, -3.4150390625, -1.65576171875, 0.103515625, 1.86279296875, 3.6220703125, 5.38134765625, 7.140625, 8.89990234375, 10.6591796875, 12.41845703125, 14.177734375, 15.93701171875, 17.6962890625, 19.45556640625, 21.21484375, 22.97412109375, 24.7333984375, 26.49267578125, 28.251953125, 30.01123046875, 31.7705078125, 33.52978515625, 35.2890625, 37.04833984375, 38.8076171875, 40.56689453125, 42.326171875, 44.08544921875, 45.8447265625, 47.60400390625, 49.36328125, 51.12255859375, 52.8818359375, 54.64111328125, 56.400390625, 58.15966796875, 59.9189453125, 61.67822265625, 63.4375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 4.0, 5.0, 5.0, 12.0, 13.0, 12.0, 13.0, 30.0, 26.0, 51.0, 75.0, 70.0, 101.0, 123.0, 116.0, 72.0, 76.0, 59.0, 34.0, 26.0, 18.0, 13.0, 7.0, 8.0, 6.0, 6.0, 8.0, 1.0, 3.0, 3.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.0625, -37.79296875, -36.5234375, -35.25390625, -33.984375, -32.71484375, -31.4453125, -30.17578125, -28.90625, -27.63671875, -26.3671875, -25.09765625, -23.828125, -22.55859375, -21.2890625, -20.01953125, -18.75, -17.48046875, -16.2109375, -14.94140625, -13.671875, -12.40234375, -11.1328125, -9.86328125, -8.59375, -7.32421875, -6.0546875, -4.78515625, -3.515625, -2.24609375, -0.9765625, 0.29296875, 1.5625, 2.83203125, 4.1015625, 5.37109375, 6.640625, 7.91015625, 9.1796875, 10.44921875, 11.71875, 12.98828125, 14.2578125, 15.52734375, 16.796875, 18.06640625, 19.3359375, 20.60546875, 21.875, 23.14453125, 24.4140625, 25.68359375, 26.953125, 28.22265625, 29.4921875, 30.76171875, 32.03125, 33.30078125, 34.5703125, 35.83984375, 37.109375, 38.37890625, 39.6484375, 40.91796875, 42.1875]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 5.0, 7.0, 8.0, 15.0, 37.0, 70.0, 123.0, 195.0, 212.0, 160.0, 81.0, 40.0, 28.0, 12.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1059.01806640625, -1032.680908203125, -1006.3436279296875, -980.0064086914062, -953.669189453125, -927.33203125, -900.9948120117188, -874.6575927734375, -848.3203735351562, -821.983154296875, -795.6459350585938, -769.3087158203125, -742.9715576171875, -716.63427734375, -690.297119140625, -663.9598999023438, -637.6226806640625, -611.2854614257812, -584.9482421875, -558.6110229492188, -532.2738037109375, -505.9366149902344, -479.59942626953125, -453.26220703125, -426.92498779296875, -400.5877685546875, -374.25054931640625, -347.9133605957031, -321.5761413574219, -295.2389221191406, -268.9017333984375, -242.56451416015625, -216.227294921875, -189.89007568359375, -163.55287170410156, -137.21566772460938, -110.87844848632812, -84.54122924804688, -58.20402526855469, -31.8668212890625, -5.52960205078125, 20.80760955810547, 47.14482116699219, 73.4820327758789, 99.81924438476562, 126.15646362304688, 152.49366760253906, 178.83087158203125, 205.1680908203125, 231.50531005859375, 257.842529296875, 284.1797180175781, 310.5169372558594, 336.8541564941406, 363.19134521484375, 389.528564453125, 415.86578369140625, 442.2030029296875, 468.54022216796875, 494.8774108886719, 521.214599609375, 547.5518798828125, 573.8890380859375, 600.2262573242188, 626.5634765625]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 7.0, 3.0, 12.0, 19.0, 15.0, 20.0, 40.0, 48.0, 58.0, 51.0, 55.0, 74.0, 96.0, 80.0, 74.0, 59.0, 66.0, 52.0, 44.0, 38.0, 19.0, 20.0, 21.0, 10.0, 10.0, 5.0, 3.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-653.1954345703125, -636.46875, -619.7420043945312, -603.0153198242188, -586.28857421875, -569.5618896484375, -552.8351440429688, -536.1084594726562, -519.3817138671875, -502.6549987792969, -485.92828369140625, -469.2015686035156, -452.474853515625, -435.7481689453125, -419.0214538574219, -402.29473876953125, -385.56805419921875, -368.8413391113281, -352.1146240234375, -335.3879089355469, -318.66119384765625, -301.93450927734375, -285.2077941894531, -268.4810791015625, -251.75436401367188, -235.02764892578125, -218.30093383789062, -201.57423400878906, -184.84751892089844, -168.1208038330078, -151.39410400390625, -134.66738891601562, -117.940673828125, -101.21395874023438, -84.48725128173828, -67.76054382324219, -51.03382873535156, -34.30711364746094, -17.580406188964844, -0.85369873046875, 15.873016357421875, 32.599727630615234, 49.326438903808594, 66.05314636230469, 82.77986145019531, 99.50657653808594, 116.23328399658203, 132.95999145507812, 149.68670654296875, 166.41342163085938, 183.14013671875, 199.86683654785156, 216.5935516357422, 233.3202667236328, 250.04696655273438, 266.773681640625, 283.5003967285156, 300.22711181640625, 316.9538269042969, 333.6805419921875, 350.4072265625, 367.13397216796875, 383.86065673828125, 400.5873718261719, 417.3140869140625]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 6.0, 5.0, 16.0, 12.0, 19.0, 24.0, 36.0, 57.0, 97.0, 185.0, 380.0, 902.0, 2639.0, 9081.0, 47235.0, 2144638.0, 1928712.0, 46502.0, 9393.0, 2685.0, 860.0, 348.0, 194.0, 122.0, 51.0, 32.0, 21.0, 12.0, 6.0, 3.0, 2.0, 6.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-90.0, -87.69189453125, -85.3837890625, -83.07568359375, -80.767578125, -78.45947265625, -76.1513671875, -73.84326171875, -71.53515625, -69.22705078125, -66.9189453125, -64.61083984375, -62.302734375, -59.99462890625, -57.6865234375, -55.37841796875, -53.0703125, -50.76220703125, -48.4541015625, -46.14599609375, -43.837890625, -41.52978515625, -39.2216796875, -36.91357421875, -34.60546875, -32.29736328125, -29.9892578125, -27.68115234375, -25.373046875, -23.06494140625, -20.7568359375, -18.44873046875, -16.140625, -13.83251953125, -11.5244140625, -9.21630859375, -6.908203125, -4.60009765625, -2.2919921875, 0.01611328125, 2.32421875, 4.63232421875, 6.9404296875, 9.24853515625, 11.556640625, 13.86474609375, 16.1728515625, 18.48095703125, 20.7890625, 23.09716796875, 25.4052734375, 27.71337890625, 30.021484375, 32.32958984375, 34.6376953125, 36.94580078125, 39.25390625, 41.56201171875, 43.8701171875, 46.17822265625, 48.486328125, 50.79443359375, 53.1025390625, 55.41064453125, 57.71875]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 13.0, 20.0, 22.0, 52.0, 69.0, 105.0, 121.0, 141.0, 124.0, 104.0, 99.0, 45.0, 42.0, 24.0, 15.0, 5.0, 2.0, 3.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.375, -73.76171875, -72.1484375, -70.53515625, -68.921875, -67.30859375, -65.6953125, -64.08203125, -62.46875, -60.85546875, -59.2421875, -57.62890625, -56.015625, -54.40234375, -52.7890625, -51.17578125, -49.5625, -47.94921875, -46.3359375, -44.72265625, -43.109375, -41.49609375, -39.8828125, -38.26953125, -36.65625, -35.04296875, -33.4296875, -31.81640625, -30.203125, -28.58984375, -26.9765625, -25.36328125, -23.75, -22.13671875, -20.5234375, -18.91015625, -17.296875, -15.68359375, -14.0703125, -12.45703125, -10.84375, -9.23046875, -7.6171875, -6.00390625, -4.390625, -2.77734375, -1.1640625, 0.44921875, 2.0625, 3.67578125, 5.2890625, 6.90234375, 8.515625, 10.12890625, 11.7421875, 13.35546875, 14.96875, 16.58203125, 18.1953125, 19.80859375, 21.421875, 23.03515625, 24.6484375, 26.26171875, 27.875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 1.0, 4.0, 6.0, 9.0, 14.0, 12.0, 22.0, 30.0, 53.0, 57.0, 114.0, 201.0, 344.0, 625.0, 1137.0, 2238.0, 4686.0, 10106.0, 24165.0, 71291.0, 425621.0, 3227434.0, 322881.0, 62652.0, 22043.0, 9294.0, 4394.0, 2197.0, 1173.0, 615.0, 336.0, 204.0, 116.0, 73.0, 47.0, 30.0, 19.0, 16.0, 7.0, 6.0, 4.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-47.25, -45.83740234375, -44.4248046875, -43.01220703125, -41.599609375, -40.18701171875, -38.7744140625, -37.36181640625, -35.94921875, -34.53662109375, -33.1240234375, -31.71142578125, -30.298828125, -28.88623046875, -27.4736328125, -26.06103515625, -24.6484375, -23.23583984375, -21.8232421875, -20.41064453125, -18.998046875, -17.58544921875, -16.1728515625, -14.76025390625, -13.34765625, -11.93505859375, -10.5224609375, -9.10986328125, -7.697265625, -6.28466796875, -4.8720703125, -3.45947265625, -2.046875, -0.63427734375, 0.7783203125, 2.19091796875, 3.603515625, 5.01611328125, 6.4287109375, 7.84130859375, 9.25390625, 10.66650390625, 12.0791015625, 13.49169921875, 14.904296875, 16.31689453125, 17.7294921875, 19.14208984375, 20.5546875, 21.96728515625, 23.3798828125, 24.79248046875, 26.205078125, 27.61767578125, 29.0302734375, 30.44287109375, 31.85546875, 33.26806640625, 34.6806640625, 36.09326171875, 37.505859375, 38.91845703125, 40.3310546875, 41.74365234375, 43.15625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 11.0, 12.0, 6.0, 19.0, 21.0, 21.0, 39.0, 48.0, 72.0, 99.0, 221.0, 377.0, 824.0, 1049.0, 533.0, 248.0, 141.0, 89.0, 73.0, 37.0, 25.0, 13.0, 14.0, 17.0, 5.0, 14.0, 9.0, 7.0, 5.0, 7.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-53.9375, -52.31982421875, -50.7021484375, -49.08447265625, -47.466796875, -45.84912109375, -44.2314453125, -42.61376953125, -40.99609375, -39.37841796875, -37.7607421875, -36.14306640625, -34.525390625, -32.90771484375, -31.2900390625, -29.67236328125, -28.0546875, -26.43701171875, -24.8193359375, -23.20166015625, -21.583984375, -19.96630859375, -18.3486328125, -16.73095703125, -15.11328125, -13.49560546875, -11.8779296875, -10.26025390625, -8.642578125, -7.02490234375, -5.4072265625, -3.78955078125, -2.171875, -0.55419921875, 1.0634765625, 2.68115234375, 4.298828125, 5.91650390625, 7.5341796875, 9.15185546875, 10.76953125, 12.38720703125, 14.0048828125, 15.62255859375, 17.240234375, 18.85791015625, 20.4755859375, 22.09326171875, 23.7109375, 25.32861328125, 26.9462890625, 28.56396484375, 30.181640625, 31.79931640625, 33.4169921875, 35.03466796875, 36.65234375, 38.27001953125, 39.8876953125, 41.50537109375, 43.123046875, 44.74072265625, 46.3583984375, 47.97607421875, 49.59375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 6.0, 9.0, 18.0, 21.0, 39.0, 95.0, 182.0, 213.0, 196.0, 105.0, 66.0, 22.0, 14.0, 5.0, 5.0, 8.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-520.798583984375, -501.9437255859375, -483.0888671875, -464.2339782714844, -445.3791198730469, -426.5242614746094, -407.66937255859375, -388.81451416015625, -369.95965576171875, -351.10479736328125, -332.24993896484375, -313.3950500488281, -294.5401916503906, -275.6853332519531, -256.8304443359375, -237.9755859375, -219.1207275390625, -200.265869140625, -181.41099548339844, -162.55612182617188, -143.70126342773438, -124.84639739990234, -105.99153137207031, -87.13665771484375, -68.28179931640625, -49.42693328857422, -30.572067260742188, -11.717201232910156, 7.137664794921875, 25.992530822753906, 44.84739685058594, 63.7022705078125, 82.55712890625, 101.41199493408203, 120.26686096191406, 139.12173461914062, 157.97659301757812, 176.83145141601562, 195.6863250732422, 214.54119873046875, 233.39605712890625, 252.25091552734375, 271.10577392578125, 289.9606628417969, 308.8155212402344, 327.6703796386719, 346.5252685546875, 365.380126953125, 384.2349853515625, 403.08984375, 421.9447021484375, 440.7995910644531, 459.6544494628906, 478.5093078613281, 497.36419677734375, 516.2190551757812, 535.0739135742188, 553.9287719726562, 572.7836303710938, 591.6384887695312, 610.493408203125, 629.3482666015625, 648.203125, 667.0579833984375, 685.912841796875]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 7.0, 7.0, 2.0, 11.0, 6.0, 15.0, 16.0, 16.0, 13.0, 20.0, 22.0, 26.0, 22.0, 26.0, 38.0, 24.0, 38.0, 39.0, 36.0, 32.0, 42.0, 43.0, 43.0, 45.0, 26.0, 31.0, 43.0, 28.0, 23.0, 31.0, 28.0, 27.0, 24.0, 25.0, 27.0, 24.0, 16.0, 13.0, 7.0, 6.0, 4.0, 9.0, 6.0, 4.0, 6.0, 5.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-185.49554443359375, -179.41937255859375, -173.3431854248047, -167.2670135498047, -161.19082641601562, -155.11465454101562, -149.03846740722656, -142.96229553222656, -136.8861083984375, -130.8099365234375, -124.73374938964844, -118.6575698852539, -112.58139038085938, -106.50521087646484, -100.42903137207031, -94.35285949707031, -88.27667999267578, -82.20050048828125, -76.12432098388672, -70.04814147949219, -63.971961975097656, -57.895782470703125, -51.81960678100586, -45.74342727661133, -39.6672477722168, -33.591068267822266, -27.514888763427734, -21.438711166381836, -15.362531661987305, -9.286352157592773, -3.210174560546875, 2.8660049438476562, 8.942184448242188, 15.018363952636719, 21.09454345703125, 27.17072105407715, 33.24690246582031, 39.323081970214844, 45.39925765991211, 51.47543716430664, 57.55161666870117, 63.6277961730957, 69.70397186279297, 75.7801513671875, 81.85633087158203, 87.93251037597656, 94.0086898803711, 100.08486938476562, 106.16104888916016, 112.23722839355469, 118.31340789794922, 124.38958740234375, 130.46575927734375, 136.5419464111328, 142.6181182861328, 148.69430541992188, 154.77047729492188, 160.84664916992188, 166.92283630371094, 172.99900817871094, 179.0751953125, 185.1513671875, 191.22755432128906, 197.30372619628906, 203.37991333007812]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 8.0, 10.0, 15.0, 19.0, 32.0, 57.0, 129.0, 265.0, 746.0, 2134.0, 8307.0, 41107.0, 266819.0, 590132.0, 113042.0, 19284.0, 4396.0, 1242.0, 429.0, 184.0, 88.0, 52.0, 27.0, 16.0, 11.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-91.0625, -88.0546875, -85.046875, -82.0390625, -79.03125, -76.0234375, -73.015625, -70.0078125, -67.0, -63.9921875, -60.984375, -57.9765625, -54.96875, -51.9609375, -48.953125, -45.9453125, -42.9375, -39.9296875, -36.921875, -33.9140625, -30.90625, -27.8984375, -24.890625, -21.8828125, -18.875, -15.8671875, -12.859375, -9.8515625, -6.84375, -3.8359375, -0.828125, 2.1796875, 5.1875, 8.1953125, 11.203125, 14.2109375, 17.21875, 20.2265625, 23.234375, 26.2421875, 29.25, 32.2578125, 35.265625, 38.2734375, 41.28125, 44.2890625, 47.296875, 50.3046875, 53.3125, 56.3203125, 59.328125, 62.3359375, 65.34375, 68.3515625, 71.359375, 74.3671875, 77.375, 80.3828125, 83.390625, 86.3984375, 89.40625, 92.4140625, 95.421875, 98.4296875, 101.4375]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 10.0, 4.0, 16.0, 27.0, 39.0, 45.0, 61.0, 59.0, 69.0, 72.0, 90.0, 77.0, 83.0, 68.0, 55.0, 56.0, 51.0, 34.0, 36.0, 13.0, 15.0, 12.0, 4.0, 4.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-47.53125, -46.4326171875, -45.333984375, -44.2353515625, -43.13671875, -42.0380859375, -40.939453125, -39.8408203125, -38.7421875, -37.6435546875, -36.544921875, -35.4462890625, -34.34765625, -33.2490234375, -32.150390625, -31.0517578125, -29.953125, -28.8544921875, -27.755859375, -26.6572265625, -25.55859375, -24.4599609375, -23.361328125, -22.2626953125, -21.1640625, -20.0654296875, -18.966796875, -17.8681640625, -16.76953125, -15.6708984375, -14.572265625, -13.4736328125, -12.375, -11.2763671875, -10.177734375, -9.0791015625, -7.98046875, -6.8818359375, -5.783203125, -4.6845703125, -3.5859375, -2.4873046875, -1.388671875, -0.2900390625, 0.80859375, 1.9072265625, 3.005859375, 4.1044921875, 5.203125, 6.3017578125, 7.400390625, 8.4990234375, 9.59765625, 10.6962890625, 11.794921875, 12.8935546875, 13.9921875, 15.0908203125, 16.189453125, 17.2880859375, 18.38671875, 19.4853515625, 20.583984375, 21.6826171875, 22.78125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 8.0, 5.0, 22.0, 15.0, 35.0, 32.0, 49.0, 96.0, 132.0, 231.0, 381.0, 660.0, 1342.0, 2991.0, 7945.0, 27366.0, 124755.0, 616837.0, 205447.0, 41519.0, 11253.0, 3836.0, 1569.0, 812.0, 447.0, 289.0, 169.0, 95.0, 75.0, 48.0, 34.0, 12.0, 17.0, 10.0, 3.0, 5.0, 7.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-93.9375, -91.3740234375, -88.810546875, -86.2470703125, -83.68359375, -81.1201171875, -78.556640625, -75.9931640625, -73.4296875, -70.8662109375, -68.302734375, -65.7392578125, -63.17578125, -60.6123046875, -58.048828125, -55.4853515625, -52.921875, -50.3583984375, -47.794921875, -45.2314453125, -42.66796875, -40.1044921875, -37.541015625, -34.9775390625, -32.4140625, -29.8505859375, -27.287109375, -24.7236328125, -22.16015625, -19.5966796875, -17.033203125, -14.4697265625, -11.90625, -9.3427734375, -6.779296875, -4.2158203125, -1.65234375, 0.9111328125, 3.474609375, 6.0380859375, 8.6015625, 11.1650390625, 13.728515625, 16.2919921875, 18.85546875, 21.4189453125, 23.982421875, 26.5458984375, 29.109375, 31.6728515625, 34.236328125, 36.7998046875, 39.36328125, 41.9267578125, 44.490234375, 47.0537109375, 49.6171875, 52.1806640625, 54.744140625, 57.3076171875, 59.87109375, 62.4345703125, 64.998046875, 67.5615234375, 70.125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 3.0, 8.0, 5.0, 15.0, 10.0, 17.0, 19.0, 13.0, 24.0, 23.0, 28.0, 35.0, 27.0, 29.0, 46.0, 40.0, 47.0, 50.0, 49.0, 42.0, 48.0, 47.0, 50.0, 35.0, 43.0, 25.0, 35.0, 27.0, 19.0, 28.0, 22.0, 9.0, 9.0, 18.0, 11.0, 5.0, 11.0, 0.0, 6.0, 2.0, 6.0, 5.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-76.9375, -74.3701171875, -71.802734375, -69.2353515625, -66.66796875, -64.1005859375, -61.533203125, -58.9658203125, -56.3984375, -53.8310546875, -51.263671875, -48.6962890625, -46.12890625, -43.5615234375, -40.994140625, -38.4267578125, -35.859375, -33.2919921875, -30.724609375, -28.1572265625, -25.58984375, -23.0224609375, -20.455078125, -17.8876953125, -15.3203125, -12.7529296875, -10.185546875, -7.6181640625, -5.05078125, -2.4833984375, 0.083984375, 2.6513671875, 5.21875, 7.7861328125, 10.353515625, 12.9208984375, 15.48828125, 18.0556640625, 20.623046875, 23.1904296875, 25.7578125, 28.3251953125, 30.892578125, 33.4599609375, 36.02734375, 38.5947265625, 41.162109375, 43.7294921875, 46.296875, 48.8642578125, 51.431640625, 53.9990234375, 56.56640625, 59.1337890625, 61.701171875, 64.2685546875, 66.8359375, 69.4033203125, 71.970703125, 74.5380859375, 77.10546875, 79.6728515625, 82.240234375, 84.8076171875, 87.375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 5.0, 10.0, 11.0, 17.0, 25.0, 47.0, 45.0, 93.0, 171.0, 332.0, 871.0, 2737.0, 13679.0, 195415.0, 783156.0, 43740.0, 5583.0, 1486.0, 543.0, 255.0, 112.0, 85.0, 39.0, 31.0, 17.0, 11.0, 7.0, 8.0, 11.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.25, -41.537109375, -39.82421875, -38.111328125, -36.3984375, -34.685546875, -32.97265625, -31.259765625, -29.546875, -27.833984375, -26.12109375, -24.408203125, -22.6953125, -20.982421875, -19.26953125, -17.556640625, -15.84375, -14.130859375, -12.41796875, -10.705078125, -8.9921875, -7.279296875, -5.56640625, -3.853515625, -2.140625, -0.427734375, 1.28515625, 2.998046875, 4.7109375, 6.423828125, 8.13671875, 9.849609375, 11.5625, 13.275390625, 14.98828125, 16.701171875, 18.4140625, 20.126953125, 21.83984375, 23.552734375, 25.265625, 26.978515625, 28.69140625, 30.404296875, 32.1171875, 33.830078125, 35.54296875, 37.255859375, 38.96875, 40.681640625, 42.39453125, 44.107421875, 45.8203125, 47.533203125, 49.24609375, 50.958984375, 52.671875, 54.384765625, 56.09765625, 57.810546875, 59.5234375, 61.236328125, 62.94921875, 64.662109375, 66.375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 5.0, 11.0, 7.0, 7.0, 15.0, 24.0, 20.0, 34.0, 37.0, 65.0, 66.0, 73.0, 115.0, 114.0, 97.0, 61.0, 67.0, 55.0, 27.0, 22.0, 27.0, 12.0, 12.0, 10.0, 10.0, 2.0, 3.0, 3.0, 2.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006763458251953125, -0.006570994853973389, -0.006378531455993652, -0.006186068058013916, -0.00599360466003418, -0.005801141262054443, -0.005608677864074707, -0.005416214466094971, -0.005223751068115234, -0.005031287670135498, -0.004838824272155762, -0.004646360874176025, -0.004453897476196289, -0.004261434078216553, -0.004068970680236816, -0.00387650728225708, -0.0036840438842773438, -0.0034915804862976074, -0.003299117088317871, -0.0031066536903381348, -0.0029141902923583984, -0.002721726894378662, -0.0025292634963989258, -0.0023368000984191895, -0.002144336700439453, -0.0019518733024597168, -0.0017594099044799805, -0.0015669465065002441, -0.0013744831085205078, -0.0011820197105407715, -0.0009895563125610352, -0.0007970929145812988, -0.0006046295166015625, -0.00041216611862182617, -0.00021970272064208984, -2.7239322662353516e-05, 0.0001652240753173828, 0.00035768747329711914, 0.0005501508712768555, 0.0007426142692565918, 0.0009350776672363281, 0.0011275410652160645, 0.0013200044631958008, 0.0015124678611755371, 0.0017049312591552734, 0.0018973946571350098, 0.002089858055114746, 0.0022823214530944824, 0.0024747848510742188, 0.002667248249053955, 0.0028597116470336914, 0.0030521750450134277, 0.003244638442993164, 0.0034371018409729004, 0.0036295652389526367, 0.003822028636932373, 0.004014492034912109, 0.004206955432891846, 0.004399418830871582, 0.004591882228851318, 0.004784345626831055, 0.004976809024810791, 0.005169272422790527, 0.005361735820770264, 0.00555419921875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 3.0, 8.0, 8.0, 17.0, 13.0, 24.0, 43.0, 46.0, 108.0, 155.0, 306.0, 577.0, 1079.0, 2475.0, 7036.0, 27665.0, 194920.0, 686138.0, 101728.0, 17272.0, 4911.0, 1998.0, 886.0, 460.0, 256.0, 145.0, 96.0, 61.0, 37.0, 23.0, 17.0, 12.0, 8.0, 5.0, 8.0, 5.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-33.90625, -32.82470703125, -31.7431640625, -30.66162109375, -29.580078125, -28.49853515625, -27.4169921875, -26.33544921875, -25.25390625, -24.17236328125, -23.0908203125, -22.00927734375, -20.927734375, -19.84619140625, -18.7646484375, -17.68310546875, -16.6015625, -15.52001953125, -14.4384765625, -13.35693359375, -12.275390625, -11.19384765625, -10.1123046875, -9.03076171875, -7.94921875, -6.86767578125, -5.7861328125, -4.70458984375, -3.623046875, -2.54150390625, -1.4599609375, -0.37841796875, 0.703125, 1.78466796875, 2.8662109375, 3.94775390625, 5.029296875, 6.11083984375, 7.1923828125, 8.27392578125, 9.35546875, 10.43701171875, 11.5185546875, 12.60009765625, 13.681640625, 14.76318359375, 15.8447265625, 16.92626953125, 18.0078125, 19.08935546875, 20.1708984375, 21.25244140625, 22.333984375, 23.41552734375, 24.4970703125, 25.57861328125, 26.66015625, 27.74169921875, 28.8232421875, 29.90478515625, 30.986328125, 32.06787109375, 33.1494140625, 34.23095703125, 35.3125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 8.0, 16.0, 11.0, 31.0, 27.0, 44.0, 72.0, 102.0, 97.0, 126.0, 119.0, 104.0, 74.0, 53.0, 39.0, 16.0, 16.0, 15.0, 7.0, 6.0, 4.0, 8.0, 0.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.59375, -35.322265625, -34.05078125, -32.779296875, -31.5078125, -30.236328125, -28.96484375, -27.693359375, -26.421875, -25.150390625, -23.87890625, -22.607421875, -21.3359375, -20.064453125, -18.79296875, -17.521484375, -16.25, -14.978515625, -13.70703125, -12.435546875, -11.1640625, -9.892578125, -8.62109375, -7.349609375, -6.078125, -4.806640625, -3.53515625, -2.263671875, -0.9921875, 0.279296875, 1.55078125, 2.822265625, 4.09375, 5.365234375, 6.63671875, 7.908203125, 9.1796875, 10.451171875, 11.72265625, 12.994140625, 14.265625, 15.537109375, 16.80859375, 18.080078125, 19.3515625, 20.623046875, 21.89453125, 23.166015625, 24.4375, 25.708984375, 26.98046875, 28.251953125, 29.5234375, 30.794921875, 32.06640625, 33.337890625, 34.609375, 35.880859375, 37.15234375, 38.423828125, 39.6953125, 40.966796875, 42.23828125, 43.509765625, 44.78125]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 1.0, 6.0, 9.0, 13.0, 21.0, 65.0, 121.0, 193.0, 226.0, 162.0, 80.0, 50.0, 23.0, 14.0, 5.0, 2.0, 1.0, 5.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-844.7828369140625, -820.2403564453125, -795.6979370117188, -771.1554565429688, -746.6129760742188, -722.070556640625, -697.528076171875, -672.985595703125, -648.4431762695312, -623.9006958007812, -599.3582763671875, -574.8157958984375, -550.2733154296875, -525.7308959960938, -501.18841552734375, -476.6459655761719, -452.1034851074219, -427.56103515625, -403.0185546875, -378.4761047363281, -353.93365478515625, -329.39117431640625, -304.8487243652344, -280.3062744140625, -255.76380920410156, -231.22134399414062, -206.67889404296875, -182.1364288330078, -157.59396362304688, -133.051513671875, -108.50904846191406, -83.96659851074219, -59.42413330078125, -34.881675720214844, -10.339214324951172, 14.2032470703125, 38.745704650878906, 63.28816223144531, 87.83062744140625, 112.37307739257812, 136.91554260253906, 161.4580078125, 186.00045776367188, 210.5429229736328, 235.08538818359375, 259.6278381347656, 284.1702880859375, 308.7127685546875, 333.2552185058594, 357.79766845703125, 382.34014892578125, 406.8825988769531, 431.425048828125, 455.967529296875, 480.5099792480469, 505.05242919921875, 529.5949096679688, 554.1373901367188, 578.6798095703125, 603.2222900390625, 627.7647705078125, 652.3071899414062, 676.8496704101562, 701.39208984375, 725.9345703125]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 6.0, 2.0, 5.0, 4.0, 9.0, 14.0, 17.0, 15.0, 11.0, 18.0, 19.0, 30.0, 30.0, 35.0, 36.0, 35.0, 37.0, 47.0, 52.0, 65.0, 60.0, 53.0, 34.0, 43.0, 43.0, 47.0, 29.0, 23.0, 31.0, 23.0, 29.0, 21.0, 18.0, 21.0, 10.0, 10.0, 7.0, 6.0, 6.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-310.74908447265625, -299.2730407714844, -287.7969970703125, -276.3209533691406, -264.84490966796875, -253.3688507080078, -241.89279174804688, -230.416748046875, -218.94070434570312, -207.46466064453125, -195.98861694335938, -184.51255798339844, -173.03651428222656, -161.5604705810547, -150.08441162109375, -138.60836791992188, -127.13232421875, -115.65628051757812, -104.18022918701172, -92.70417785644531, -81.22813415527344, -69.75209045410156, -58.276039123535156, -46.79998779296875, -35.323944091796875, -23.847896575927734, -12.371849060058594, -0.8958015441894531, 10.580245971679688, 22.056293487548828, 33.53234100341797, 45.008392333984375, 56.484405517578125, 67.96044921875, 79.4365005493164, 90.91255187988281, 102.38859558105469, 113.86463928222656, 125.34069061279297, 136.81674194335938, 148.29278564453125, 159.76882934570312, 171.244873046875, 182.72093200683594, 194.1969757080078, 205.6730194091797, 217.14907836914062, 228.6251220703125, 240.10116577148438, 251.57720947265625, 263.0532531738281, 274.529296875, 286.00537109375, 297.4814147949219, 308.95745849609375, 320.4335021972656, 331.9095458984375, 343.3855895996094, 354.86163330078125, 366.3376770019531, 377.813720703125, 389.289794921875, 400.7658386230469, 412.24188232421875, 423.7179260253906]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 2.0, 4.0, 4.0, 5.0, 7.0, 8.0, 23.0, 26.0, 43.0, 74.0, 169.0, 471.0, 1103.0, 3701.0, 15559.0, 94453.0, 2428740.0, 1562501.0, 69442.0, 12641.0, 3359.0, 1059.0, 421.0, 198.0, 87.0, 80.0, 33.0, 25.0, 14.0, 6.0, 6.0, 4.0, 3.0, 9.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-76.25, -74.29150390625, -72.3330078125, -70.37451171875, -68.416015625, -66.45751953125, -64.4990234375, -62.54052734375, -60.58203125, -58.62353515625, -56.6650390625, -54.70654296875, -52.748046875, -50.78955078125, -48.8310546875, -46.87255859375, -44.9140625, -42.95556640625, -40.9970703125, -39.03857421875, -37.080078125, -35.12158203125, -33.1630859375, -31.20458984375, -29.24609375, -27.28759765625, -25.3291015625, -23.37060546875, -21.412109375, -19.45361328125, -17.4951171875, -15.53662109375, -13.578125, -11.61962890625, -9.6611328125, -7.70263671875, -5.744140625, -3.78564453125, -1.8271484375, 0.13134765625, 2.08984375, 4.04833984375, 6.0068359375, 7.96533203125, 9.923828125, 11.88232421875, 13.8408203125, 15.79931640625, 17.7578125, 19.71630859375, 21.6748046875, 23.63330078125, 25.591796875, 27.55029296875, 29.5087890625, 31.46728515625, 33.42578125, 35.38427734375, 37.3427734375, 39.30126953125, 41.259765625, 43.21826171875, 45.1767578125, 47.13525390625, 49.09375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 7.0, 4.0, 7.0, 8.0, 11.0, 18.0, 17.0, 23.0, 25.0, 41.0, 40.0, 40.0, 32.0, 51.0, 52.0, 59.0, 60.0, 79.0, 56.0, 50.0, 54.0, 32.0, 46.0, 30.0, 33.0, 29.0, 21.0, 19.0, 14.0, 18.0, 10.0, 10.0, 5.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-25.171875, -24.4755859375, -23.779296875, -23.0830078125, -22.38671875, -21.6904296875, -20.994140625, -20.2978515625, -19.6015625, -18.9052734375, -18.208984375, -17.5126953125, -16.81640625, -16.1201171875, -15.423828125, -14.7275390625, -14.03125, -13.3349609375, -12.638671875, -11.9423828125, -11.24609375, -10.5498046875, -9.853515625, -9.1572265625, -8.4609375, -7.7646484375, -7.068359375, -6.3720703125, -5.67578125, -4.9794921875, -4.283203125, -3.5869140625, -2.890625, -2.1943359375, -1.498046875, -0.8017578125, -0.10546875, 0.5908203125, 1.287109375, 1.9833984375, 2.6796875, 3.3759765625, 4.072265625, 4.7685546875, 5.46484375, 6.1611328125, 6.857421875, 7.5537109375, 8.25, 8.9462890625, 9.642578125, 10.3388671875, 11.03515625, 11.7314453125, 12.427734375, 13.1240234375, 13.8203125, 14.5166015625, 15.212890625, 15.9091796875, 16.60546875, 17.3017578125, 17.998046875, 18.6943359375, 19.390625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 8.0, 7.0, 10.0, 10.0, 17.0, 30.0, 36.0, 52.0, 63.0, 92.0, 128.0, 273.0, 455.0, 757.0, 1362.0, 2660.0, 5688.0, 12934.0, 33723.0, 105147.0, 583510.0, 2863722.0, 440730.0, 91615.0, 29529.0, 11505.0, 4946.0, 2303.0, 1190.0, 678.0, 368.0, 212.0, 157.0, 85.0, 76.0, 47.0, 43.0, 22.0, 21.0, 19.0, 9.0, 10.0, 6.0, 6.0, 8.0, 4.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-36.4375, -35.19970703125, -33.9619140625, -32.72412109375, -31.486328125, -30.24853515625, -29.0107421875, -27.77294921875, -26.53515625, -25.29736328125, -24.0595703125, -22.82177734375, -21.583984375, -20.34619140625, -19.1083984375, -17.87060546875, -16.6328125, -15.39501953125, -14.1572265625, -12.91943359375, -11.681640625, -10.44384765625, -9.2060546875, -7.96826171875, -6.73046875, -5.49267578125, -4.2548828125, -3.01708984375, -1.779296875, -0.54150390625, 0.6962890625, 1.93408203125, 3.171875, 4.40966796875, 5.6474609375, 6.88525390625, 8.123046875, 9.36083984375, 10.5986328125, 11.83642578125, 13.07421875, 14.31201171875, 15.5498046875, 16.78759765625, 18.025390625, 19.26318359375, 20.5009765625, 21.73876953125, 22.9765625, 24.21435546875, 25.4521484375, 26.68994140625, 27.927734375, 29.16552734375, 30.4033203125, 31.64111328125, 32.87890625, 34.11669921875, 35.3544921875, 36.59228515625, 37.830078125, 39.06787109375, 40.3056640625, 41.54345703125, 42.78125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 8.0, 2.0, 5.0, 4.0, 6.0, 10.0, 11.0, 14.0, 19.0, 34.0, 31.0, 54.0, 62.0, 116.0, 179.0, 291.0, 665.0, 802.0, 699.0, 364.0, 231.0, 150.0, 91.0, 69.0, 44.0, 31.0, 26.0, 14.0, 12.0, 9.0, 9.0, 6.0, 6.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.65625, -57.71533203125, -55.7744140625, -53.83349609375, -51.892578125, -49.95166015625, -48.0107421875, -46.06982421875, -44.12890625, -42.18798828125, -40.2470703125, -38.30615234375, -36.365234375, -34.42431640625, -32.4833984375, -30.54248046875, -28.6015625, -26.66064453125, -24.7197265625, -22.77880859375, -20.837890625, -18.89697265625, -16.9560546875, -15.01513671875, -13.07421875, -11.13330078125, -9.1923828125, -7.25146484375, -5.310546875, -3.36962890625, -1.4287109375, 0.51220703125, 2.453125, 4.39404296875, 6.3349609375, 8.27587890625, 10.216796875, 12.15771484375, 14.0986328125, 16.03955078125, 17.98046875, 19.92138671875, 21.8623046875, 23.80322265625, 25.744140625, 27.68505859375, 29.6259765625, 31.56689453125, 33.5078125, 35.44873046875, 37.3896484375, 39.33056640625, 41.271484375, 43.21240234375, 45.1533203125, 47.09423828125, 49.03515625, 50.97607421875, 52.9169921875, 54.85791015625, 56.798828125, 58.73974609375, 60.6806640625, 62.62158203125, 64.5625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 7.0, 3.0, 12.0, 43.0, 81.0, 210.0, 323.0, 200.0, 69.0, 26.0, 10.0, 6.0, 8.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-433.897216796875, -401.48358154296875, -369.0699462890625, -336.65631103515625, -304.24267578125, -271.82904052734375, -239.41543579101562, -207.00180053710938, -174.58816528320312, -142.17453002929688, -109.76090240478516, -77.34727478027344, -44.93363952636719, -12.520004272460938, 19.89361572265625, 52.3072509765625, 84.72088623046875, 117.134521484375, 149.54815673828125, 181.96177673339844, 214.3754119873047, 246.78904724121094, 279.2026672363281, 311.6163024902344, 344.0299377441406, 376.4435729980469, 408.8572082519531, 441.27081298828125, 473.6844482421875, 506.09808349609375, 538.51171875, 570.9253540039062, 603.3389892578125, 635.7526245117188, 668.166259765625, 700.5798950195312, 732.9935302734375, 765.4071655273438, 797.82080078125, 830.234375, 862.6480712890625, 895.0617065429688, 927.475341796875, 959.8889770507812, 992.3026123046875, 1024.7161865234375, 1057.1298828125, 1089.54345703125, 1121.95703125, 1154.37060546875, 1186.7843017578125, 1219.1978759765625, 1251.611572265625, 1284.025146484375, 1316.4388427734375, 1348.8524169921875, 1381.26611328125, 1413.6796875, 1446.0933837890625, 1478.5069580078125, 1510.920654296875, 1543.334228515625, 1575.7479248046875, 1608.1614990234375, 1640.5751953125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 6.0, 4.0, 5.0, 4.0, 5.0, 7.0, 7.0, 12.0, 8.0, 7.0, 16.0, 13.0, 21.0, 25.0, 21.0, 25.0, 35.0, 36.0, 37.0, 45.0, 45.0, 47.0, 35.0, 46.0, 52.0, 40.0, 43.0, 37.0, 47.0, 35.0, 41.0, 31.0, 21.0, 24.0, 21.0, 15.0, 15.0, 13.0, 19.0, 9.0, 9.0, 4.0, 7.0, 4.0, 3.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0], "bins": [-301.70928955078125, -293.31610107421875, -284.9228820800781, -276.5296630859375, -268.136474609375, -259.7432861328125, -251.35006713867188, -242.9568634033203, -234.56365966796875, -226.1704559326172, -217.77725219726562, -209.38404846191406, -200.9908447265625, -192.59764099121094, -184.20443725585938, -175.8112335205078, -167.41802978515625, -159.0248260498047, -150.63162231445312, -142.23841857910156, -133.84521484375, -125.45201110839844, -117.05880737304688, -108.66560363769531, -100.27239990234375, -91.87919616699219, -83.48599243164062, -75.09278869628906, -66.6995849609375, -58.30638122558594, -49.913177490234375, -41.51997375488281, -33.12678527832031, -24.73358154296875, -16.340377807617188, -7.947174072265625, 0.4460296630859375, 8.8392333984375, 17.232437133789062, 25.625640869140625, 34.01884460449219, 42.41204833984375, 50.80525207519531, 59.198455810546875, 67.59165954589844, 75.98486328125, 84.37806701660156, 92.77127075195312, 101.16447448730469, 109.55767822265625, 117.95088195800781, 126.34408569335938, 134.73728942871094, 143.1304931640625, 151.52369689941406, 159.91690063476562, 168.3101043701172, 176.70330810546875, 185.0965118408203, 193.48971557617188, 201.88291931152344, 210.276123046875, 218.66932678222656, 227.06253051757812, 235.4557342529297]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 7.0, 12.0, 6.0, 27.0, 39.0, 53.0, 102.0, 205.0, 518.0, 1687.0, 6403.0, 29905.0, 168116.0, 585459.0, 208659.0, 36712.0, 7495.0, 2001.0, 643.0, 234.0, 133.0, 50.0, 31.0, 20.0, 14.0, 10.0, 5.0, 2.0, 2.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-105.1875, -102.310546875, -99.43359375, -96.556640625, -93.6796875, -90.802734375, -87.92578125, -85.048828125, -82.171875, -79.294921875, -76.41796875, -73.541015625, -70.6640625, -67.787109375, -64.91015625, -62.033203125, -59.15625, -56.279296875, -53.40234375, -50.525390625, -47.6484375, -44.771484375, -41.89453125, -39.017578125, -36.140625, -33.263671875, -30.38671875, -27.509765625, -24.6328125, -21.755859375, -18.87890625, -16.001953125, -13.125, -10.248046875, -7.37109375, -4.494140625, -1.6171875, 1.259765625, 4.13671875, 7.013671875, 9.890625, 12.767578125, 15.64453125, 18.521484375, 21.3984375, 24.275390625, 27.15234375, 30.029296875, 32.90625, 35.783203125, 38.66015625, 41.537109375, 44.4140625, 47.291015625, 50.16796875, 53.044921875, 55.921875, 58.798828125, 61.67578125, 64.552734375, 67.4296875, 70.306640625, 73.18359375, 76.060546875, 78.9375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 11.0, 8.0, 13.0, 15.0, 20.0, 24.0, 22.0, 39.0, 39.0, 42.0, 31.0, 53.0, 47.0, 50.0, 57.0, 66.0, 53.0, 53.0, 59.0, 40.0, 37.0, 38.0, 37.0, 27.0, 18.0, 25.0, 19.0, 13.0, 4.0, 15.0, 7.0, 10.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.90625, -24.20166015625, -23.4970703125, -22.79248046875, -22.087890625, -21.38330078125, -20.6787109375, -19.97412109375, -19.26953125, -18.56494140625, -17.8603515625, -17.15576171875, -16.451171875, -15.74658203125, -15.0419921875, -14.33740234375, -13.6328125, -12.92822265625, -12.2236328125, -11.51904296875, -10.814453125, -10.10986328125, -9.4052734375, -8.70068359375, -7.99609375, -7.29150390625, -6.5869140625, -5.88232421875, -5.177734375, -4.47314453125, -3.7685546875, -3.06396484375, -2.359375, -1.65478515625, -0.9501953125, -0.24560546875, 0.458984375, 1.16357421875, 1.8681640625, 2.57275390625, 3.27734375, 3.98193359375, 4.6865234375, 5.39111328125, 6.095703125, 6.80029296875, 7.5048828125, 8.20947265625, 8.9140625, 9.61865234375, 10.3232421875, 11.02783203125, 11.732421875, 12.43701171875, 13.1416015625, 13.84619140625, 14.55078125, 15.25537109375, 15.9599609375, 16.66455078125, 17.369140625, 18.07373046875, 18.7783203125, 19.48291015625, 20.1875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 7.0, 6.0, 10.0, 7.0, 22.0, 26.0, 33.0, 41.0, 51.0, 56.0, 96.0, 162.0, 200.0, 316.0, 411.0, 668.0, 1037.0, 1846.0, 3521.0, 8932.0, 32776.0, 178264.0, 660289.0, 121314.0, 23837.0, 7117.0, 2967.0, 1592.0, 971.0, 589.0, 413.0, 281.0, 181.0, 145.0, 98.0, 81.0, 58.0, 33.0, 20.0, 36.0, 17.0, 11.0, 6.0, 8.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-95.1875, -92.3369140625, -89.486328125, -86.6357421875, -83.78515625, -80.9345703125, -78.083984375, -75.2333984375, -72.3828125, -69.5322265625, -66.681640625, -63.8310546875, -60.98046875, -58.1298828125, -55.279296875, -52.4287109375, -49.578125, -46.7275390625, -43.876953125, -41.0263671875, -38.17578125, -35.3251953125, -32.474609375, -29.6240234375, -26.7734375, -23.9228515625, -21.072265625, -18.2216796875, -15.37109375, -12.5205078125, -9.669921875, -6.8193359375, -3.96875, -1.1181640625, 1.732421875, 4.5830078125, 7.43359375, 10.2841796875, 13.134765625, 15.9853515625, 18.8359375, 21.6865234375, 24.537109375, 27.3876953125, 30.23828125, 33.0888671875, 35.939453125, 38.7900390625, 41.640625, 44.4912109375, 47.341796875, 50.1923828125, 53.04296875, 55.8935546875, 58.744140625, 61.5947265625, 64.4453125, 67.2958984375, 70.146484375, 72.9970703125, 75.84765625, 78.6982421875, 81.548828125, 84.3994140625, 87.25]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 4.0, 3.0, 2.0, 4.0, 8.0, 9.0, 10.0, 18.0, 6.0, 16.0, 19.0, 23.0, 36.0, 34.0, 35.0, 39.0, 36.0, 55.0, 62.0, 46.0, 50.0, 54.0, 66.0, 40.0, 52.0, 48.0, 36.0, 45.0, 33.0, 23.0, 20.0, 25.0, 6.0, 14.0, 6.0, 12.0, 4.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-117.0, -113.580078125, -110.16015625, -106.740234375, -103.3203125, -99.900390625, -96.48046875, -93.060546875, -89.640625, -86.220703125, -82.80078125, -79.380859375, -75.9609375, -72.541015625, -69.12109375, -65.701171875, -62.28125, -58.861328125, -55.44140625, -52.021484375, -48.6015625, -45.181640625, -41.76171875, -38.341796875, -34.921875, -31.501953125, -28.08203125, -24.662109375, -21.2421875, -17.822265625, -14.40234375, -10.982421875, -7.5625, -4.142578125, -0.72265625, 2.697265625, 6.1171875, 9.537109375, 12.95703125, 16.376953125, 19.796875, 23.216796875, 26.63671875, 30.056640625, 33.4765625, 36.896484375, 40.31640625, 43.736328125, 47.15625, 50.576171875, 53.99609375, 57.416015625, 60.8359375, 64.255859375, 67.67578125, 71.095703125, 74.515625, 77.935546875, 81.35546875, 84.775390625, 88.1953125, 91.615234375, 95.03515625, 98.455078125, 101.875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 3.0, 11.0, 9.0, 6.0, 7.0, 10.0, 16.0, 11.0, 18.0, 36.0, 44.0, 48.0, 97.0, 178.0, 354.0, 968.0, 3706.0, 43336.0, 915200.0, 77201.0, 5190.0, 1140.0, 413.0, 170.0, 102.0, 68.0, 61.0, 37.0, 36.0, 9.0, 16.0, 6.0, 11.0, 9.0, 4.0, 3.0, 6.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-59.4375, -57.61328125, -55.7890625, -53.96484375, -52.140625, -50.31640625, -48.4921875, -46.66796875, -44.84375, -43.01953125, -41.1953125, -39.37109375, -37.546875, -35.72265625, -33.8984375, -32.07421875, -30.25, -28.42578125, -26.6015625, -24.77734375, -22.953125, -21.12890625, -19.3046875, -17.48046875, -15.65625, -13.83203125, -12.0078125, -10.18359375, -8.359375, -6.53515625, -4.7109375, -2.88671875, -1.0625, 0.76171875, 2.5859375, 4.41015625, 6.234375, 8.05859375, 9.8828125, 11.70703125, 13.53125, 15.35546875, 17.1796875, 19.00390625, 20.828125, 22.65234375, 24.4765625, 26.30078125, 28.125, 29.94921875, 31.7734375, 33.59765625, 35.421875, 37.24609375, 39.0703125, 40.89453125, 42.71875, 44.54296875, 46.3671875, 48.19140625, 50.015625, 51.83984375, 53.6640625, 55.48828125, 57.3125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 6.0, 4.0, 3.0, 6.0, 3.0, 6.0, 12.0, 12.0, 12.0, 10.0, 16.0, 24.0, 11.0, 33.0, 34.0, 45.0, 50.0, 74.0, 73.0, 82.0, 92.0, 70.0, 58.0, 50.0, 48.0, 33.0, 26.0, 22.0, 15.0, 14.0, 13.0, 14.0, 9.0, 8.0, 3.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.004913330078125, -0.00474858283996582, -0.004583835601806641, -0.004419088363647461, -0.004254341125488281, -0.0040895938873291016, -0.003924846649169922, -0.003760099411010742, -0.0035953521728515625, -0.003430604934692383, -0.003265857696533203, -0.0031011104583740234, -0.0029363632202148438, -0.002771615982055664, -0.0026068687438964844, -0.0024421215057373047, -0.002277374267578125, -0.0021126270294189453, -0.0019478797912597656, -0.001783132553100586, -0.0016183853149414062, -0.0014536380767822266, -0.0012888908386230469, -0.0011241436004638672, -0.0009593963623046875, -0.0007946491241455078, -0.0006299018859863281, -0.00046515464782714844, -0.00030040740966796875, -0.00013566017150878906, 2.9087066650390625e-05, 0.0001938343048095703, 0.00035858154296875, 0.0005233287811279297, 0.0006880760192871094, 0.0008528232574462891, 0.0010175704956054688, 0.0011823177337646484, 0.0013470649719238281, 0.0015118122100830078, 0.0016765594482421875, 0.0018413066864013672, 0.002006053924560547, 0.0021708011627197266, 0.0023355484008789062, 0.002500295639038086, 0.0026650428771972656, 0.0028297901153564453, 0.002994537353515625, 0.0031592845916748047, 0.0033240318298339844, 0.003488779067993164, 0.0036535263061523438, 0.0038182735443115234, 0.003983020782470703, 0.004147768020629883, 0.0043125152587890625, 0.004477262496948242, 0.004642009735107422, 0.0048067569732666016, 0.004971504211425781, 0.005136251449584961, 0.005300998687744141, 0.00546574592590332, 0.0056304931640625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 5.0, 2.0, 4.0, 11.0, 11.0, 31.0, 34.0, 75.0, 129.0, 252.0, 560.0, 1698.0, 7353.0, 261921.0, 763236.0, 9972.0, 2018.0, 665.0, 267.0, 133.0, 67.0, 42.0, 25.0, 19.0, 10.0, 6.0, 6.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-98.0625, -95.09765625, -92.1328125, -89.16796875, -86.203125, -83.23828125, -80.2734375, -77.30859375, -74.34375, -71.37890625, -68.4140625, -65.44921875, -62.484375, -59.51953125, -56.5546875, -53.58984375, -50.625, -47.66015625, -44.6953125, -41.73046875, -38.765625, -35.80078125, -32.8359375, -29.87109375, -26.90625, -23.94140625, -20.9765625, -18.01171875, -15.046875, -12.08203125, -9.1171875, -6.15234375, -3.1875, -0.22265625, 2.7421875, 5.70703125, 8.671875, 11.63671875, 14.6015625, 17.56640625, 20.53125, 23.49609375, 26.4609375, 29.42578125, 32.390625, 35.35546875, 38.3203125, 41.28515625, 44.25, 47.21484375, 50.1796875, 53.14453125, 56.109375, 59.07421875, 62.0390625, 65.00390625, 67.96875, 70.93359375, 73.8984375, 76.86328125, 79.828125, 82.79296875, 85.7578125, 88.72265625, 91.6875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 2.0, 1.0, 5.0, 10.0, 5.0, 10.0, 13.0, 17.0, 25.0, 25.0, 30.0, 44.0, 54.0, 58.0, 86.0, 93.0, 116.0, 77.0, 76.0, 57.0, 39.0, 40.0, 26.0, 22.0, 27.0, 9.0, 7.0, 7.0, 9.0, 4.0, 3.0, 3.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.515625, -25.637451171875, -24.75927734375, -23.881103515625, -23.0029296875, -22.124755859375, -21.24658203125, -20.368408203125, -19.490234375, -18.612060546875, -17.73388671875, -16.855712890625, -15.9775390625, -15.099365234375, -14.22119140625, -13.343017578125, -12.46484375, -11.586669921875, -10.70849609375, -9.830322265625, -8.9521484375, -8.073974609375, -7.19580078125, -6.317626953125, -5.439453125, -4.561279296875, -3.68310546875, -2.804931640625, -1.9267578125, -1.048583984375, -0.17041015625, 0.707763671875, 1.5859375, 2.464111328125, 3.34228515625, 4.220458984375, 5.0986328125, 5.976806640625, 6.85498046875, 7.733154296875, 8.611328125, 9.489501953125, 10.36767578125, 11.245849609375, 12.1240234375, 13.002197265625, 13.88037109375, 14.758544921875, 15.63671875, 16.514892578125, 17.39306640625, 18.271240234375, 19.1494140625, 20.027587890625, 20.90576171875, 21.783935546875, 22.662109375, 23.540283203125, 24.41845703125, 25.296630859375, 26.1748046875, 27.052978515625, 27.93115234375, 28.809326171875, 29.6875]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 2.0, 12.0, 19.0, 35.0, 83.0, 147.0, 284.0, 200.0, 121.0, 57.0, 19.0, 7.0, 8.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-978.4988403320312, -950.3035888671875, -922.1082763671875, -893.9130249023438, -865.7177734375, -837.5225219726562, -809.3272705078125, -781.1319580078125, -752.9367065429688, -724.741455078125, -696.546142578125, -668.3508911132812, -640.1556396484375, -611.9603881835938, -583.76513671875, -555.56982421875, -527.3745727539062, -499.1793212890625, -470.9840393066406, -442.78875732421875, -414.593505859375, -386.39825439453125, -358.2029724121094, -330.0076904296875, -301.81243896484375, -273.6171875, -245.42190551757812, -217.2266387939453, -189.0313720703125, -160.8361053466797, -132.64083862304688, -104.44557189941406, -76.25030517578125, -48.05503845214844, -19.859771728515625, 8.335494995117188, 36.53076171875, 64.72602844238281, 92.92129516601562, 121.11656188964844, 149.31182861328125, 177.50709533691406, 205.70236206054688, 233.8976287841797, 262.0928955078125, 290.28814697265625, 318.4834289550781, 346.6787109375, 374.87396240234375, 403.0692138671875, 431.2644958496094, 459.45977783203125, 487.655029296875, 515.8502807617188, 544.0455322265625, 572.2408447265625, 600.4360961914062, 628.63134765625, 656.82666015625, 685.0219116210938, 713.2171630859375, 741.4124145507812, 769.607666015625, 797.802978515625, 825.9982299804688]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 5.0, 2.0, 9.0, 8.0, 6.0, 12.0, 13.0, 22.0, 17.0, 24.0, 22.0, 26.0, 32.0, 32.0, 34.0, 43.0, 40.0, 42.0, 57.0, 57.0, 70.0, 56.0, 52.0, 44.0, 38.0, 35.0, 25.0, 29.0, 29.0, 19.0, 21.0, 17.0, 13.0, 17.0, 9.0, 10.0, 4.0, 2.0, 8.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-329.3806457519531, -318.7096862792969, -308.03875732421875, -297.3677978515625, -286.6968688964844, -276.0259094238281, -265.35498046875, -254.68402099609375, -244.01307678222656, -233.34213256835938, -222.6711883544922, -212.000244140625, -201.32928466796875, -190.65835571289062, -179.98739624023438, -169.3164520263672, -158.6455078125, -147.9745635986328, -137.30361938476562, -126.6326675415039, -115.96172332763672, -105.29077911376953, -94.61982727050781, -83.94888305664062, -73.27793884277344, -62.60699462890625, -51.9360466003418, -41.265098571777344, -30.594154357910156, -19.92321014404297, -9.25225830078125, 1.4186859130859375, 12.08966064453125, 22.76060676574707, 33.43155288696289, 44.102500915527344, 54.77344512939453, 65.44438934326172, 76.11534118652344, 86.78628540039062, 97.45722961425781, 108.128173828125, 118.79911804199219, 129.47006225585938, 140.14102172851562, 150.81195068359375, 161.48291015625, 172.1538543701172, 182.82479858398438, 193.49574279785156, 204.16668701171875, 214.837646484375, 225.50857543945312, 236.17953491210938, 246.85047912597656, 257.52142333984375, 268.1923828125, 278.86334228515625, 289.5342712402344, 300.2052307128906, 310.87615966796875, 321.547119140625, 332.21807861328125, 342.8890075683594, 353.5599365234375]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 12.0, 26.0, 36.0, 32.0, 58.0, 119.0, 299.0, 1475.0, 17344.0, 3696304.0, 470470.0, 6836.0, 816.0, 220.0, 103.0, 45.0, 34.0, 19.0, 11.0, 9.0, 7.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-190.375, -186.0322265625, -181.689453125, -177.3466796875, -173.00390625, -168.6611328125, -164.318359375, -159.9755859375, -155.6328125, -151.2900390625, -146.947265625, -142.6044921875, -138.26171875, -133.9189453125, -129.576171875, -125.2333984375, -120.890625, -116.5478515625, -112.205078125, -107.8623046875, -103.51953125, -99.1767578125, -94.833984375, -90.4912109375, -86.1484375, -81.8056640625, -77.462890625, -73.1201171875, -68.77734375, -64.4345703125, -60.091796875, -55.7490234375, -51.40625, -47.0634765625, -42.720703125, -38.3779296875, -34.03515625, -29.6923828125, -25.349609375, -21.0068359375, -16.6640625, -12.3212890625, -7.978515625, -3.6357421875, 0.70703125, 5.0498046875, 9.392578125, 13.7353515625, 18.078125, 22.4208984375, 26.763671875, 31.1064453125, 35.44921875, 39.7919921875, 44.134765625, 48.4775390625, 52.8203125, 57.1630859375, 61.505859375, 65.8486328125, 70.19140625, 74.5341796875, 78.876953125, 83.2197265625, 87.5625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 2.0, 1.0, 3.0, 6.0, 10.0, 4.0, 13.0, 10.0, 10.0, 14.0, 20.0, 23.0, 20.0, 23.0, 32.0, 36.0, 40.0, 44.0, 47.0, 42.0, 39.0, 55.0, 55.0, 52.0, 42.0, 39.0, 39.0, 31.0, 39.0, 43.0, 33.0, 19.0, 23.0, 17.0, 11.0, 14.0, 15.0, 8.0, 11.0, 6.0, 6.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.53125, -16.9091796875, -16.287109375, -15.6650390625, -15.04296875, -14.4208984375, -13.798828125, -13.1767578125, -12.5546875, -11.9326171875, -11.310546875, -10.6884765625, -10.06640625, -9.4443359375, -8.822265625, -8.2001953125, -7.578125, -6.9560546875, -6.333984375, -5.7119140625, -5.08984375, -4.4677734375, -3.845703125, -3.2236328125, -2.6015625, -1.9794921875, -1.357421875, -0.7353515625, -0.11328125, 0.5087890625, 1.130859375, 1.7529296875, 2.375, 2.9970703125, 3.619140625, 4.2412109375, 4.86328125, 5.4853515625, 6.107421875, 6.7294921875, 7.3515625, 7.9736328125, 8.595703125, 9.2177734375, 9.83984375, 10.4619140625, 11.083984375, 11.7060546875, 12.328125, 12.9501953125, 13.572265625, 14.1943359375, 14.81640625, 15.4384765625, 16.060546875, 16.6826171875, 17.3046875, 17.9267578125, 18.548828125, 19.1708984375, 19.79296875, 20.4150390625, 21.037109375, 21.6591796875, 22.28125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 7.0, 5.0, 8.0, 15.0, 28.0, 29.0, 37.0, 71.0, 130.0, 234.0, 457.0, 983.0, 2187.0, 5604.0, 16324.0, 60457.0, 391637.0, 3237476.0, 390994.0, 60612.0, 16744.0, 5904.0, 2301.0, 1032.0, 477.0, 204.0, 120.0, 83.0, 45.0, 24.0, 18.0, 13.0, 9.0, 5.0, 7.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.78125, -56.1982421875, -54.615234375, -53.0322265625, -51.44921875, -49.8662109375, -48.283203125, -46.7001953125, -45.1171875, -43.5341796875, -41.951171875, -40.3681640625, -38.78515625, -37.2021484375, -35.619140625, -34.0361328125, -32.453125, -30.8701171875, -29.287109375, -27.7041015625, -26.12109375, -24.5380859375, -22.955078125, -21.3720703125, -19.7890625, -18.2060546875, -16.623046875, -15.0400390625, -13.45703125, -11.8740234375, -10.291015625, -8.7080078125, -7.125, -5.5419921875, -3.958984375, -2.3759765625, -0.79296875, 0.7900390625, 2.373046875, 3.9560546875, 5.5390625, 7.1220703125, 8.705078125, 10.2880859375, 11.87109375, 13.4541015625, 15.037109375, 16.6201171875, 18.203125, 19.7861328125, 21.369140625, 22.9521484375, 24.53515625, 26.1181640625, 27.701171875, 29.2841796875, 30.8671875, 32.4501953125, 34.033203125, 35.6162109375, 37.19921875, 38.7822265625, 40.365234375, 41.9482421875, 43.53125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 9.0, 2.0, 7.0, 7.0, 5.0, 6.0, 15.0, 18.0, 20.0, 29.0, 49.0, 47.0, 74.0, 124.0, 155.0, 275.0, 513.0, 723.0, 711.0, 431.0, 267.0, 167.0, 106.0, 85.0, 62.0, 49.0, 28.0, 21.0, 21.0, 6.0, 13.0, 4.0, 9.0, 5.0, 5.0, 6.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-55.4375, -53.75927734375, -52.0810546875, -50.40283203125, -48.724609375, -47.04638671875, -45.3681640625, -43.68994140625, -42.01171875, -40.33349609375, -38.6552734375, -36.97705078125, -35.298828125, -33.62060546875, -31.9423828125, -30.26416015625, -28.5859375, -26.90771484375, -25.2294921875, -23.55126953125, -21.873046875, -20.19482421875, -18.5166015625, -16.83837890625, -15.16015625, -13.48193359375, -11.8037109375, -10.12548828125, -8.447265625, -6.76904296875, -5.0908203125, -3.41259765625, -1.734375, -0.05615234375, 1.6220703125, 3.30029296875, 4.978515625, 6.65673828125, 8.3349609375, 10.01318359375, 11.69140625, 13.36962890625, 15.0478515625, 16.72607421875, 18.404296875, 20.08251953125, 21.7607421875, 23.43896484375, 25.1171875, 26.79541015625, 28.4736328125, 30.15185546875, 31.830078125, 33.50830078125, 35.1865234375, 36.86474609375, 38.54296875, 40.22119140625, 41.8994140625, 43.57763671875, 45.255859375, 46.93408203125, 48.6123046875, 50.29052734375, 51.96875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 6.0, 7.0, 21.0, 58.0, 200.0, 353.0, 227.0, 87.0, 24.0, 13.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-472.80474853515625, -440.0065002441406, -407.208251953125, -374.40997314453125, -341.6117248535156, -308.8134765625, -276.01519775390625, -243.21694946289062, -210.418701171875, -177.62045288085938, -144.8221893310547, -112.02393341064453, -79.22567749023438, -46.42742919921875, -13.629165649414062, 19.169097900390625, 51.96734619140625, 84.7656021118164, 117.56385803222656, 150.36212158203125, 183.16036987304688, 215.9586181640625, 248.7568817138672, 281.5551452636719, 314.3533935546875, 347.1516418457031, 379.94989013671875, 412.7481689453125, 445.5464172363281, 478.34466552734375, 511.1429443359375, 543.941162109375, 576.739501953125, 609.5377807617188, 642.3359985351562, 675.13427734375, 707.9324951171875, 740.7307739257812, 773.529052734375, 806.3272705078125, 839.1255493164062, 871.923828125, 904.7220458984375, 937.5203247070312, 970.318603515625, 1003.1168212890625, 1035.9150390625, 1068.71337890625, 1101.5115966796875, 1134.309814453125, 1167.108154296875, 1199.9063720703125, 1232.70458984375, 1265.5029296875, 1298.3011474609375, 1331.099365234375, 1363.897705078125, 1396.6959228515625, 1429.4942626953125, 1462.29248046875, 1495.0906982421875, 1527.888916015625, 1560.687255859375, 1593.4854736328125, 1626.28369140625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 4.0, 11.0, 6.0, 9.0, 8.0, 6.0, 15.0, 12.0, 26.0, 22.0, 34.0, 34.0, 44.0, 47.0, 38.0, 45.0, 60.0, 55.0, 61.0, 53.0, 45.0, 40.0, 40.0, 50.0, 35.0, 36.0, 25.0, 26.0, 18.0, 21.0, 14.0, 23.0, 12.0, 8.0, 9.0, 5.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-293.5535888671875, -284.6994934082031, -275.8453674316406, -266.99127197265625, -258.13714599609375, -249.28305053710938, -240.42893981933594, -231.5748291015625, -222.72071838378906, -213.86660766601562, -205.0124969482422, -196.15838623046875, -187.30429077148438, -178.45016479492188, -169.5960693359375, -160.74195861816406, -151.88784790039062, -143.0337371826172, -134.17962646484375, -125.32552337646484, -116.4714126586914, -107.61730194091797, -98.76319885253906, -89.90908813476562, -81.05497741699219, -72.20086669921875, -63.34675979614258, -54.492652893066406, -45.63854217529297, -36.78443145751953, -27.93032455444336, -19.076217651367188, -10.22210693359375, -1.3679981231689453, 7.486110687255859, 16.340219497680664, 25.19432830810547, 34.048439025878906, 42.90254592895508, 51.75665283203125, 60.61076354980469, 69.46487426757812, 78.31898498535156, 87.17308807373047, 96.0271987915039, 104.88130950927734, 113.73541259765625, 122.58952331542969, 131.44363403320312, 140.29774475097656, 149.15185546875, 158.00596618652344, 166.86007690429688, 175.71417236328125, 184.5682830810547, 193.42239379882812, 202.27650451660156, 211.130615234375, 219.98472595214844, 228.83883666992188, 237.69293212890625, 246.54705810546875, 255.40115356445312, 264.2552490234375, 273.109375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 0.0, 6.0, 6.0, 4.0, 10.0, 12.0, 18.0, 46.0, 65.0, 111.0, 228.0, 569.0, 1439.0, 3877.0, 11746.0, 46374.0, 244964.0, 571273.0, 128750.0, 27087.0, 7492.0, 2625.0, 985.0, 436.0, 179.0, 97.0, 46.0, 26.0, 18.0, 17.0, 12.0, 7.0, 6.0, 7.0, 4.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.53125, -61.02197265625, -58.5126953125, -56.00341796875, -53.494140625, -50.98486328125, -48.4755859375, -45.96630859375, -43.45703125, -40.94775390625, -38.4384765625, -35.92919921875, -33.419921875, -30.91064453125, -28.4013671875, -25.89208984375, -23.3828125, -20.87353515625, -18.3642578125, -15.85498046875, -13.345703125, -10.83642578125, -8.3271484375, -5.81787109375, -3.30859375, -0.79931640625, 1.7099609375, 4.21923828125, 6.728515625, 9.23779296875, 11.7470703125, 14.25634765625, 16.765625, 19.27490234375, 21.7841796875, 24.29345703125, 26.802734375, 29.31201171875, 31.8212890625, 34.33056640625, 36.83984375, 39.34912109375, 41.8583984375, 44.36767578125, 46.876953125, 49.38623046875, 51.8955078125, 54.40478515625, 56.9140625, 59.42333984375, 61.9326171875, 64.44189453125, 66.951171875, 69.46044921875, 71.9697265625, 74.47900390625, 76.98828125, 79.49755859375, 82.0068359375, 84.51611328125, 87.025390625, 89.53466796875, 92.0439453125, 94.55322265625, 97.0625]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 3.0, 5.0, 9.0, 4.0, 0.0, 6.0, 10.0, 11.0, 7.0, 14.0, 11.0, 15.0, 26.0, 20.0, 22.0, 18.0, 34.0, 19.0, 34.0, 28.0, 29.0, 38.0, 26.0, 43.0, 51.0, 44.0, 39.0, 56.0, 33.0, 30.0, 46.0, 38.0, 27.0, 29.0, 25.0, 19.0, 22.0, 15.0, 21.0, 13.0, 11.0, 10.0, 6.0, 7.0, 6.0, 8.0, 9.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0], "bins": [-19.09375, -18.533447265625, -17.97314453125, -17.412841796875, -16.8525390625, -16.292236328125, -15.73193359375, -15.171630859375, -14.611328125, -14.051025390625, -13.49072265625, -12.930419921875, -12.3701171875, -11.809814453125, -11.24951171875, -10.689208984375, -10.12890625, -9.568603515625, -9.00830078125, -8.447998046875, -7.8876953125, -7.327392578125, -6.76708984375, -6.206787109375, -5.646484375, -5.086181640625, -4.52587890625, -3.965576171875, -3.4052734375, -2.844970703125, -2.28466796875, -1.724365234375, -1.1640625, -0.603759765625, -0.04345703125, 0.516845703125, 1.0771484375, 1.637451171875, 2.19775390625, 2.758056640625, 3.318359375, 3.878662109375, 4.43896484375, 4.999267578125, 5.5595703125, 6.119873046875, 6.68017578125, 7.240478515625, 7.80078125, 8.361083984375, 8.92138671875, 9.481689453125, 10.0419921875, 10.602294921875, 11.16259765625, 11.722900390625, 12.283203125, 12.843505859375, 13.40380859375, 13.964111328125, 14.5244140625, 15.084716796875, 15.64501953125, 16.205322265625, 16.765625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 3.0, 3.0, 1.0, 4.0, 9.0, 12.0, 19.0, 13.0, 23.0, 39.0, 56.0, 67.0, 99.0, 177.0, 289.0, 485.0, 1012.0, 2283.0, 7096.0, 40197.0, 732853.0, 235179.0, 20318.0, 4595.0, 1739.0, 815.0, 413.0, 285.0, 156.0, 98.0, 58.0, 40.0, 31.0, 30.0, 12.0, 10.0, 14.0, 5.0, 4.0, 7.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-138.5, -134.1484375, -129.796875, -125.4453125, -121.09375, -116.7421875, -112.390625, -108.0390625, -103.6875, -99.3359375, -94.984375, -90.6328125, -86.28125, -81.9296875, -77.578125, -73.2265625, -68.875, -64.5234375, -60.171875, -55.8203125, -51.46875, -47.1171875, -42.765625, -38.4140625, -34.0625, -29.7109375, -25.359375, -21.0078125, -16.65625, -12.3046875, -7.953125, -3.6015625, 0.75, 5.1015625, 9.453125, 13.8046875, 18.15625, 22.5078125, 26.859375, 31.2109375, 35.5625, 39.9140625, 44.265625, 48.6171875, 52.96875, 57.3203125, 61.671875, 66.0234375, 70.375, 74.7265625, 79.078125, 83.4296875, 87.78125, 92.1328125, 96.484375, 100.8359375, 105.1875, 109.5390625, 113.890625, 118.2421875, 122.59375, 126.9453125, 131.296875, 135.6484375, 140.0]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 2.0, 0.0, 0.0, 4.0, 5.0, 5.0, 4.0, 13.0, 16.0, 9.0, 19.0, 22.0, 28.0, 44.0, 49.0, 38.0, 61.0, 68.0, 61.0, 73.0, 77.0, 61.0, 59.0, 55.0, 39.0, 42.0, 31.0, 27.0, 25.0, 10.0, 16.0, 7.0, 9.0, 8.0, 6.0, 6.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-127.1875, -123.5283203125, -119.869140625, -116.2099609375, -112.55078125, -108.8916015625, -105.232421875, -101.5732421875, -97.9140625, -94.2548828125, -90.595703125, -86.9365234375, -83.27734375, -79.6181640625, -75.958984375, -72.2998046875, -68.640625, -64.9814453125, -61.322265625, -57.6630859375, -54.00390625, -50.3447265625, -46.685546875, -43.0263671875, -39.3671875, -35.7080078125, -32.048828125, -28.3896484375, -24.73046875, -21.0712890625, -17.412109375, -13.7529296875, -10.09375, -6.4345703125, -2.775390625, 0.8837890625, 4.54296875, 8.2021484375, 11.861328125, 15.5205078125, 19.1796875, 22.8388671875, 26.498046875, 30.1572265625, 33.81640625, 37.4755859375, 41.134765625, 44.7939453125, 48.453125, 52.1123046875, 55.771484375, 59.4306640625, 63.08984375, 66.7490234375, 70.408203125, 74.0673828125, 77.7265625, 81.3857421875, 85.044921875, 88.7041015625, 92.36328125, 96.0224609375, 99.681640625, 103.3408203125, 107.0]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 2.0, 6.0, 3.0, 3.0, 10.0, 13.0, 21.0, 23.0, 31.0, 57.0, 85.0, 165.0, 362.0, 826.0, 2579.0, 12858.0, 257563.0, 746038.0, 22305.0, 3641.0, 1106.0, 399.0, 161.0, 98.0, 56.0, 29.0, 27.0, 14.0, 18.0, 7.0, 5.0, 10.0, 4.0, 5.0, 4.0, 6.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-48.59375, -47.0810546875, -45.568359375, -44.0556640625, -42.54296875, -41.0302734375, -39.517578125, -38.0048828125, -36.4921875, -34.9794921875, -33.466796875, -31.9541015625, -30.44140625, -28.9287109375, -27.416015625, -25.9033203125, -24.390625, -22.8779296875, -21.365234375, -19.8525390625, -18.33984375, -16.8271484375, -15.314453125, -13.8017578125, -12.2890625, -10.7763671875, -9.263671875, -7.7509765625, -6.23828125, -4.7255859375, -3.212890625, -1.7001953125, -0.1875, 1.3251953125, 2.837890625, 4.3505859375, 5.86328125, 7.3759765625, 8.888671875, 10.4013671875, 11.9140625, 13.4267578125, 14.939453125, 16.4521484375, 17.96484375, 19.4775390625, 20.990234375, 22.5029296875, 24.015625, 25.5283203125, 27.041015625, 28.5537109375, 30.06640625, 31.5791015625, 33.091796875, 34.6044921875, 36.1171875, 37.6298828125, 39.142578125, 40.6552734375, 42.16796875, 43.6806640625, 45.193359375, 46.7060546875, 48.21875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 2.0, 3.0, 6.0, 4.0, 7.0, 4.0, 10.0, 14.0, 17.0, 25.0, 31.0, 30.0, 36.0, 71.0, 86.0, 142.0, 131.0, 138.0, 68.0, 43.0, 32.0, 26.0, 22.0, 9.0, 15.0, 8.0, 2.0, 4.0, 3.0, 3.0, 2.0, 3.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00748443603515625, -0.007258474826812744, -0.007032513618469238, -0.006806552410125732, -0.0065805912017822266, -0.006354629993438721, -0.006128668785095215, -0.005902707576751709, -0.005676746368408203, -0.005450785160064697, -0.005224823951721191, -0.0049988627433776855, -0.00477290153503418, -0.004546940326690674, -0.004320979118347168, -0.004095017910003662, -0.0038690567016601562, -0.0036430954933166504, -0.0034171342849731445, -0.0031911730766296387, -0.002965211868286133, -0.002739250659942627, -0.002513289451599121, -0.0022873282432556152, -0.0020613670349121094, -0.0018354058265686035, -0.0016094446182250977, -0.0013834834098815918, -0.001157522201538086, -0.0009315609931945801, -0.0007055997848510742, -0.00047963857650756836, -0.0002536773681640625, -2.771615982055664e-05, 0.00019824504852294922, 0.0004242062568664551, 0.0006501674652099609, 0.0008761286735534668, 0.0011020898818969727, 0.0013280510902404785, 0.0015540122985839844, 0.0017799735069274902, 0.002005934715270996, 0.002231895923614502, 0.002457857131958008, 0.0026838183403015137, 0.0029097795486450195, 0.0031357407569885254, 0.0033617019653320312, 0.003587663173675537, 0.003813624382019043, 0.004039585590362549, 0.004265546798706055, 0.0044915080070495605, 0.004717469215393066, 0.004943430423736572, 0.005169391632080078, 0.005395352840423584, 0.00562131404876709, 0.005847275257110596, 0.0060732364654541016, 0.006299197673797607, 0.006525158882141113, 0.006751120090484619, 0.006977081298828125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 1.0, 5.0, 6.0, 6.0, 9.0, 11.0, 14.0, 33.0, 26.0, 57.0, 81.0, 99.0, 177.0, 311.0, 599.0, 1257.0, 3324.0, 11923.0, 107438.0, 833029.0, 74622.0, 10103.0, 2986.0, 1108.0, 550.0, 269.0, 157.0, 100.0, 83.0, 50.0, 32.0, 21.0, 17.0, 13.0, 6.0, 14.0, 8.0, 4.0, 6.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-31.21875, -30.158203125, -29.09765625, -28.037109375, -26.9765625, -25.916015625, -24.85546875, -23.794921875, -22.734375, -21.673828125, -20.61328125, -19.552734375, -18.4921875, -17.431640625, -16.37109375, -15.310546875, -14.25, -13.189453125, -12.12890625, -11.068359375, -10.0078125, -8.947265625, -7.88671875, -6.826171875, -5.765625, -4.705078125, -3.64453125, -2.583984375, -1.5234375, -0.462890625, 0.59765625, 1.658203125, 2.71875, 3.779296875, 4.83984375, 5.900390625, 6.9609375, 8.021484375, 9.08203125, 10.142578125, 11.203125, 12.263671875, 13.32421875, 14.384765625, 15.4453125, 16.505859375, 17.56640625, 18.626953125, 19.6875, 20.748046875, 21.80859375, 22.869140625, 23.9296875, 24.990234375, 26.05078125, 27.111328125, 28.171875, 29.232421875, 30.29296875, 31.353515625, 32.4140625, 33.474609375, 34.53515625, 35.595703125, 36.65625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 3.0, 3.0, 6.0, 5.0, 4.0, 9.0, 13.0, 9.0, 24.0, 25.0, 29.0, 48.0, 62.0, 78.0, 78.0, 94.0, 103.0, 92.0, 70.0, 71.0, 39.0, 30.0, 26.0, 22.0, 16.0, 11.0, 8.0, 1.0, 10.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.328125, -21.500244140625, -20.67236328125, -19.844482421875, -19.0166015625, -18.188720703125, -17.36083984375, -16.532958984375, -15.705078125, -14.877197265625, -14.04931640625, -13.221435546875, -12.3935546875, -11.565673828125, -10.73779296875, -9.909912109375, -9.08203125, -8.254150390625, -7.42626953125, -6.598388671875, -5.7705078125, -4.942626953125, -4.11474609375, -3.286865234375, -2.458984375, -1.631103515625, -0.80322265625, 0.024658203125, 0.8525390625, 1.680419921875, 2.50830078125, 3.336181640625, 4.1640625, 4.991943359375, 5.81982421875, 6.647705078125, 7.4755859375, 8.303466796875, 9.13134765625, 9.959228515625, 10.787109375, 11.614990234375, 12.44287109375, 13.270751953125, 14.0986328125, 14.926513671875, 15.75439453125, 16.582275390625, 17.41015625, 18.238037109375, 19.06591796875, 19.893798828125, 20.7216796875, 21.549560546875, 22.37744140625, 23.205322265625, 24.033203125, 24.861083984375, 25.68896484375, 26.516845703125, 27.3447265625, 28.172607421875, 29.00048828125, 29.828369140625, 30.65625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 7.0, 2.0, 10.0, 26.0, 39.0, 143.0, 365.0, 275.0, 89.0, 22.0, 13.0, 2.0, 5.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-742.5076904296875, -706.910400390625, -671.3131103515625, -635.7158203125, -600.1185302734375, -564.521240234375, -528.9239501953125, -493.32666015625, -457.7293701171875, -422.132080078125, -386.5347900390625, -350.9375, -315.3402099609375, -279.742919921875, -244.1456298828125, -208.54833984375, -172.9510498046875, -137.353759765625, -101.7564697265625, -66.1591796875, -30.5618896484375, 5.035400390625, 40.6326904296875, 76.22998046875, 111.8272705078125, 147.424560546875, 183.0218505859375, 218.619140625, 254.2164306640625, 289.813720703125, 325.4110107421875, 361.00830078125, 396.605712890625, 432.2030029296875, 467.80029296875, 503.3975830078125, 538.994873046875, 574.5921630859375, 610.189453125, 645.7867431640625, 681.384033203125, 716.9813232421875, 752.57861328125, 788.1759033203125, 823.773193359375, 859.3704833984375, 894.9677734375, 930.5650634765625, 966.162353515625, 1001.7596435546875, 1037.35693359375, 1072.9542236328125, 1108.551513671875, 1144.1488037109375, 1179.74609375, 1215.3433837890625, 1250.940673828125, 1286.5379638671875, 1322.13525390625, 1357.7325439453125, 1393.329833984375, 1428.9271240234375, 1464.5244140625, 1500.1217041015625, 1535.718994140625]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 0.0, 0.0, 4.0, 3.0, 2.0, 3.0, 9.0, 8.0, 10.0, 12.0, 11.0, 11.0, 16.0, 25.0, 24.0, 20.0, 24.0, 27.0, 26.0, 42.0, 37.0, 49.0, 60.0, 69.0, 64.0, 59.0, 53.0, 39.0, 44.0, 22.0, 24.0, 34.0, 20.0, 20.0, 29.0, 16.0, 18.0, 12.0, 16.0, 11.0, 4.0, 3.0, 5.0, 9.0, 5.0, 7.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-374.6380615234375, -363.3945007324219, -352.1509094238281, -340.9073486328125, -329.66375732421875, -318.4201965332031, -307.1766357421875, -295.93304443359375, -284.689453125, -273.4458923339844, -262.2023010253906, -250.958740234375, -239.71514892578125, -228.47158813476562, -217.22801208496094, -205.98443603515625, -194.74087524414062, -183.49729919433594, -172.25372314453125, -161.01016235351562, -149.76657104492188, -138.52301025390625, -127.27943420410156, -116.03585815429688, -104.79228210449219, -93.5487060546875, -82.30513000488281, -71.06156158447266, -59.81798553466797, -48.57440948486328, -37.330841064453125, -26.087265014648438, -14.84368896484375, -3.6001148223876953, 7.643459320068359, 18.88703155517578, 30.13060760498047, 41.374183654785156, 52.61775207519531, 63.861328125, 75.10490417480469, 86.34848022460938, 97.59205627441406, 108.83562469482422, 120.0792007446289, 131.32278442382812, 142.56634521484375, 153.80992126464844, 165.05349731445312, 176.2970733642578, 187.5406494140625, 198.78421020507812, 210.02780151367188, 221.2713623046875, 232.5149383544922, 243.75851440429688, 255.00209045410156, 266.24566650390625, 277.4892272949219, 288.7328186035156, 299.97637939453125, 311.219970703125, 322.4635314941406, 333.70709228515625, 344.95068359375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 6.0, 9.0, 2.0, 18.0, 25.0, 32.0, 35.0, 66.0, 116.0, 151.0, 235.0, 458.0, 999.0, 2493.0, 8428.0, 47529.0, 2387911.0, 1697011.0, 37312.0, 7227.0, 2228.0, 911.0, 435.0, 272.0, 137.0, 75.0, 45.0, 38.0, 25.0, 19.0, 13.0, 11.0, 6.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.84375, -49.76611328125, -47.6884765625, -45.61083984375, -43.533203125, -41.45556640625, -39.3779296875, -37.30029296875, -35.22265625, -33.14501953125, -31.0673828125, -28.98974609375, -26.912109375, -24.83447265625, -22.7568359375, -20.67919921875, -18.6015625, -16.52392578125, -14.4462890625, -12.36865234375, -10.291015625, -8.21337890625, -6.1357421875, -4.05810546875, -1.98046875, 0.09716796875, 2.1748046875, 4.25244140625, 6.330078125, 8.40771484375, 10.4853515625, 12.56298828125, 14.640625, 16.71826171875, 18.7958984375, 20.87353515625, 22.951171875, 25.02880859375, 27.1064453125, 29.18408203125, 31.26171875, 33.33935546875, 35.4169921875, 37.49462890625, 39.572265625, 41.64990234375, 43.7275390625, 45.80517578125, 47.8828125, 49.96044921875, 52.0380859375, 54.11572265625, 56.193359375, 58.27099609375, 60.3486328125, 62.42626953125, 64.50390625, 66.58154296875, 68.6591796875, 70.73681640625, 72.814453125, 74.89208984375, 76.9697265625, 79.04736328125, 81.125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 4.0, 13.0, 10.0, 13.0, 11.0, 13.0, 22.0, 17.0, 26.0, 17.0, 28.0, 23.0, 31.0, 35.0, 34.0, 34.0, 35.0, 39.0, 39.0, 49.0, 42.0, 44.0, 34.0, 37.0, 34.0, 26.0, 34.0, 32.0, 36.0, 25.0, 24.0, 21.0, 19.0, 18.0, 14.0, 13.0, 7.0, 9.0, 12.0, 5.0, 2.0, 5.0, 2.0, 0.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 3.0], "bins": [-17.46875, -16.925537109375, -16.38232421875, -15.839111328125, -15.2958984375, -14.752685546875, -14.20947265625, -13.666259765625, -13.123046875, -12.579833984375, -12.03662109375, -11.493408203125, -10.9501953125, -10.406982421875, -9.86376953125, -9.320556640625, -8.77734375, -8.234130859375, -7.69091796875, -7.147705078125, -6.6044921875, -6.061279296875, -5.51806640625, -4.974853515625, -4.431640625, -3.888427734375, -3.34521484375, -2.802001953125, -2.2587890625, -1.715576171875, -1.17236328125, -0.629150390625, -0.0859375, 0.457275390625, 1.00048828125, 1.543701171875, 2.0869140625, 2.630126953125, 3.17333984375, 3.716552734375, 4.259765625, 4.802978515625, 5.34619140625, 5.889404296875, 6.4326171875, 6.975830078125, 7.51904296875, 8.062255859375, 8.60546875, 9.148681640625, 9.69189453125, 10.235107421875, 10.7783203125, 11.321533203125, 11.86474609375, 12.407958984375, 12.951171875, 13.494384765625, 14.03759765625, 14.580810546875, 15.1240234375, 15.667236328125, 16.21044921875, 16.753662109375, 17.296875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 6.0, 7.0, 5.0, 12.0, 12.0, 22.0, 28.0, 44.0, 82.0, 141.0, 285.0, 506.0, 1157.0, 2915.0, 9518.0, 51201.0, 1931068.0, 2130171.0, 53247.0, 9217.0, 2550.0, 1021.0, 473.0, 252.0, 134.0, 79.0, 45.0, 32.0, 17.0, 7.0, 4.0, 5.0, 10.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.875, -69.3974609375, -66.919921875, -64.4423828125, -61.96484375, -59.4873046875, -57.009765625, -54.5322265625, -52.0546875, -49.5771484375, -47.099609375, -44.6220703125, -42.14453125, -39.6669921875, -37.189453125, -34.7119140625, -32.234375, -29.7568359375, -27.279296875, -24.8017578125, -22.32421875, -19.8466796875, -17.369140625, -14.8916015625, -12.4140625, -9.9365234375, -7.458984375, -4.9814453125, -2.50390625, -0.0263671875, 2.451171875, 4.9287109375, 7.40625, 9.8837890625, 12.361328125, 14.8388671875, 17.31640625, 19.7939453125, 22.271484375, 24.7490234375, 27.2265625, 29.7041015625, 32.181640625, 34.6591796875, 37.13671875, 39.6142578125, 42.091796875, 44.5693359375, 47.046875, 49.5244140625, 52.001953125, 54.4794921875, 56.95703125, 59.4345703125, 61.912109375, 64.3896484375, 66.8671875, 69.3447265625, 71.822265625, 74.2998046875, 76.77734375, 79.2548828125, 81.732421875, 84.2099609375, 86.6875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 9.0, 6.0, 8.0, 10.0, 23.0, 28.0, 40.0, 61.0, 90.0, 183.0, 478.0, 1004.0, 1034.0, 560.0, 222.0, 98.0, 77.0, 40.0, 29.0, 23.0, 12.0, 15.0, 7.0, 1.0, 6.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.625, -67.234375, -64.84375, -62.453125, -60.0625, -57.671875, -55.28125, -52.890625, -50.5, -48.109375, -45.71875, -43.328125, -40.9375, -38.546875, -36.15625, -33.765625, -31.375, -28.984375, -26.59375, -24.203125, -21.8125, -19.421875, -17.03125, -14.640625, -12.25, -9.859375, -7.46875, -5.078125, -2.6875, -0.296875, 2.09375, 4.484375, 6.875, 9.265625, 11.65625, 14.046875, 16.4375, 18.828125, 21.21875, 23.609375, 26.0, 28.390625, 30.78125, 33.171875, 35.5625, 37.953125, 40.34375, 42.734375, 45.125, 47.515625, 49.90625, 52.296875, 54.6875, 57.078125, 59.46875, 61.859375, 64.25, 66.640625, 69.03125, 71.421875, 73.8125, 76.203125, 78.59375, 80.984375, 83.375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 4.0, 9.0, 16.0, 17.0, 47.0, 126.0, 241.0, 261.0, 159.0, 58.0, 27.0, 9.0, 9.0, 3.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-789.8038330078125, -768.443115234375, -747.0823364257812, -725.7216186523438, -704.3609008789062, -683.0001831054688, -661.639404296875, -640.2786865234375, -618.91796875, -597.5572509765625, -576.1964721679688, -554.8357543945312, -533.4750366210938, -512.1143188476562, -490.7535400390625, -469.392822265625, -448.0320739746094, -426.67132568359375, -405.31060791015625, -383.9498596191406, -362.5891418457031, -341.2283935546875, -319.86767578125, -298.5069274902344, -277.14617919921875, -255.7854461669922, -234.42471313476562, -213.06396484375, -191.7032470703125, -170.34249877929688, -148.9817657470703, -127.62103271484375, -106.26031494140625, -84.89958190917969, -63.53884506225586, -42.17810821533203, -20.81737518310547, 0.5433578491210938, 21.904098510742188, 43.26483154296875, 64.62556457519531, 85.98629760742188, 107.34703063964844, 128.707763671875, 150.06851196289062, 171.42922973632812, 192.78997802734375, 214.1507110595703, 235.51144409179688, 256.8721923828125, 278.23291015625, 299.5936584472656, 320.9543762207031, 342.31512451171875, 363.67584228515625, 385.0365905761719, 406.3973388671875, 427.7580871582031, 449.1188049316406, 470.47955322265625, 491.84027099609375, 513.2009887695312, 534.561767578125, 555.9224853515625, 577.283203125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 5.0, 3.0, 14.0, 5.0, 11.0, 19.0, 19.0, 19.0, 39.0, 40.0, 48.0, 57.0, 62.0, 60.0, 81.0, 78.0, 55.0, 55.0, 57.0, 51.0, 51.0, 40.0, 33.0, 20.0, 19.0, 13.0, 13.0, 11.0, 7.0, 0.0, 5.0, 8.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-317.19891357421875, -307.2953796386719, -297.391845703125, -287.4883117675781, -277.58477783203125, -267.6812438964844, -257.7777099609375, -247.87417602539062, -237.97064208984375, -228.06710815429688, -218.16357421875, -208.26004028320312, -198.35650634765625, -188.45297241210938, -178.5494384765625, -168.64590454101562, -158.74237060546875, -148.83883666992188, -138.935302734375, -129.03176879882812, -119.12823486328125, -109.22470092773438, -99.3211669921875, -89.41763305664062, -79.51409912109375, -69.61056518554688, -59.70703125, -49.803497314453125, -39.89996337890625, -29.996429443359375, -20.0928955078125, -10.189361572265625, -0.28582763671875, 9.617706298828125, 19.521240234375, 29.424774169921875, 39.32830810546875, 49.231842041015625, 59.1353759765625, 69.03890991210938, 78.94244384765625, 88.84597778320312, 98.74951171875, 108.65304565429688, 118.55657958984375, 128.46011352539062, 138.3636474609375, 148.26718139648438, 158.17071533203125, 168.07424926757812, 177.977783203125, 187.88131713867188, 197.78485107421875, 207.68838500976562, 217.5919189453125, 227.49545288085938, 237.39898681640625, 247.30252075195312, 257.2060546875, 267.1095886230469, 277.01312255859375, 286.9166564941406, 296.8201904296875, 306.7237243652344, 316.62725830078125]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 6.0, 4.0, 4.0, 8.0, 12.0, 14.0, 22.0, 40.0, 44.0, 54.0, 147.0, 232.0, 402.0, 717.0, 1352.0, 2640.0, 5650.0, 12704.0, 31656.0, 84645.0, 223082.0, 351675.0, 205395.0, 76783.0, 28995.0, 11693.0, 5147.0, 2560.0, 1228.0, 672.0, 383.0, 225.0, 132.0, 87.0, 55.0, 31.0, 31.0, 13.0, 4.0, 6.0, 4.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.5625, -24.51708984375, -23.4716796875, -22.42626953125, -21.380859375, -20.33544921875, -19.2900390625, -18.24462890625, -17.19921875, -16.15380859375, -15.1083984375, -14.06298828125, -13.017578125, -11.97216796875, -10.9267578125, -9.88134765625, -8.8359375, -7.79052734375, -6.7451171875, -5.69970703125, -4.654296875, -3.60888671875, -2.5634765625, -1.51806640625, -0.47265625, 0.57275390625, 1.6181640625, 2.66357421875, 3.708984375, 4.75439453125, 5.7998046875, 6.84521484375, 7.890625, 8.93603515625, 9.9814453125, 11.02685546875, 12.072265625, 13.11767578125, 14.1630859375, 15.20849609375, 16.25390625, 17.29931640625, 18.3447265625, 19.39013671875, 20.435546875, 21.48095703125, 22.5263671875, 23.57177734375, 24.6171875, 25.66259765625, 26.7080078125, 27.75341796875, 28.798828125, 29.84423828125, 30.8896484375, 31.93505859375, 32.98046875, 34.02587890625, 35.0712890625, 36.11669921875, 37.162109375, 38.20751953125, 39.2529296875, 40.29833984375, 41.34375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 2.0, 2.0, 7.0, 7.0, 7.0, 8.0, 10.0, 14.0, 7.0, 13.0, 13.0, 16.0, 19.0, 22.0, 33.0, 27.0, 31.0, 40.0, 34.0, 35.0, 38.0, 33.0, 28.0, 47.0, 46.0, 38.0, 38.0, 55.0, 33.0, 34.0, 34.0, 28.0, 28.0, 23.0, 21.0, 18.0, 19.0, 17.0, 11.0, 14.0, 12.0, 10.0, 5.0, 7.0, 5.0, 3.0, 3.0, 2.0, 6.0, 4.0, 2.0, 1.0, 2.0], "bins": [-20.0, -19.427734375, -18.85546875, -18.283203125, -17.7109375, -17.138671875, -16.56640625, -15.994140625, -15.421875, -14.849609375, -14.27734375, -13.705078125, -13.1328125, -12.560546875, -11.98828125, -11.416015625, -10.84375, -10.271484375, -9.69921875, -9.126953125, -8.5546875, -7.982421875, -7.41015625, -6.837890625, -6.265625, -5.693359375, -5.12109375, -4.548828125, -3.9765625, -3.404296875, -2.83203125, -2.259765625, -1.6875, -1.115234375, -0.54296875, 0.029296875, 0.6015625, 1.173828125, 1.74609375, 2.318359375, 2.890625, 3.462890625, 4.03515625, 4.607421875, 5.1796875, 5.751953125, 6.32421875, 6.896484375, 7.46875, 8.041015625, 8.61328125, 9.185546875, 9.7578125, 10.330078125, 10.90234375, 11.474609375, 12.046875, 12.619140625, 13.19140625, 13.763671875, 14.3359375, 14.908203125, 15.48046875, 16.052734375, 16.625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 8.0, 8.0, 10.0, 15.0, 28.0, 32.0, 45.0, 88.0, 122.0, 245.0, 474.0, 1111.0, 2751.0, 8605.0, 38384.0, 283995.0, 626165.0, 66977.0, 12929.0, 3788.0, 1459.0, 657.0, 280.0, 145.0, 84.0, 41.0, 29.0, 27.0, 16.0, 11.0, 10.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-62.78125, -60.62744140625, -58.4736328125, -56.31982421875, -54.166015625, -52.01220703125, -49.8583984375, -47.70458984375, -45.55078125, -43.39697265625, -41.2431640625, -39.08935546875, -36.935546875, -34.78173828125, -32.6279296875, -30.47412109375, -28.3203125, -26.16650390625, -24.0126953125, -21.85888671875, -19.705078125, -17.55126953125, -15.3974609375, -13.24365234375, -11.08984375, -8.93603515625, -6.7822265625, -4.62841796875, -2.474609375, -0.32080078125, 1.8330078125, 3.98681640625, 6.140625, 8.29443359375, 10.4482421875, 12.60205078125, 14.755859375, 16.90966796875, 19.0634765625, 21.21728515625, 23.37109375, 25.52490234375, 27.6787109375, 29.83251953125, 31.986328125, 34.14013671875, 36.2939453125, 38.44775390625, 40.6015625, 42.75537109375, 44.9091796875, 47.06298828125, 49.216796875, 51.37060546875, 53.5244140625, 55.67822265625, 57.83203125, 59.98583984375, 62.1396484375, 64.29345703125, 66.447265625, 68.60107421875, 70.7548828125, 72.90869140625, 75.0625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 5.0, 4.0, 2.0, 6.0, 19.0, 22.0, 23.0, 18.0, 28.0, 39.0, 34.0, 53.0, 47.0, 62.0, 71.0, 82.0, 75.0, 62.0, 59.0, 58.0, 54.0, 27.0, 36.0, 24.0, 23.0, 17.0, 13.0, 13.0, 11.0, 1.0, 1.0, 3.0, 4.0, 0.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-104.9375, -101.7265625, -98.515625, -95.3046875, -92.09375, -88.8828125, -85.671875, -82.4609375, -79.25, -76.0390625, -72.828125, -69.6171875, -66.40625, -63.1953125, -59.984375, -56.7734375, -53.5625, -50.3515625, -47.140625, -43.9296875, -40.71875, -37.5078125, -34.296875, -31.0859375, -27.875, -24.6640625, -21.453125, -18.2421875, -15.03125, -11.8203125, -8.609375, -5.3984375, -2.1875, 1.0234375, 4.234375, 7.4453125, 10.65625, 13.8671875, 17.078125, 20.2890625, 23.5, 26.7109375, 29.921875, 33.1328125, 36.34375, 39.5546875, 42.765625, 45.9765625, 49.1875, 52.3984375, 55.609375, 58.8203125, 62.03125, 65.2421875, 68.453125, 71.6640625, 74.875, 78.0859375, 81.296875, 84.5078125, 87.71875, 90.9296875, 94.140625, 97.3515625, 100.5625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 8.0, 2.0, 1.0, 10.0, 12.0, 24.0, 24.0, 34.0, 47.0, 79.0, 129.0, 221.0, 424.0, 842.0, 1859.0, 4467.0, 13687.0, 55007.0, 307289.0, 564560.0, 73267.0, 17015.0, 5253.0, 2192.0, 967.0, 478.0, 225.0, 140.0, 105.0, 63.0, 31.0, 31.0, 18.0, 7.0, 11.0, 7.0, 4.0, 3.0, 2.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-16.765625, -16.226318359375, -15.68701171875, -15.147705078125, -14.6083984375, -14.069091796875, -13.52978515625, -12.990478515625, -12.451171875, -11.911865234375, -11.37255859375, -10.833251953125, -10.2939453125, -9.754638671875, -9.21533203125, -8.676025390625, -8.13671875, -7.597412109375, -7.05810546875, -6.518798828125, -5.9794921875, -5.440185546875, -4.90087890625, -4.361572265625, -3.822265625, -3.282958984375, -2.74365234375, -2.204345703125, -1.6650390625, -1.125732421875, -0.58642578125, -0.047119140625, 0.4921875, 1.031494140625, 1.57080078125, 2.110107421875, 2.6494140625, 3.188720703125, 3.72802734375, 4.267333984375, 4.806640625, 5.345947265625, 5.88525390625, 6.424560546875, 6.9638671875, 7.503173828125, 8.04248046875, 8.581787109375, 9.12109375, 9.660400390625, 10.19970703125, 10.739013671875, 11.2783203125, 11.817626953125, 12.35693359375, 12.896240234375, 13.435546875, 13.974853515625, 14.51416015625, 15.053466796875, 15.5927734375, 16.132080078125, 16.67138671875, 17.210693359375, 17.75]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 7.0, 7.0, 5.0, 7.0, 11.0, 18.0, 31.0, 30.0, 67.0, 76.0, 95.0, 99.0, 147.0, 116.0, 89.0, 60.0, 41.0, 36.0, 16.0, 12.0, 10.0, 9.0, 6.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00527191162109375, -0.005102992057800293, -0.004934072494506836, -0.004765152931213379, -0.004596233367919922, -0.004427313804626465, -0.004258394241333008, -0.004089474678039551, -0.003920555114746094, -0.0037516355514526367, -0.0035827159881591797, -0.0034137964248657227, -0.0032448768615722656, -0.0030759572982788086, -0.0029070377349853516, -0.0027381181716918945, -0.0025691986083984375, -0.0024002790451049805, -0.0022313594818115234, -0.0020624399185180664, -0.0018935203552246094, -0.0017246007919311523, -0.0015556812286376953, -0.0013867616653442383, -0.0012178421020507812, -0.0010489225387573242, -0.0008800029754638672, -0.0007110834121704102, -0.0005421638488769531, -0.0003732442855834961, -0.00020432472229003906, -3.540515899658203e-05, 0.000133514404296875, 0.00030243396759033203, 0.00047135353088378906, 0.0006402730941772461, 0.0008091926574707031, 0.0009781122207641602, 0.0011470317840576172, 0.0013159513473510742, 0.0014848709106445312, 0.0016537904739379883, 0.0018227100372314453, 0.0019916296005249023, 0.0021605491638183594, 0.0023294687271118164, 0.0024983882904052734, 0.0026673078536987305, 0.0028362274169921875, 0.0030051469802856445, 0.0031740665435791016, 0.0033429861068725586, 0.0035119056701660156, 0.0036808252334594727, 0.0038497447967529297, 0.004018664360046387, 0.004187583923339844, 0.004356503486633301, 0.004525423049926758, 0.004694342613220215, 0.004863262176513672, 0.005032181739807129, 0.005201101303100586, 0.005370020866394043, 0.0055389404296875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 2.0, 11.0, 13.0, 19.0, 20.0, 38.0, 63.0, 95.0, 133.0, 263.0, 526.0, 1161.0, 2984.0, 9561.0, 44456.0, 321187.0, 589623.0, 60321.0, 11847.0, 3443.0, 1416.0, 655.0, 288.0, 174.0, 97.0, 55.0, 32.0, 23.0, 18.0, 11.0, 6.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.09375, -20.436279296875, -19.77880859375, -19.121337890625, -18.4638671875, -17.806396484375, -17.14892578125, -16.491455078125, -15.833984375, -15.176513671875, -14.51904296875, -13.861572265625, -13.2041015625, -12.546630859375, -11.88916015625, -11.231689453125, -10.57421875, -9.916748046875, -9.25927734375, -8.601806640625, -7.9443359375, -7.286865234375, -6.62939453125, -5.971923828125, -5.314453125, -4.656982421875, -3.99951171875, -3.342041015625, -2.6845703125, -2.027099609375, -1.36962890625, -0.712158203125, -0.0546875, 0.602783203125, 1.26025390625, 1.917724609375, 2.5751953125, 3.232666015625, 3.89013671875, 4.547607421875, 5.205078125, 5.862548828125, 6.52001953125, 7.177490234375, 7.8349609375, 8.492431640625, 9.14990234375, 9.807373046875, 10.46484375, 11.122314453125, 11.77978515625, 12.437255859375, 13.0947265625, 13.752197265625, 14.40966796875, 15.067138671875, 15.724609375, 16.382080078125, 17.03955078125, 17.697021484375, 18.3544921875, 19.011962890625, 19.66943359375, 20.326904296875, 20.984375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 1.0, 1.0, 3.0, 5.0, 7.0, 5.0, 12.0, 19.0, 25.0, 33.0, 42.0, 73.0, 89.0, 102.0, 108.0, 114.0, 94.0, 63.0, 53.0, 42.0, 29.0, 28.0, 11.0, 18.0, 7.0, 7.0, 5.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.0, -17.277099609375, -16.55419921875, -15.831298828125, -15.1083984375, -14.385498046875, -13.66259765625, -12.939697265625, -12.216796875, -11.493896484375, -10.77099609375, -10.048095703125, -9.3251953125, -8.602294921875, -7.87939453125, -7.156494140625, -6.43359375, -5.710693359375, -4.98779296875, -4.264892578125, -3.5419921875, -2.819091796875, -2.09619140625, -1.373291015625, -0.650390625, 0.072509765625, 0.79541015625, 1.518310546875, 2.2412109375, 2.964111328125, 3.68701171875, 4.409912109375, 5.1328125, 5.855712890625, 6.57861328125, 7.301513671875, 8.0244140625, 8.747314453125, 9.47021484375, 10.193115234375, 10.916015625, 11.638916015625, 12.36181640625, 13.084716796875, 13.8076171875, 14.530517578125, 15.25341796875, 15.976318359375, 16.69921875, 17.422119140625, 18.14501953125, 18.867919921875, 19.5908203125, 20.313720703125, 21.03662109375, 21.759521484375, 22.482421875, 23.205322265625, 23.92822265625, 24.651123046875, 25.3740234375, 26.096923828125, 26.81982421875, 27.542724609375, 28.265625]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 4.0, 13.0, 18.0, 58.0, 209.0, 464.0, 170.0, 45.0, 14.0, 5.0, 4.0, 1.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1135.611083984375, -1105.9742431640625, -1076.3372802734375, -1046.700439453125, -1017.0634765625, -987.4266357421875, -957.7897338867188, -928.15283203125, -898.5159301757812, -868.8790283203125, -839.2421264648438, -809.605224609375, -779.9683837890625, -750.3314208984375, -720.694580078125, -691.0576782226562, -661.4207763671875, -631.7838745117188, -602.14697265625, -572.5100708007812, -542.8731689453125, -513.236328125, -483.59942626953125, -453.9625244140625, -424.32562255859375, -394.688720703125, -365.05181884765625, -335.4149475097656, -305.7780456542969, -276.1411437988281, -246.50425720214844, -216.86737060546875, -187.23046875, -157.59356689453125, -127.95668029785156, -98.31978607177734, -68.68289184570312, -39.045989990234375, -9.409103393554688, 20.227783203125, 49.86468505859375, 79.50157928466797, 109.13847351074219, 138.77536010742188, 168.41226196289062, 198.04916381835938, 227.68605041503906, 257.32293701171875, 286.9598388671875, 316.59674072265625, 346.233642578125, 375.8705139160156, 405.5074157714844, 435.1443176269531, 464.78118896484375, 494.4180908203125, 524.0549926757812, 553.69189453125, 583.3287963867188, 612.9656982421875, 642.6025390625, 672.239501953125, 701.8763427734375, 731.5132446289062, 761.150146484375]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 4.0, 2.0, 2.0, 5.0, 6.0, 9.0, 19.0, 11.0, 13.0, 13.0, 16.0, 18.0, 23.0, 29.0, 26.0, 33.0, 40.0, 40.0, 50.0, 64.0, 63.0, 65.0, 52.0, 57.0, 36.0, 40.0, 29.0, 33.0, 23.0, 28.0, 26.0, 17.0, 16.0, 12.0, 15.0, 13.0, 7.0, 11.0, 6.0, 10.0, 6.0, 1.0, 4.0, 2.0, 4.0, 0.0, 1.0, 2.0], "bins": [-331.1248779296875, -322.1282958984375, -313.1317138671875, -304.1351623535156, -295.1385803222656, -286.1419982910156, -277.14544677734375, -268.14886474609375, -259.15228271484375, -250.15570068359375, -241.1591339111328, -232.16256713867188, -223.16598510742188, -214.16940307617188, -205.17283630371094, -196.17626953125, -187.1796875, -178.18310546875, -169.18653869628906, -160.18997192382812, -151.19338989257812, -142.19680786132812, -133.2002410888672, -124.20366668701172, -115.20709228515625, -106.21051788330078, -97.21394348144531, -88.21736907958984, -79.22079467773438, -70.2242202758789, -61.22764587402344, -52.23107147216797, -43.2344970703125, -34.23792266845703, -25.241348266601562, -16.244773864746094, -7.248199462890625, 1.7483749389648438, 10.744949340820312, 19.74152374267578, 28.73809814453125, 37.73467254638672, 46.73124694824219, 55.727821350097656, 64.72439575195312, 73.7209701538086, 82.71754455566406, 91.71411895751953, 100.710693359375, 109.70726776123047, 118.70384216308594, 127.7004165649414, 136.69699096679688, 145.69357299804688, 154.6901397705078, 163.68670654296875, 172.68328857421875, 181.67987060546875, 190.6764373779297, 199.67300415039062, 208.66958618164062, 217.66616821289062, 226.66273498535156, 235.6593017578125, 244.6558837890625]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 3.0, 3.0, 5.0, 5.0, 14.0, 13.0, 18.0, 15.0, 16.0, 47.0, 62.0, 115.0, 210.0, 362.0, 713.0, 1651.0, 4895.0, 21015.0, 338934.0, 3430574.0, 364740.0, 22576.0, 5099.0, 1674.0, 706.0, 347.0, 160.0, 96.0, 80.0, 46.0, 27.0, 18.0, 11.0, 7.0, 7.0, 6.0, 5.0, 4.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-48.8125, -47.31103515625, -45.8095703125, -44.30810546875, -42.806640625, -41.30517578125, -39.8037109375, -38.30224609375, -36.80078125, -35.29931640625, -33.7978515625, -32.29638671875, -30.794921875, -29.29345703125, -27.7919921875, -26.29052734375, -24.7890625, -23.28759765625, -21.7861328125, -20.28466796875, -18.783203125, -17.28173828125, -15.7802734375, -14.27880859375, -12.77734375, -11.27587890625, -9.7744140625, -8.27294921875, -6.771484375, -5.27001953125, -3.7685546875, -2.26708984375, -0.765625, 0.73583984375, 2.2373046875, 3.73876953125, 5.240234375, 6.74169921875, 8.2431640625, 9.74462890625, 11.24609375, 12.74755859375, 14.2490234375, 15.75048828125, 17.251953125, 18.75341796875, 20.2548828125, 21.75634765625, 23.2578125, 24.75927734375, 26.2607421875, 27.76220703125, 29.263671875, 30.76513671875, 32.2666015625, 33.76806640625, 35.26953125, 36.77099609375, 38.2724609375, 39.77392578125, 41.275390625, 42.77685546875, 44.2783203125, 45.77978515625, 47.28125]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 3.0, 4.0, 5.0, 8.0, 4.0, 10.0, 9.0, 17.0, 8.0, 19.0, 18.0, 21.0, 30.0, 24.0, 33.0, 34.0, 37.0, 43.0, 44.0, 42.0, 55.0, 51.0, 41.0, 52.0, 38.0, 43.0, 43.0, 37.0, 39.0, 29.0, 23.0, 20.0, 12.0, 21.0, 18.0, 11.0, 15.0, 11.0, 10.0, 5.0, 5.0, 2.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-21.609375, -21.002685546875, -20.39599609375, -19.789306640625, -19.1826171875, -18.575927734375, -17.96923828125, -17.362548828125, -16.755859375, -16.149169921875, -15.54248046875, -14.935791015625, -14.3291015625, -13.722412109375, -13.11572265625, -12.509033203125, -11.90234375, -11.295654296875, -10.68896484375, -10.082275390625, -9.4755859375, -8.868896484375, -8.26220703125, -7.655517578125, -7.048828125, -6.442138671875, -5.83544921875, -5.228759765625, -4.6220703125, -4.015380859375, -3.40869140625, -2.802001953125, -2.1953125, -1.588623046875, -0.98193359375, -0.375244140625, 0.2314453125, 0.838134765625, 1.44482421875, 2.051513671875, 2.658203125, 3.264892578125, 3.87158203125, 4.478271484375, 5.0849609375, 5.691650390625, 6.29833984375, 6.905029296875, 7.51171875, 8.118408203125, 8.72509765625, 9.331787109375, 9.9384765625, 10.545166015625, 11.15185546875, 11.758544921875, 12.365234375, 12.971923828125, 13.57861328125, 14.185302734375, 14.7919921875, 15.398681640625, 16.00537109375, 16.612060546875, 17.21875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 4.0, 5.0, 10.0, 12.0, 22.0, 36.0, 36.0, 66.0, 165.0, 376.0, 992.0, 3671.0, 22665.0, 1471148.0, 2661548.0, 27546.0, 4134.0, 1124.0, 345.0, 176.0, 66.0, 51.0, 29.0, 12.0, 14.0, 7.0, 3.0, 7.0, 1.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-93.5, -90.48828125, -87.4765625, -84.46484375, -81.453125, -78.44140625, -75.4296875, -72.41796875, -69.40625, -66.39453125, -63.3828125, -60.37109375, -57.359375, -54.34765625, -51.3359375, -48.32421875, -45.3125, -42.30078125, -39.2890625, -36.27734375, -33.265625, -30.25390625, -27.2421875, -24.23046875, -21.21875, -18.20703125, -15.1953125, -12.18359375, -9.171875, -6.16015625, -3.1484375, -0.13671875, 2.875, 5.88671875, 8.8984375, 11.91015625, 14.921875, 17.93359375, 20.9453125, 23.95703125, 26.96875, 29.98046875, 32.9921875, 36.00390625, 39.015625, 42.02734375, 45.0390625, 48.05078125, 51.0625, 54.07421875, 57.0859375, 60.09765625, 63.109375, 66.12109375, 69.1328125, 72.14453125, 75.15625, 78.16796875, 81.1796875, 84.19140625, 87.203125, 90.21484375, 93.2265625, 96.23828125, 99.25]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 4.0, 3.0, 6.0, 6.0, 8.0, 10.0, 20.0, 20.0, 41.0, 72.0, 100.0, 221.0, 511.0, 1024.0, 986.0, 561.0, 211.0, 104.0, 51.0, 45.0, 17.0, 11.0, 10.0, 7.0, 8.0, 9.0, 3.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-87.875, -85.62255859375, -83.3701171875, -81.11767578125, -78.865234375, -76.61279296875, -74.3603515625, -72.10791015625, -69.85546875, -67.60302734375, -65.3505859375, -63.09814453125, -60.845703125, -58.59326171875, -56.3408203125, -54.08837890625, -51.8359375, -49.58349609375, -47.3310546875, -45.07861328125, -42.826171875, -40.57373046875, -38.3212890625, -36.06884765625, -33.81640625, -31.56396484375, -29.3115234375, -27.05908203125, -24.806640625, -22.55419921875, -20.3017578125, -18.04931640625, -15.796875, -13.54443359375, -11.2919921875, -9.03955078125, -6.787109375, -4.53466796875, -2.2822265625, -0.02978515625, 2.22265625, 4.47509765625, 6.7275390625, 8.97998046875, 11.232421875, 13.48486328125, 15.7373046875, 17.98974609375, 20.2421875, 22.49462890625, 24.7470703125, 26.99951171875, 29.251953125, 31.50439453125, 33.7568359375, 36.00927734375, 38.26171875, 40.51416015625, 42.7666015625, 45.01904296875, 47.271484375, 49.52392578125, 51.7763671875, 54.02880859375, 56.28125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 7.0, 10.0, 23.0, 57.0, 149.0, 312.0, 234.0, 122.0, 48.0, 22.0, 12.0, 3.0, 3.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-877.1295166015625, -855.1187744140625, -833.1080322265625, -811.0972900390625, -789.0865478515625, -767.0758666992188, -745.0651245117188, -723.0543823242188, -701.0436401367188, -679.0328979492188, -657.0221557617188, -635.0114135742188, -613.000732421875, -590.989990234375, -568.979248046875, -546.968505859375, -524.957763671875, -502.947021484375, -480.936279296875, -458.9255676269531, -436.9148254394531, -414.9040832519531, -392.89337158203125, -370.88262939453125, -348.87188720703125, -326.86114501953125, -304.85040283203125, -282.8396911621094, -260.8289489746094, -238.81820678710938, -216.80747985839844, -194.7967529296875, -172.7860107421875, -150.7752685546875, -128.76454162597656, -106.7538070678711, -84.74307250976562, -62.732337951660156, -40.72160339355469, -18.71087646484375, 3.29986572265625, 25.31060028076172, 47.32133483886719, 69.33206939697266, 91.34280395507812, 113.3535385131836, 135.36427307128906, 157.375, 179.3857421875, 201.396484375, 223.40721130371094, 245.41793823242188, 267.4286804199219, 289.4394226074219, 311.45013427734375, 333.46087646484375, 355.47161865234375, 377.48236083984375, 399.49310302734375, 421.5038146972656, 443.5145568847656, 465.5252990722656, 487.5360107421875, 509.5467529296875, 531.5574951171875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 5.0, 5.0, 3.0, 1.0, 7.0, 3.0, 12.0, 14.0, 12.0, 12.0, 29.0, 31.0, 28.0, 36.0, 38.0, 45.0, 43.0, 53.0, 51.0, 53.0, 61.0, 51.0, 60.0, 48.0, 35.0, 45.0, 35.0, 28.0, 28.0, 25.0, 18.0, 22.0, 8.0, 15.0, 15.0, 8.0, 5.0, 9.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-238.19119262695312, -229.75479125976562, -221.31837463378906, -212.8819580078125, -204.445556640625, -196.0091552734375, -187.57273864746094, -179.13632202148438, -170.69992065429688, -162.26351928710938, -153.8271026611328, -145.39068603515625, -136.95428466796875, -128.51788330078125, -120.08146667480469, -111.64505767822266, -103.20864868164062, -94.7722396850586, -86.33583068847656, -77.89942169189453, -69.4630126953125, -61.02660369873047, -52.59019470214844, -44.153785705566406, -35.717376708984375, -27.280967712402344, -18.844558715820312, -10.408149719238281, -1.97174072265625, 6.464668273925781, 14.901077270507812, 23.337486267089844, 31.773895263671875, 40.210304260253906, 48.64671325683594, 57.08312225341797, 65.51953125, 73.95594024658203, 82.39234924316406, 90.8287582397461, 99.26516723632812, 107.70157623291016, 116.13798522949219, 124.57439422607422, 133.01080322265625, 141.44720458984375, 149.8836212158203, 158.32003784179688, 166.75643920898438, 175.19284057617188, 183.62925720214844, 192.065673828125, 200.5020751953125, 208.9384765625, 217.37489318847656, 225.81130981445312, 234.24771118164062, 242.68411254882812, 251.1205291748047, 259.55694580078125, 267.99334716796875, 276.42974853515625, 284.86614990234375, 293.3025817871094, 301.7389831542969]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 7.0, 8.0, 11.0, 13.0, 27.0, 38.0, 61.0, 115.0, 187.0, 328.0, 625.0, 1085.0, 2090.0, 4489.0, 10411.0, 25269.0, 67704.0, 193627.0, 383143.0, 227872.0, 79756.0, 29504.0, 11946.0, 5156.0, 2387.0, 1166.0, 640.0, 356.0, 213.0, 115.0, 83.0, 57.0, 25.0, 12.0, 14.0, 10.0, 8.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-38.40625, -37.38427734375, -36.3623046875, -35.34033203125, -34.318359375, -33.29638671875, -32.2744140625, -31.25244140625, -30.23046875, -29.20849609375, -28.1865234375, -27.16455078125, -26.142578125, -25.12060546875, -24.0986328125, -23.07666015625, -22.0546875, -21.03271484375, -20.0107421875, -18.98876953125, -17.966796875, -16.94482421875, -15.9228515625, -14.90087890625, -13.87890625, -12.85693359375, -11.8349609375, -10.81298828125, -9.791015625, -8.76904296875, -7.7470703125, -6.72509765625, -5.703125, -4.68115234375, -3.6591796875, -2.63720703125, -1.615234375, -0.59326171875, 0.4287109375, 1.45068359375, 2.47265625, 3.49462890625, 4.5166015625, 5.53857421875, 6.560546875, 7.58251953125, 8.6044921875, 9.62646484375, 10.6484375, 11.67041015625, 12.6923828125, 13.71435546875, 14.736328125, 15.75830078125, 16.7802734375, 17.80224609375, 18.82421875, 19.84619140625, 20.8681640625, 21.89013671875, 22.912109375, 23.93408203125, 24.9560546875, 25.97802734375, 27.0]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 6.0, 5.0, 1.0, 4.0, 6.0, 11.0, 9.0, 12.0, 8.0, 25.0, 16.0, 13.0, 28.0, 23.0, 31.0, 26.0, 33.0, 33.0, 35.0, 41.0, 47.0, 53.0, 36.0, 32.0, 44.0, 33.0, 34.0, 39.0, 38.0, 30.0, 34.0, 27.0, 29.0, 23.0, 26.0, 16.0, 14.0, 16.0, 10.0, 14.0, 6.0, 11.0, 5.0, 4.0, 7.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-19.234375, -18.6533203125, -18.072265625, -17.4912109375, -16.91015625, -16.3291015625, -15.748046875, -15.1669921875, -14.5859375, -14.0048828125, -13.423828125, -12.8427734375, -12.26171875, -11.6806640625, -11.099609375, -10.5185546875, -9.9375, -9.3564453125, -8.775390625, -8.1943359375, -7.61328125, -7.0322265625, -6.451171875, -5.8701171875, -5.2890625, -4.7080078125, -4.126953125, -3.5458984375, -2.96484375, -2.3837890625, -1.802734375, -1.2216796875, -0.640625, -0.0595703125, 0.521484375, 1.1025390625, 1.68359375, 2.2646484375, 2.845703125, 3.4267578125, 4.0078125, 4.5888671875, 5.169921875, 5.7509765625, 6.33203125, 6.9130859375, 7.494140625, 8.0751953125, 8.65625, 9.2373046875, 9.818359375, 10.3994140625, 10.98046875, 11.5615234375, 12.142578125, 12.7236328125, 13.3046875, 13.8857421875, 14.466796875, 15.0478515625, 15.62890625, 16.2099609375, 16.791015625, 17.3720703125, 17.953125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 1.0, 6.0, 5.0, 8.0, 13.0, 28.0, 44.0, 73.0, 133.0, 250.0, 587.0, 1708.0, 8662.0, 108895.0, 871550.0, 49018.0, 5382.0, 1264.0, 476.0, 200.0, 108.0, 50.0, 29.0, 16.0, 20.0, 11.0, 5.0, 5.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-100.1875, -96.7763671875, -93.365234375, -89.9541015625, -86.54296875, -83.1318359375, -79.720703125, -76.3095703125, -72.8984375, -69.4873046875, -66.076171875, -62.6650390625, -59.25390625, -55.8427734375, -52.431640625, -49.0205078125, -45.609375, -42.1982421875, -38.787109375, -35.3759765625, -31.96484375, -28.5537109375, -25.142578125, -21.7314453125, -18.3203125, -14.9091796875, -11.498046875, -8.0869140625, -4.67578125, -1.2646484375, 2.146484375, 5.5576171875, 8.96875, 12.3798828125, 15.791015625, 19.2021484375, 22.61328125, 26.0244140625, 29.435546875, 32.8466796875, 36.2578125, 39.6689453125, 43.080078125, 46.4912109375, 49.90234375, 53.3134765625, 56.724609375, 60.1357421875, 63.546875, 66.9580078125, 70.369140625, 73.7802734375, 77.19140625, 80.6025390625, 84.013671875, 87.4248046875, 90.8359375, 94.2470703125, 97.658203125, 101.0693359375, 104.48046875, 107.8916015625, 111.302734375, 114.7138671875, 118.125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 6.0, 2.0, 7.0, 6.0, 11.0, 9.0, 17.0, 14.0, 20.0, 17.0, 19.0, 27.0, 29.0, 24.0, 28.0, 40.0, 47.0, 58.0, 60.0, 61.0, 53.0, 62.0, 56.0, 56.0, 32.0, 48.0, 39.0, 23.0, 25.0, 15.0, 12.0, 14.0, 12.0, 12.0, 12.0, 9.0, 8.0, 4.0, 8.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.25, -65.7080078125, -63.166015625, -60.6240234375, -58.08203125, -55.5400390625, -52.998046875, -50.4560546875, -47.9140625, -45.3720703125, -42.830078125, -40.2880859375, -37.74609375, -35.2041015625, -32.662109375, -30.1201171875, -27.578125, -25.0361328125, -22.494140625, -19.9521484375, -17.41015625, -14.8681640625, -12.326171875, -9.7841796875, -7.2421875, -4.7001953125, -2.158203125, 0.3837890625, 2.92578125, 5.4677734375, 8.009765625, 10.5517578125, 13.09375, 15.6357421875, 18.177734375, 20.7197265625, 23.26171875, 25.8037109375, 28.345703125, 30.8876953125, 33.4296875, 35.9716796875, 38.513671875, 41.0556640625, 43.59765625, 46.1396484375, 48.681640625, 51.2236328125, 53.765625, 56.3076171875, 58.849609375, 61.3916015625, 63.93359375, 66.4755859375, 69.017578125, 71.5595703125, 74.1015625, 76.6435546875, 79.185546875, 81.7275390625, 84.26953125, 86.8115234375, 89.353515625, 91.8955078125, 94.4375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 3.0, 2.0, 3.0, 10.0, 9.0, 20.0, 24.0, 54.0, 77.0, 156.0, 284.0, 551.0, 1178.0, 2848.0, 8314.0, 31542.0, 236327.0, 694184.0, 53925.0, 12105.0, 4000.0, 1503.0, 658.0, 346.0, 166.0, 108.0, 57.0, 32.0, 22.0, 15.0, 11.0, 7.0, 5.0, 7.0, 3.0, 7.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.640625, -21.0582275390625, -20.475830078125, -19.8934326171875, -19.31103515625, -18.7286376953125, -18.146240234375, -17.5638427734375, -16.9814453125, -16.3990478515625, -15.816650390625, -15.2342529296875, -14.65185546875, -14.0694580078125, -13.487060546875, -12.9046630859375, -12.322265625, -11.7398681640625, -11.157470703125, -10.5750732421875, -9.99267578125, -9.4102783203125, -8.827880859375, -8.2454833984375, -7.6630859375, -7.0806884765625, -6.498291015625, -5.9158935546875, -5.33349609375, -4.7510986328125, -4.168701171875, -3.5863037109375, -3.00390625, -2.4215087890625, -1.839111328125, -1.2567138671875, -0.67431640625, -0.0919189453125, 0.490478515625, 1.0728759765625, 1.6552734375, 2.2376708984375, 2.820068359375, 3.4024658203125, 3.98486328125, 4.5672607421875, 5.149658203125, 5.7320556640625, 6.314453125, 6.8968505859375, 7.479248046875, 8.0616455078125, 8.64404296875, 9.2264404296875, 9.808837890625, 10.3912353515625, 10.9736328125, 11.5560302734375, 12.138427734375, 12.7208251953125, 13.30322265625, 13.8856201171875, 14.468017578125, 15.0504150390625, 15.6328125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 5.0, 7.0, 3.0, 10.0, 11.0, 12.0, 18.0, 21.0, 37.0, 49.0, 58.0, 89.0, 142.0, 134.0, 99.0, 79.0, 64.0, 32.0, 29.0, 20.0, 20.0, 9.0, 10.0, 10.0, 7.0, 3.0, 3.0, 4.0, 3.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003986358642578125, -0.003850281238555908, -0.0037142038345336914, -0.0035781264305114746, -0.003442049026489258, -0.003305971622467041, -0.0031698942184448242, -0.0030338168144226074, -0.0028977394104003906, -0.002761662006378174, -0.002625584602355957, -0.0024895071983337402, -0.0023534297943115234, -0.0022173523902893066, -0.00208127498626709, -0.001945197582244873, -0.0018091201782226562, -0.0016730427742004395, -0.0015369653701782227, -0.0014008879661560059, -0.001264810562133789, -0.0011287331581115723, -0.0009926557540893555, -0.0008565783500671387, -0.0007205009460449219, -0.0005844235420227051, -0.0004483461380004883, -0.0003122687339782715, -0.0001761913299560547, -4.011392593383789e-05, 9.59634780883789e-05, 0.0002320408821105957, 0.0003681182861328125, 0.0005041956901550293, 0.0006402730941772461, 0.0007763504981994629, 0.0009124279022216797, 0.0010485053062438965, 0.0011845827102661133, 0.00132066011428833, 0.0014567375183105469, 0.0015928149223327637, 0.0017288923263549805, 0.0018649697303771973, 0.002001047134399414, 0.002137124538421631, 0.0022732019424438477, 0.0024092793464660645, 0.0025453567504882812, 0.002681434154510498, 0.002817511558532715, 0.0029535889625549316, 0.0030896663665771484, 0.0032257437705993652, 0.003361821174621582, 0.003497898578643799, 0.0036339759826660156, 0.0037700533866882324, 0.0039061307907104492, 0.004042208194732666, 0.004178285598754883, 0.0043143630027771, 0.004450440406799316, 0.004586517810821533, 0.00472259521484375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 8.0, 5.0, 9.0, 10.0, 11.0, 18.0, 25.0, 39.0, 63.0, 118.0, 226.0, 520.0, 1243.0, 3651.0, 16319.0, 128189.0, 807510.0, 74795.0, 11073.0, 2801.0, 978.0, 440.0, 193.0, 120.0, 54.0, 40.0, 35.0, 15.0, 16.0, 10.0, 10.0, 7.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.515625, -20.830078125, -20.14453125, -19.458984375, -18.7734375, -18.087890625, -17.40234375, -16.716796875, -16.03125, -15.345703125, -14.66015625, -13.974609375, -13.2890625, -12.603515625, -11.91796875, -11.232421875, -10.546875, -9.861328125, -9.17578125, -8.490234375, -7.8046875, -7.119140625, -6.43359375, -5.748046875, -5.0625, -4.376953125, -3.69140625, -3.005859375, -2.3203125, -1.634765625, -0.94921875, -0.263671875, 0.421875, 1.107421875, 1.79296875, 2.478515625, 3.1640625, 3.849609375, 4.53515625, 5.220703125, 5.90625, 6.591796875, 7.27734375, 7.962890625, 8.6484375, 9.333984375, 10.01953125, 10.705078125, 11.390625, 12.076171875, 12.76171875, 13.447265625, 14.1328125, 14.818359375, 15.50390625, 16.189453125, 16.875, 17.560546875, 18.24609375, 18.931640625, 19.6171875, 20.302734375, 20.98828125, 21.673828125, 22.359375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 7.0, 5.0, 1.0, 4.0, 4.0, 8.0, 7.0, 16.0, 18.0, 18.0, 28.0, 25.0, 34.0, 45.0, 80.0, 94.0, 108.0, 105.0, 96.0, 69.0, 55.0, 43.0, 33.0, 24.0, 14.0, 17.0, 5.0, 10.0, 9.0, 9.0, 8.0, 0.0, 6.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.265625, -16.76123046875, -16.2568359375, -15.75244140625, -15.248046875, -14.74365234375, -14.2392578125, -13.73486328125, -13.23046875, -12.72607421875, -12.2216796875, -11.71728515625, -11.212890625, -10.70849609375, -10.2041015625, -9.69970703125, -9.1953125, -8.69091796875, -8.1865234375, -7.68212890625, -7.177734375, -6.67333984375, -6.1689453125, -5.66455078125, -5.16015625, -4.65576171875, -4.1513671875, -3.64697265625, -3.142578125, -2.63818359375, -2.1337890625, -1.62939453125, -1.125, -0.62060546875, -0.1162109375, 0.38818359375, 0.892578125, 1.39697265625, 1.9013671875, 2.40576171875, 2.91015625, 3.41455078125, 3.9189453125, 4.42333984375, 4.927734375, 5.43212890625, 5.9365234375, 6.44091796875, 6.9453125, 7.44970703125, 7.9541015625, 8.45849609375, 8.962890625, 9.46728515625, 9.9716796875, 10.47607421875, 10.98046875, 11.48486328125, 11.9892578125, 12.49365234375, 12.998046875, 13.50244140625, 14.0068359375, 14.51123046875, 15.015625]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 12.0, 5.0, 5.0, 16.0, 28.0, 39.0, 84.0, 120.0, 260.0, 165.0, 98.0, 62.0, 38.0, 27.0, 16.0, 12.0, 7.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-469.0545654296875, -457.233642578125, -445.4126892089844, -433.59173583984375, -421.77081298828125, -409.94989013671875, -398.1289367675781, -386.3079833984375, -374.487060546875, -362.6661376953125, -350.8451843261719, -339.02423095703125, -327.20330810546875, -315.38238525390625, -303.5614318847656, -291.740478515625, -279.9195556640625, -268.0986328125, -256.2776794433594, -244.4567413330078, -232.63580322265625, -220.8148651123047, -208.99392700195312, -197.17298889160156, -185.35205078125, -173.53111267089844, -161.71017456054688, -149.8892364501953, -138.06829833984375, -126.24736022949219, -114.42642211914062, -102.60548400878906, -90.7845458984375, -78.96360778808594, -67.14266967773438, -55.32173156738281, -43.50079345703125, -31.679855346679688, -19.858917236328125, -8.037979125976562, 3.782958984375, 15.603897094726562, 27.424835205078125, 39.24577331542969, 51.06671142578125, 62.88764953613281, 74.70858764648438, 86.52952575683594, 98.3504638671875, 110.17140197753906, 121.99234008789062, 133.8132781982422, 145.63421630859375, 157.4551544189453, 169.27609252929688, 181.09703063964844, 192.91796875, 204.73890686035156, 216.55984497070312, 228.3807830810547, 240.20172119140625, 252.0226593017578, 263.8435974121094, 275.66455078125, 287.4854736328125]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 4.0, 3.0, 3.0, 10.0, 10.0, 7.0, 15.0, 8.0, 17.0, 17.0, 18.0, 27.0, 32.0, 22.0, 36.0, 30.0, 39.0, 38.0, 68.0, 100.0, 114.0, 67.0, 41.0, 30.0, 28.0, 28.0, 27.0, 33.0, 13.0, 16.0, 16.0, 15.0, 14.0, 6.0, 7.0, 8.0, 8.0, 3.0, 5.0, 3.0, 9.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-267.234619140625, -257.72015380859375, -248.20567321777344, -238.6912078857422, -229.17672729492188, -219.66226196289062, -210.14779663085938, -200.63333129882812, -191.1188507080078, -181.60438537597656, -172.08990478515625, -162.575439453125, -153.06097412109375, -143.54649353027344, -134.0320281982422, -124.5175552368164, -115.00308227539062, -105.48860931396484, -95.97413635253906, -86.45967102050781, -76.94519805908203, -67.43072509765625, -57.916255950927734, -48.40178680419922, -38.88731384277344, -29.37284278869629, -19.85837173461914, -10.343900680541992, -0.8294296264648438, 8.685043334960938, 18.199512481689453, 27.71398162841797, 37.228485107421875, 46.742958068847656, 56.25742721557617, 65.77189636230469, 75.28636932373047, 84.80084228515625, 94.3153076171875, 103.82978057861328, 113.34425354003906, 122.85872650146484, 132.37319946289062, 141.88766479492188, 151.40213012695312, 160.91661071777344, 170.4310760498047, 179.945556640625, 189.46002197265625, 198.9744873046875, 208.4889678955078, 218.00343322753906, 227.51791381835938, 237.03237915039062, 246.54684448242188, 256.0613098144531, 265.5758056640625, 275.09027099609375, 284.604736328125, 294.1192321777344, 303.6336975097656, 313.1481628417969, 322.6626281738281, 332.1770935058594, 341.6915588378906]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 5.0, 10.0, 8.0, 14.0, 19.0, 28.0, 27.0, 58.0, 100.0, 144.0, 254.0, 413.0, 658.0, 1139.0, 1925.0, 3760.0, 8007.0, 20099.0, 68044.0, 287965.0, 1157140.0, 1822745.0, 611785.0, 145623.0, 39060.0, 13254.0, 5623.0, 2813.0, 1481.0, 843.0, 474.0, 293.0, 159.0, 111.0, 73.0, 48.0, 27.0, 17.0, 15.0, 8.0, 7.0, 4.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-19.59375, -18.9462890625, -18.298828125, -17.6513671875, -17.00390625, -16.3564453125, -15.708984375, -15.0615234375, -14.4140625, -13.7666015625, -13.119140625, -12.4716796875, -11.82421875, -11.1767578125, -10.529296875, -9.8818359375, -9.234375, -8.5869140625, -7.939453125, -7.2919921875, -6.64453125, -5.9970703125, -5.349609375, -4.7021484375, -4.0546875, -3.4072265625, -2.759765625, -2.1123046875, -1.46484375, -0.8173828125, -0.169921875, 0.4775390625, 1.125, 1.7724609375, 2.419921875, 3.0673828125, 3.71484375, 4.3623046875, 5.009765625, 5.6572265625, 6.3046875, 6.9521484375, 7.599609375, 8.2470703125, 8.89453125, 9.5419921875, 10.189453125, 10.8369140625, 11.484375, 12.1318359375, 12.779296875, 13.4267578125, 14.07421875, 14.7216796875, 15.369140625, 16.0166015625, 16.6640625, 17.3115234375, 17.958984375, 18.6064453125, 19.25390625, 19.9013671875, 20.548828125, 21.1962890625, 21.84375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 5.0, 4.0, 2.0, 2.0, 3.0, 3.0, 2.0, 4.0, 7.0, 4.0, 15.0, 7.0, 9.0, 18.0, 12.0, 10.0, 19.0, 29.0, 25.0, 26.0, 32.0, 32.0, 29.0, 45.0, 44.0, 45.0, 39.0, 38.0, 53.0, 35.0, 40.0, 38.0, 38.0, 29.0, 37.0, 26.0, 36.0, 35.0, 25.0, 19.0, 15.0, 16.0, 9.0, 9.0, 9.0, 6.0, 9.0, 1.0, 7.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.515625, -16.9453125, -16.375, -15.8046875, -15.234375, -14.6640625, -14.09375, -13.5234375, -12.953125, -12.3828125, -11.8125, -11.2421875, -10.671875, -10.1015625, -9.53125, -8.9609375, -8.390625, -7.8203125, -7.25, -6.6796875, -6.109375, -5.5390625, -4.96875, -4.3984375, -3.828125, -3.2578125, -2.6875, -2.1171875, -1.546875, -0.9765625, -0.40625, 0.1640625, 0.734375, 1.3046875, 1.875, 2.4453125, 3.015625, 3.5859375, 4.15625, 4.7265625, 5.296875, 5.8671875, 6.4375, 7.0078125, 7.578125, 8.1484375, 8.71875, 9.2890625, 9.859375, 10.4296875, 11.0, 11.5703125, 12.140625, 12.7109375, 13.28125, 13.8515625, 14.421875, 14.9921875, 15.5625, 16.1328125, 16.703125, 17.2734375, 17.84375, 18.4140625, 18.984375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 9.0, 2.0, 7.0, 7.0, 11.0, 17.0, 21.0, 28.0, 54.0, 96.0, 159.0, 336.0, 818.0, 2648.0, 14058.0, 185421.0, 3809034.0, 164675.0, 12804.0, 2497.0, 816.0, 325.0, 174.0, 97.0, 57.0, 36.0, 17.0, 14.0, 10.0, 9.0, 8.0, 4.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-73.0625, -70.94384765625, -68.8251953125, -66.70654296875, -64.587890625, -62.46923828125, -60.3505859375, -58.23193359375, -56.11328125, -53.99462890625, -51.8759765625, -49.75732421875, -47.638671875, -45.52001953125, -43.4013671875, -41.28271484375, -39.1640625, -37.04541015625, -34.9267578125, -32.80810546875, -30.689453125, -28.57080078125, -26.4521484375, -24.33349609375, -22.21484375, -20.09619140625, -17.9775390625, -15.85888671875, -13.740234375, -11.62158203125, -9.5029296875, -7.38427734375, -5.265625, -3.14697265625, -1.0283203125, 1.09033203125, 3.208984375, 5.32763671875, 7.4462890625, 9.56494140625, 11.68359375, 13.80224609375, 15.9208984375, 18.03955078125, 20.158203125, 22.27685546875, 24.3955078125, 26.51416015625, 28.6328125, 30.75146484375, 32.8701171875, 34.98876953125, 37.107421875, 39.22607421875, 41.3447265625, 43.46337890625, 45.58203125, 47.70068359375, 49.8193359375, 51.93798828125, 54.056640625, 56.17529296875, 58.2939453125, 60.41259765625, 62.53125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 6.0, 6.0, 7.0, 11.0, 15.0, 26.0, 30.0, 47.0, 73.0, 111.0, 204.0, 350.0, 680.0, 851.0, 707.0, 413.0, 231.0, 117.0, 86.0, 27.0, 20.0, 21.0, 13.0, 10.0, 6.0, 2.0, 7.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.84375, -55.95361328125, -54.0634765625, -52.17333984375, -50.283203125, -48.39306640625, -46.5029296875, -44.61279296875, -42.72265625, -40.83251953125, -38.9423828125, -37.05224609375, -35.162109375, -33.27197265625, -31.3818359375, -29.49169921875, -27.6015625, -25.71142578125, -23.8212890625, -21.93115234375, -20.041015625, -18.15087890625, -16.2607421875, -14.37060546875, -12.48046875, -10.59033203125, -8.7001953125, -6.81005859375, -4.919921875, -3.02978515625, -1.1396484375, 0.75048828125, 2.640625, 4.53076171875, 6.4208984375, 8.31103515625, 10.201171875, 12.09130859375, 13.9814453125, 15.87158203125, 17.76171875, 19.65185546875, 21.5419921875, 23.43212890625, 25.322265625, 27.21240234375, 29.1025390625, 30.99267578125, 32.8828125, 34.77294921875, 36.6630859375, 38.55322265625, 40.443359375, 42.33349609375, 44.2236328125, 46.11376953125, 48.00390625, 49.89404296875, 51.7841796875, 53.67431640625, 55.564453125, 57.45458984375, 59.3447265625, 61.23486328125, 63.125]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 12.0, 9.0, 38.0, 105.0, 231.0, 263.0, 208.0, 88.0, 25.0, 10.0, 5.0, 6.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-776.28076171875, -757.06201171875, -737.84326171875, -718.62451171875, -699.40576171875, -680.18701171875, -660.96826171875, -641.74951171875, -622.53076171875, -603.31201171875, -584.09326171875, -564.87451171875, -545.65576171875, -526.43701171875, -507.2182312011719, -487.9994812011719, -468.78070068359375, -449.56195068359375, -430.34320068359375, -411.12445068359375, -391.90570068359375, -372.68695068359375, -353.4681701660156, -334.2494201660156, -315.0306701660156, -295.8119201660156, -276.5931701660156, -257.3744201660156, -238.15565490722656, -218.93690490722656, -199.7181396484375, -180.4993896484375, -161.28067016601562, -142.06192016601562, -122.8431625366211, -103.62440490722656, -84.40565490722656, -65.18690490722656, -45.96814727783203, -26.7493896484375, -7.5306396484375, 11.688114166259766, 30.90686798095703, 50.1256217956543, 69.34437561035156, 88.56312561035156, 107.7818832397461, 127.00064086914062, 146.21939086914062, 165.43814086914062, 184.65689086914062, 203.8756561279297, 223.0944061279297, 242.3131561279297, 261.53192138671875, 280.75067138671875, 299.96942138671875, 319.18817138671875, 338.40692138671875, 357.62567138671875, 376.84442138671875, 396.06317138671875, 415.2819519042969, 434.5007019042969, 453.7194519042969]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 8.0, 9.0, 12.0, 13.0, 10.0, 17.0, 15.0, 26.0, 25.0, 33.0, 29.0, 44.0, 39.0, 35.0, 47.0, 51.0, 54.0, 62.0, 47.0, 45.0, 49.0, 35.0, 40.0, 41.0, 29.0, 25.0, 20.0, 20.0, 18.0, 10.0, 13.0, 10.0, 15.0, 12.0, 10.0, 7.0, 7.0, 3.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-184.3595733642578, -177.9515380859375, -171.54351806640625, -165.13548278808594, -158.72744750976562, -152.31942749023438, -145.91139221191406, -139.50335693359375, -133.0953369140625, -126.68730926513672, -120.27928161621094, -113.87124633789062, -107.46321868896484, -101.05519104003906, -94.64715576171875, -88.23912811279297, -81.83110046386719, -75.4230728149414, -69.01504516601562, -62.60700988769531, -56.19898223876953, -49.79095458984375, -43.3829231262207, -36.974891662597656, -30.566864013671875, -24.15883445739746, -17.750804901123047, -11.342775344848633, -4.934745788574219, 1.4732818603515625, 7.881313323974609, 14.289344787597656, 20.6973876953125, 27.105417251586914, 33.51344680786133, 39.921478271484375, 46.329505920410156, 52.73753356933594, 59.145565032958984, 65.55359649658203, 71.96162414550781, 78.3696517944336, 84.77767944335938, 91.18571472167969, 97.59374237060547, 104.00177001953125, 110.40980529785156, 116.81783294677734, 123.22586059570312, 129.63389587402344, 136.0419158935547, 142.449951171875, 148.85797119140625, 155.26600646972656, 161.67404174804688, 168.08206176757812, 174.49009704589844, 180.89813232421875, 187.30615234375, 193.7141876220703, 200.12222290039062, 206.53024291992188, 212.9382781982422, 219.3463134765625, 225.75433349609375]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 4.0, 6.0, 0.0, 5.0, 5.0, 8.0, 10.0, 19.0, 20.0, 27.0, 49.0, 85.0, 92.0, 165.0, 247.0, 389.0, 680.0, 1115.0, 1954.0, 3648.0, 6598.0, 13110.0, 26472.0, 57669.0, 134841.0, 303143.0, 277816.0, 119799.0, 51065.0, 23776.0, 11777.0, 6124.0, 3254.0, 1815.0, 1099.0, 622.0, 354.0, 237.0, 144.0, 105.0, 73.0, 42.0, 37.0, 14.0, 17.0, 12.0, 13.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.328125, -23.45703125, -22.5859375, -21.71484375, -20.84375, -19.97265625, -19.1015625, -18.23046875, -17.359375, -16.48828125, -15.6171875, -14.74609375, -13.875, -13.00390625, -12.1328125, -11.26171875, -10.390625, -9.51953125, -8.6484375, -7.77734375, -6.90625, -6.03515625, -5.1640625, -4.29296875, -3.421875, -2.55078125, -1.6796875, -0.80859375, 0.0625, 0.93359375, 1.8046875, 2.67578125, 3.546875, 4.41796875, 5.2890625, 6.16015625, 7.03125, 7.90234375, 8.7734375, 9.64453125, 10.515625, 11.38671875, 12.2578125, 13.12890625, 14.0, 14.87109375, 15.7421875, 16.61328125, 17.484375, 18.35546875, 19.2265625, 20.09765625, 20.96875, 21.83984375, 22.7109375, 23.58203125, 24.453125, 25.32421875, 26.1953125, 27.06640625, 27.9375, 28.80859375, 29.6796875, 30.55078125, 31.421875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 1.0, 1.0, 4.0, 4.0, 4.0, 1.0, 4.0, 4.0, 9.0, 5.0, 11.0, 7.0, 9.0, 21.0, 15.0, 21.0, 22.0, 26.0, 16.0, 21.0, 30.0, 34.0, 28.0, 35.0, 43.0, 45.0, 37.0, 39.0, 37.0, 33.0, 43.0, 45.0, 30.0, 43.0, 39.0, 17.0, 32.0, 26.0, 27.0, 26.0, 25.0, 15.0, 13.0, 10.0, 6.0, 5.0, 7.0, 11.0, 5.0, 5.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-17.3125, -16.755615234375, -16.19873046875, -15.641845703125, -15.0849609375, -14.528076171875, -13.97119140625, -13.414306640625, -12.857421875, -12.300537109375, -11.74365234375, -11.186767578125, -10.6298828125, -10.072998046875, -9.51611328125, -8.959228515625, -8.40234375, -7.845458984375, -7.28857421875, -6.731689453125, -6.1748046875, -5.617919921875, -5.06103515625, -4.504150390625, -3.947265625, -3.390380859375, -2.83349609375, -2.276611328125, -1.7197265625, -1.162841796875, -0.60595703125, -0.049072265625, 0.5078125, 1.064697265625, 1.62158203125, 2.178466796875, 2.7353515625, 3.292236328125, 3.84912109375, 4.406005859375, 4.962890625, 5.519775390625, 6.07666015625, 6.633544921875, 7.1904296875, 7.747314453125, 8.30419921875, 8.861083984375, 9.41796875, 9.974853515625, 10.53173828125, 11.088623046875, 11.6455078125, 12.202392578125, 12.75927734375, 13.316162109375, 13.873046875, 14.429931640625, 14.98681640625, 15.543701171875, 16.1005859375, 16.657470703125, 17.21435546875, 17.771240234375, 18.328125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 4.0, 2.0, 9.0, 6.0, 15.0, 6.0, 22.0, 25.0, 40.0, 63.0, 99.0, 149.0, 241.0, 406.0, 721.0, 1385.0, 3698.0, 14757.0, 128216.0, 824261.0, 60088.0, 9130.0, 2620.0, 1096.0, 562.0, 348.0, 202.0, 117.0, 74.0, 64.0, 25.0, 23.0, 19.0, 13.0, 14.0, 12.0, 7.0, 3.0, 5.0, 5.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-77.0, -74.462890625, -71.92578125, -69.388671875, -66.8515625, -64.314453125, -61.77734375, -59.240234375, -56.703125, -54.166015625, -51.62890625, -49.091796875, -46.5546875, -44.017578125, -41.48046875, -38.943359375, -36.40625, -33.869140625, -31.33203125, -28.794921875, -26.2578125, -23.720703125, -21.18359375, -18.646484375, -16.109375, -13.572265625, -11.03515625, -8.498046875, -5.9609375, -3.423828125, -0.88671875, 1.650390625, 4.1875, 6.724609375, 9.26171875, 11.798828125, 14.3359375, 16.873046875, 19.41015625, 21.947265625, 24.484375, 27.021484375, 29.55859375, 32.095703125, 34.6328125, 37.169921875, 39.70703125, 42.244140625, 44.78125, 47.318359375, 49.85546875, 52.392578125, 54.9296875, 57.466796875, 60.00390625, 62.541015625, 65.078125, 67.615234375, 70.15234375, 72.689453125, 75.2265625, 77.763671875, 80.30078125, 82.837890625, 85.375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 7.0, 4.0, 15.0, 4.0, 13.0, 13.0, 22.0, 31.0, 30.0, 42.0, 34.0, 57.0, 65.0, 66.0, 84.0, 77.0, 62.0, 70.0, 57.0, 53.0, 42.0, 33.0, 23.0, 25.0, 21.0, 19.0, 7.0, 8.0, 7.0, 8.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.6875, -69.4482421875, -66.208984375, -62.9697265625, -59.73046875, -56.4912109375, -53.251953125, -50.0126953125, -46.7734375, -43.5341796875, -40.294921875, -37.0556640625, -33.81640625, -30.5771484375, -27.337890625, -24.0986328125, -20.859375, -17.6201171875, -14.380859375, -11.1416015625, -7.90234375, -4.6630859375, -1.423828125, 1.8154296875, 5.0546875, 8.2939453125, 11.533203125, 14.7724609375, 18.01171875, 21.2509765625, 24.490234375, 27.7294921875, 30.96875, 34.2080078125, 37.447265625, 40.6865234375, 43.92578125, 47.1650390625, 50.404296875, 53.6435546875, 56.8828125, 60.1220703125, 63.361328125, 66.6005859375, 69.83984375, 73.0791015625, 76.318359375, 79.5576171875, 82.796875, 86.0361328125, 89.275390625, 92.5146484375, 95.75390625, 98.9931640625, 102.232421875, 105.4716796875, 108.7109375, 111.9501953125, 115.189453125, 118.4287109375, 121.66796875, 124.9072265625, 128.146484375, 131.3857421875, 134.625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 5.0, 8.0, 7.0, 19.0, 15.0, 28.0, 24.0, 28.0, 57.0, 82.0, 144.0, 193.0, 317.0, 508.0, 944.0, 2026.0, 5238.0, 16516.0, 79030.0, 779738.0, 128406.0, 23123.0, 6814.0, 2525.0, 1168.0, 579.0, 336.0, 222.0, 129.0, 97.0, 58.0, 57.0, 26.0, 17.0, 20.0, 12.0, 9.0, 7.0, 5.0, 0.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0], "bins": [-13.8671875, -13.4547119140625, -13.042236328125, -12.6297607421875, -12.21728515625, -11.8048095703125, -11.392333984375, -10.9798583984375, -10.5673828125, -10.1549072265625, -9.742431640625, -9.3299560546875, -8.91748046875, -8.5050048828125, -8.092529296875, -7.6800537109375, -7.267578125, -6.8551025390625, -6.442626953125, -6.0301513671875, -5.61767578125, -5.2052001953125, -4.792724609375, -4.3802490234375, -3.9677734375, -3.5552978515625, -3.142822265625, -2.7303466796875, -2.31787109375, -1.9053955078125, -1.492919921875, -1.0804443359375, -0.66796875, -0.2554931640625, 0.156982421875, 0.5694580078125, 0.98193359375, 1.3944091796875, 1.806884765625, 2.2193603515625, 2.6318359375, 3.0443115234375, 3.456787109375, 3.8692626953125, 4.28173828125, 4.6942138671875, 5.106689453125, 5.5191650390625, 5.931640625, 6.3441162109375, 6.756591796875, 7.1690673828125, 7.58154296875, 7.9940185546875, 8.406494140625, 8.8189697265625, 9.2314453125, 9.6439208984375, 10.056396484375, 10.4688720703125, 10.88134765625, 11.2938232421875, 11.706298828125, 12.1187744140625, 12.53125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 7.0, 7.0, 5.0, 2.0, 5.0, 5.0, 17.0, 12.0, 19.0, 22.0, 21.0, 26.0, 43.0, 61.0, 78.0, 110.0, 118.0, 90.0, 93.0, 56.0, 37.0, 35.0, 26.0, 18.0, 16.0, 10.0, 12.0, 6.0, 11.0, 8.0, 6.0, 6.0, 4.0, 3.0, 3.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0031890869140625, -0.0030842721462249756, -0.002979457378387451, -0.0028746426105499268, -0.0027698278427124023, -0.002665013074874878, -0.0025601983070373535, -0.002455383539199829, -0.0023505687713623047, -0.0022457540035247803, -0.002140939235687256, -0.0020361244678497314, -0.001931309700012207, -0.0018264949321746826, -0.0017216801643371582, -0.0016168653964996338, -0.0015120506286621094, -0.001407235860824585, -0.0013024210929870605, -0.0011976063251495361, -0.0010927915573120117, -0.0009879767894744873, -0.0008831620216369629, -0.0007783472537994385, -0.0006735324859619141, -0.0005687177181243896, -0.00046390295028686523, -0.0003590881824493408, -0.0002542734146118164, -0.000149458646774292, -4.464387893676758e-05, 6.0170888900756836e-05, 0.00016498565673828125, 0.00026980042457580566, 0.0003746151924133301, 0.0004794299602508545, 0.0005842447280883789, 0.0006890594959259033, 0.0007938742637634277, 0.0008986890316009521, 0.0010035037994384766, 0.001108318567276001, 0.0012131333351135254, 0.0013179481029510498, 0.0014227628707885742, 0.0015275776386260986, 0.001632392406463623, 0.0017372071743011475, 0.0018420219421386719, 0.0019468367099761963, 0.0020516514778137207, 0.002156466245651245, 0.0022612810134887695, 0.002366095781326294, 0.0024709105491638184, 0.0025757253170013428, 0.002680540084838867, 0.0027853548526763916, 0.002890169620513916, 0.0029949843883514404, 0.003099799156188965, 0.0032046139240264893, 0.0033094286918640137, 0.003414243459701538, 0.0035190582275390625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 6.0, 8.0, 5.0, 5.0, 1.0, 6.0, 13.0, 21.0, 28.0, 41.0, 70.0, 96.0, 127.0, 238.0, 455.0, 1006.0, 2695.0, 8818.0, 56526.0, 858362.0, 101678.0, 12439.0, 3266.0, 1295.0, 575.0, 308.0, 171.0, 112.0, 56.0, 53.0, 22.0, 13.0, 15.0, 10.0, 3.0, 3.0, 1.0, 5.0, 3.0, 4.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.453125, -16.821044921875, -16.18896484375, -15.556884765625, -14.9248046875, -14.292724609375, -13.66064453125, -13.028564453125, -12.396484375, -11.764404296875, -11.13232421875, -10.500244140625, -9.8681640625, -9.236083984375, -8.60400390625, -7.971923828125, -7.33984375, -6.707763671875, -6.07568359375, -5.443603515625, -4.8115234375, -4.179443359375, -3.54736328125, -2.915283203125, -2.283203125, -1.651123046875, -1.01904296875, -0.386962890625, 0.2451171875, 0.877197265625, 1.50927734375, 2.141357421875, 2.7734375, 3.405517578125, 4.03759765625, 4.669677734375, 5.3017578125, 5.933837890625, 6.56591796875, 7.197998046875, 7.830078125, 8.462158203125, 9.09423828125, 9.726318359375, 10.3583984375, 10.990478515625, 11.62255859375, 12.254638671875, 12.88671875, 13.518798828125, 14.15087890625, 14.782958984375, 15.4150390625, 16.047119140625, 16.67919921875, 17.311279296875, 17.943359375, 18.575439453125, 19.20751953125, 19.839599609375, 20.4716796875, 21.103759765625, 21.73583984375, 22.367919921875, 23.0]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 5.0, 8.0, 1.0, 7.0, 7.0, 11.0, 7.0, 8.0, 11.0, 21.0, 25.0, 28.0, 31.0, 34.0, 34.0, 49.0, 61.0, 78.0, 82.0, 88.0, 73.0, 72.0, 48.0, 34.0, 39.0, 28.0, 20.0, 18.0, 12.0, 12.0, 12.0, 6.0, 9.0, 4.0, 1.0, 4.0, 2.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.7578125, -10.440185546875, -10.12255859375, -9.804931640625, -9.4873046875, -9.169677734375, -8.85205078125, -8.534423828125, -8.216796875, -7.899169921875, -7.58154296875, -7.263916015625, -6.9462890625, -6.628662109375, -6.31103515625, -5.993408203125, -5.67578125, -5.358154296875, -5.04052734375, -4.722900390625, -4.4052734375, -4.087646484375, -3.77001953125, -3.452392578125, -3.134765625, -2.817138671875, -2.49951171875, -2.181884765625, -1.8642578125, -1.546630859375, -1.22900390625, -0.911376953125, -0.59375, -0.276123046875, 0.04150390625, 0.359130859375, 0.6767578125, 0.994384765625, 1.31201171875, 1.629638671875, 1.947265625, 2.264892578125, 2.58251953125, 2.900146484375, 3.2177734375, 3.535400390625, 3.85302734375, 4.170654296875, 4.48828125, 4.805908203125, 5.12353515625, 5.441162109375, 5.7587890625, 6.076416015625, 6.39404296875, 6.711669921875, 7.029296875, 7.346923828125, 7.66455078125, 7.982177734375, 8.2998046875, 8.617431640625, 8.93505859375, 9.252685546875, 9.5703125]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 6.0, 7.0, 11.0, 35.0, 48.0, 97.0, 257.0, 267.0, 111.0, 78.0, 33.0, 22.0, 11.0, 6.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-506.16717529296875, -492.85101318359375, -479.53485107421875, -466.21868896484375, -452.9024963378906, -439.5863342285156, -426.2701721191406, -412.9540100097656, -399.6378479003906, -386.3216857910156, -373.0055236816406, -359.6893310546875, -346.3731689453125, -333.0570068359375, -319.7408447265625, -306.4246826171875, -293.1085205078125, -279.7923583984375, -266.4761962890625, -253.16001892089844, -239.84385681152344, -226.52767944335938, -213.21151733398438, -199.89535522460938, -186.57916259765625, -173.26300048828125, -159.9468231201172, -146.6306610107422, -133.3144989013672, -119.99832916259766, -106.68215942382812, -93.36599731445312, -80.04983520507812, -66.7336654663086, -53.417503356933594, -40.10133361816406, -26.785167694091797, -13.469001770019531, -0.15283203125, 13.163330078125, 26.47949981689453, 39.7956657409668, 53.11183166503906, 66.4280014038086, 79.74417114257812, 93.06033325195312, 106.37650299072266, 119.69266510009766, 133.0088348388672, 146.3249969482422, 159.64117431640625, 172.95733642578125, 186.27349853515625, 199.58966064453125, 212.9058380126953, 226.2220001220703, 239.53817749023438, 252.85433959960938, 266.1705017089844, 279.4866943359375, 292.8028564453125, 306.1190185546875, 319.4351806640625, 332.7513427734375, 346.0675048828125]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 4.0, 3.0, 6.0, 12.0, 10.0, 11.0, 11.0, 20.0, 24.0, 22.0, 26.0, 23.0, 25.0, 39.0, 40.0, 51.0, 109.0, 158.0, 82.0, 60.0, 39.0, 31.0, 24.0, 27.0, 24.0, 20.0, 18.0, 10.0, 17.0, 16.0, 9.0, 7.0, 5.0, 5.0, 7.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-376.76458740234375, -367.212646484375, -357.6606750488281, -348.1087341308594, -338.5567932128906, -329.00482177734375, -319.452880859375, -309.90093994140625, -300.3489990234375, -290.79705810546875, -281.2450866699219, -271.6931457519531, -262.1412048339844, -252.58924865722656, -243.03729248046875, -233.4853515625, -223.93338012695312, -214.3814239501953, -204.82948303222656, -195.27752685546875, -185.7255859375, -176.1736297607422, -166.62167358398438, -157.06973266601562, -147.5177764892578, -137.9658203125, -128.41387939453125, -118.86192321777344, -109.30997467041016, -99.75802612304688, -90.20606994628906, -80.65412139892578, -71.1021728515625, -61.55022430419922, -51.99827194213867, -42.446319580078125, -32.894371032714844, -23.342422485351562, -13.790470123291016, -4.238517761230469, 5.3134307861328125, 14.865381240844727, 24.41733169555664, 33.96928405761719, 43.52123260498047, 53.07318115234375, 62.6251335144043, 72.17708587646484, 81.72903442382812, 91.2809829711914, 100.83293151855469, 110.3848876953125, 119.93683624267578, 129.48878479003906, 139.04074096679688, 148.59268188476562, 158.14463806152344, 167.69659423828125, 177.24853515625, 186.8004913330078, 196.35244750976562, 205.90438842773438, 215.4563446044922, 225.00830078125, 234.56024169921875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 4.0, 7.0, 13.0, 12.0, 20.0, 29.0, 48.0, 52.0, 74.0, 103.0, 178.0, 275.0, 440.0, 877.0, 1768.0, 4305.0, 14571.0, 102867.0, 1713810.0, 2190659.0, 138283.0, 16874.0, 4825.0, 2000.0, 909.0, 456.0, 294.0, 171.0, 108.0, 68.0, 53.0, 35.0, 32.0, 17.0, 15.0, 8.0, 4.0, 8.0, 4.0, 0.0, 2.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.96875, -52.3359375, -50.703125, -49.0703125, -47.4375, -45.8046875, -44.171875, -42.5390625, -40.90625, -39.2734375, -37.640625, -36.0078125, -34.375, -32.7421875, -31.109375, -29.4765625, -27.84375, -26.2109375, -24.578125, -22.9453125, -21.3125, -19.6796875, -18.046875, -16.4140625, -14.78125, -13.1484375, -11.515625, -9.8828125, -8.25, -6.6171875, -4.984375, -3.3515625, -1.71875, -0.0859375, 1.546875, 3.1796875, 4.8125, 6.4453125, 8.078125, 9.7109375, 11.34375, 12.9765625, 14.609375, 16.2421875, 17.875, 19.5078125, 21.140625, 22.7734375, 24.40625, 26.0390625, 27.671875, 29.3046875, 30.9375, 32.5703125, 34.203125, 35.8359375, 37.46875, 39.1015625, 40.734375, 42.3671875, 44.0, 45.6328125, 47.265625, 48.8984375, 50.53125]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 8.0, 8.0, 9.0, 5.0, 7.0, 6.0, 9.0, 10.0, 20.0, 27.0, 9.0, 28.0, 21.0, 28.0, 25.0, 36.0, 34.0, 39.0, 30.0, 43.0, 32.0, 43.0, 50.0, 40.0, 44.0, 40.0, 40.0, 33.0, 46.0, 19.0, 30.0, 23.0, 27.0, 21.0, 17.0, 20.0, 9.0, 17.0, 11.0, 8.0, 8.0, 7.0, 5.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-16.9375, -16.412841796875, -15.88818359375, -15.363525390625, -14.8388671875, -14.314208984375, -13.78955078125, -13.264892578125, -12.740234375, -12.215576171875, -11.69091796875, -11.166259765625, -10.6416015625, -10.116943359375, -9.59228515625, -9.067626953125, -8.54296875, -8.018310546875, -7.49365234375, -6.968994140625, -6.4443359375, -5.919677734375, -5.39501953125, -4.870361328125, -4.345703125, -3.821044921875, -3.29638671875, -2.771728515625, -2.2470703125, -1.722412109375, -1.19775390625, -0.673095703125, -0.1484375, 0.376220703125, 0.90087890625, 1.425537109375, 1.9501953125, 2.474853515625, 2.99951171875, 3.524169921875, 4.048828125, 4.573486328125, 5.09814453125, 5.622802734375, 6.1474609375, 6.672119140625, 7.19677734375, 7.721435546875, 8.24609375, 8.770751953125, 9.29541015625, 9.820068359375, 10.3447265625, 10.869384765625, 11.39404296875, 11.918701171875, 12.443359375, 12.968017578125, 13.49267578125, 14.017333984375, 14.5419921875, 15.066650390625, 15.59130859375, 16.115966796875, 16.640625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 5.0, 8.0, 8.0, 18.0, 19.0, 42.0, 65.0, 125.0, 244.0, 480.0, 1376.0, 7559.0, 726264.0, 3443099.0, 11890.0, 1836.0, 617.0, 269.0, 143.0, 82.0, 47.0, 29.0, 19.0, 14.0, 9.0, 1.0, 6.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-168.625, -163.52734375, -158.4296875, -153.33203125, -148.234375, -143.13671875, -138.0390625, -132.94140625, -127.84375, -122.74609375, -117.6484375, -112.55078125, -107.453125, -102.35546875, -97.2578125, -92.16015625, -87.0625, -81.96484375, -76.8671875, -71.76953125, -66.671875, -61.57421875, -56.4765625, -51.37890625, -46.28125, -41.18359375, -36.0859375, -30.98828125, -25.890625, -20.79296875, -15.6953125, -10.59765625, -5.5, -0.40234375, 4.6953125, 9.79296875, 14.890625, 19.98828125, 25.0859375, 30.18359375, 35.28125, 40.37890625, 45.4765625, 50.57421875, 55.671875, 60.76953125, 65.8671875, 70.96484375, 76.0625, 81.16015625, 86.2578125, 91.35546875, 96.453125, 101.55078125, 106.6484375, 111.74609375, 116.84375, 121.94140625, 127.0390625, 132.13671875, 137.234375, 142.33203125, 147.4296875, 152.52734375, 157.625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 5.0, 10.0, 15.0, 27.0, 42.0, 64.0, 91.0, 169.0, 348.0, 731.0, 1113.0, 678.0, 334.0, 168.0, 104.0, 69.0, 35.0, 29.0, 24.0, 7.0, 6.0, 4.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-87.0625, -84.0, -80.9375, -77.875, -74.8125, -71.75, -68.6875, -65.625, -62.5625, -59.5, -56.4375, -53.375, -50.3125, -47.25, -44.1875, -41.125, -38.0625, -35.0, -31.9375, -28.875, -25.8125, -22.75, -19.6875, -16.625, -13.5625, -10.5, -7.4375, -4.375, -1.3125, 1.75, 4.8125, 7.875, 10.9375, 14.0, 17.0625, 20.125, 23.1875, 26.25, 29.3125, 32.375, 35.4375, 38.5, 41.5625, 44.625, 47.6875, 50.75, 53.8125, 56.875, 59.9375, 63.0, 66.0625, 69.125, 72.1875, 75.25, 78.3125, 81.375, 84.4375, 87.5, 90.5625, 93.625, 96.6875, 99.75, 102.8125, 105.875, 108.9375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 9.0, 7.0, 24.0, 62.0, 148.0, 332.0, 234.0, 101.0, 44.0, 22.0, 6.0, 6.0, 2.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1322.56689453125, -1285.486328125, -1248.4056396484375, -1211.3250732421875, -1174.244384765625, -1137.163818359375, -1100.083251953125, -1063.002685546875, -1025.9219970703125, -988.8413696289062, -951.7607421875, -914.68017578125, -877.5995483398438, -840.5189208984375, -803.4383544921875, -766.3577270507812, -729.277099609375, -692.1964721679688, -655.1158447265625, -618.0352783203125, -580.9546508789062, -543.8740234375, -506.7934265136719, -469.71282958984375, -432.6322021484375, -395.55157470703125, -358.4709777832031, -321.390380859375, -284.30975341796875, -247.22914123535156, -210.14852905273438, -173.06793212890625, -135.9874267578125, -98.90681457519531, -61.826202392578125, -24.745590209960938, 12.33502197265625, 49.41563415527344, 86.49624633789062, 123.57684326171875, 160.657470703125, 197.7380828857422, 234.81869506835938, 271.8992919921875, 308.97991943359375, 346.060546875, 383.1411437988281, 420.22174072265625, 457.3023681640625, 494.38299560546875, 531.463623046875, 568.544189453125, 605.6248168945312, 642.7054443359375, 679.7860107421875, 716.8666381835938, 753.947265625, 791.0278930664062, 828.1085205078125, 865.1890869140625, 902.2697143554688, 939.350341796875, 976.430908203125, 1013.5115356445312, 1050.5921630859375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 6.0, 10.0, 3.0, 8.0, 7.0, 9.0, 11.0, 7.0, 18.0, 16.0, 29.0, 22.0, 27.0, 31.0, 31.0, 32.0, 55.0, 38.0, 51.0, 41.0, 49.0, 70.0, 41.0, 52.0, 48.0, 31.0, 41.0, 39.0, 19.0, 31.0, 21.0, 28.0, 15.0, 17.0, 9.0, 8.0, 6.0, 3.0, 3.0, 6.0, 5.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-370.226318359375, -359.552001953125, -348.8777160644531, -338.2033996582031, -327.52911376953125, -316.85479736328125, -306.18048095703125, -295.5061950683594, -284.8319091796875, -274.1575927734375, -263.4833068847656, -252.80899047851562, -242.13470458984375, -231.46038818359375, -220.7860870361328, -210.11178588867188, -199.43746948242188, -188.76316833496094, -178.0888671875, -167.41455078125, -156.74026489257812, -146.06594848632812, -135.3916473388672, -124.71734619140625, -114.04304504394531, -103.36874389648438, -92.69444274902344, -82.02013397216797, -71.34583282470703, -60.671531677246094, -49.997222900390625, -39.32292175292969, -28.648590087890625, -17.974287033081055, -7.299983978271484, 3.3743209838867188, 14.048622131347656, 24.722923278808594, 35.39723205566406, 46.071533203125, 56.74583435058594, 67.42013549804688, 78.09443664550781, 88.76874542236328, 99.44304656982422, 110.11734771728516, 120.79165649414062, 131.46595764160156, 142.1402587890625, 152.81455993652344, 163.48886108398438, 174.16317749023438, 184.83746337890625, 195.51177978515625, 206.1860809326172, 216.86038208007812, 227.53468322753906, 238.208984375, 248.88328552246094, 259.5575866699219, 270.2319030761719, 280.90618896484375, 291.58050537109375, 302.25482177734375, 312.9291076660156]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 6.0, 8.0, 7.0, 19.0, 52.0, 67.0, 144.0, 270.0, 514.0, 1288.0, 3365.0, 10512.0, 46824.0, 371099.0, 532735.0, 61926.0, 13219.0, 3853.0, 1458.0, 579.0, 303.0, 126.0, 93.0, 41.0, 16.0, 16.0, 8.0, 7.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-78.375, -76.41943359375, -74.4638671875, -72.50830078125, -70.552734375, -68.59716796875, -66.6416015625, -64.68603515625, -62.73046875, -60.77490234375, -58.8193359375, -56.86376953125, -54.908203125, -52.95263671875, -50.9970703125, -49.04150390625, -47.0859375, -45.13037109375, -43.1748046875, -41.21923828125, -39.263671875, -37.30810546875, -35.3525390625, -33.39697265625, -31.44140625, -29.48583984375, -27.5302734375, -25.57470703125, -23.619140625, -21.66357421875, -19.7080078125, -17.75244140625, -15.796875, -13.84130859375, -11.8857421875, -9.93017578125, -7.974609375, -6.01904296875, -4.0634765625, -2.10791015625, -0.15234375, 1.80322265625, 3.7587890625, 5.71435546875, 7.669921875, 9.62548828125, 11.5810546875, 13.53662109375, 15.4921875, 17.44775390625, 19.4033203125, 21.35888671875, 23.314453125, 25.27001953125, 27.2255859375, 29.18115234375, 31.13671875, 33.09228515625, 35.0478515625, 37.00341796875, 38.958984375, 40.91455078125, 42.8701171875, 44.82568359375, 46.78125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 4.0, 2.0, 4.0, 2.0, 2.0, 4.0, 10.0, 4.0, 3.0, 5.0, 9.0, 11.0, 11.0, 19.0, 18.0, 26.0, 33.0, 18.0, 30.0, 38.0, 25.0, 51.0, 40.0, 39.0, 50.0, 45.0, 50.0, 31.0, 53.0, 39.0, 34.0, 42.0, 30.0, 40.0, 28.0, 26.0, 32.0, 21.0, 19.0, 9.0, 8.0, 13.0, 9.0, 6.0, 7.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.96875, -22.26953125, -21.5703125, -20.87109375, -20.171875, -19.47265625, -18.7734375, -18.07421875, -17.375, -16.67578125, -15.9765625, -15.27734375, -14.578125, -13.87890625, -13.1796875, -12.48046875, -11.78125, -11.08203125, -10.3828125, -9.68359375, -8.984375, -8.28515625, -7.5859375, -6.88671875, -6.1875, -5.48828125, -4.7890625, -4.08984375, -3.390625, -2.69140625, -1.9921875, -1.29296875, -0.59375, 0.10546875, 0.8046875, 1.50390625, 2.203125, 2.90234375, 3.6015625, 4.30078125, 5.0, 5.69921875, 6.3984375, 7.09765625, 7.796875, 8.49609375, 9.1953125, 9.89453125, 10.59375, 11.29296875, 11.9921875, 12.69140625, 13.390625, 14.08984375, 14.7890625, 15.48828125, 16.1875, 16.88671875, 17.5859375, 18.28515625, 18.984375, 19.68359375, 20.3828125, 21.08203125, 21.78125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 6.0, 9.0, 17.0, 32.0, 41.0, 68.0, 109.0, 240.0, 486.0, 1357.0, 6214.0, 108303.0, 907870.0, 19727.0, 2593.0, 764.0, 335.0, 150.0, 87.0, 52.0, 33.0, 16.0, 16.0, 9.0, 0.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-93.1875, -90.2978515625, -87.408203125, -84.5185546875, -81.62890625, -78.7392578125, -75.849609375, -72.9599609375, -70.0703125, -67.1806640625, -64.291015625, -61.4013671875, -58.51171875, -55.6220703125, -52.732421875, -49.8427734375, -46.953125, -44.0634765625, -41.173828125, -38.2841796875, -35.39453125, -32.5048828125, -29.615234375, -26.7255859375, -23.8359375, -20.9462890625, -18.056640625, -15.1669921875, -12.27734375, -9.3876953125, -6.498046875, -3.6083984375, -0.71875, 2.1708984375, 5.060546875, 7.9501953125, 10.83984375, 13.7294921875, 16.619140625, 19.5087890625, 22.3984375, 25.2880859375, 28.177734375, 31.0673828125, 33.95703125, 36.8466796875, 39.736328125, 42.6259765625, 45.515625, 48.4052734375, 51.294921875, 54.1845703125, 57.07421875, 59.9638671875, 62.853515625, 65.7431640625, 68.6328125, 71.5224609375, 74.412109375, 77.3017578125, 80.19140625, 83.0810546875, 85.970703125, 88.8603515625, 91.75]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 1.0, 8.0, 3.0, 5.0, 3.0, 5.0, 8.0, 9.0, 13.0, 14.0, 15.0, 23.0, 13.0, 29.0, 29.0, 34.0, 36.0, 51.0, 62.0, 61.0, 63.0, 63.0, 70.0, 59.0, 52.0, 45.0, 29.0, 32.0, 24.0, 28.0, 19.0, 13.0, 16.0, 13.0, 6.0, 14.0, 6.0, 3.0, 6.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-80.0, -77.26171875, -74.5234375, -71.78515625, -69.046875, -66.30859375, -63.5703125, -60.83203125, -58.09375, -55.35546875, -52.6171875, -49.87890625, -47.140625, -44.40234375, -41.6640625, -38.92578125, -36.1875, -33.44921875, -30.7109375, -27.97265625, -25.234375, -22.49609375, -19.7578125, -17.01953125, -14.28125, -11.54296875, -8.8046875, -6.06640625, -3.328125, -0.58984375, 2.1484375, 4.88671875, 7.625, 10.36328125, 13.1015625, 15.83984375, 18.578125, 21.31640625, 24.0546875, 26.79296875, 29.53125, 32.26953125, 35.0078125, 37.74609375, 40.484375, 43.22265625, 45.9609375, 48.69921875, 51.4375, 54.17578125, 56.9140625, 59.65234375, 62.390625, 65.12890625, 67.8671875, 70.60546875, 73.34375, 76.08203125, 78.8203125, 81.55859375, 84.296875, 87.03515625, 89.7734375, 92.51171875, 95.25]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 9.0, 12.0, 31.0, 35.0, 71.0, 143.0, 384.0, 1892.0, 19130.0, 982898.0, 40313.0, 2715.0, 548.0, 196.0, 72.0, 41.0, 24.0, 14.0, 10.0, 8.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.578125, -18.893798828125, -18.20947265625, -17.525146484375, -16.8408203125, -16.156494140625, -15.47216796875, -14.787841796875, -14.103515625, -13.419189453125, -12.73486328125, -12.050537109375, -11.3662109375, -10.681884765625, -9.99755859375, -9.313232421875, -8.62890625, -7.944580078125, -7.26025390625, -6.575927734375, -5.8916015625, -5.207275390625, -4.52294921875, -3.838623046875, -3.154296875, -2.469970703125, -1.78564453125, -1.101318359375, -0.4169921875, 0.267333984375, 0.95166015625, 1.635986328125, 2.3203125, 3.004638671875, 3.68896484375, 4.373291015625, 5.0576171875, 5.741943359375, 6.42626953125, 7.110595703125, 7.794921875, 8.479248046875, 9.16357421875, 9.847900390625, 10.5322265625, 11.216552734375, 11.90087890625, 12.585205078125, 13.26953125, 13.953857421875, 14.63818359375, 15.322509765625, 16.0068359375, 16.691162109375, 17.37548828125, 18.059814453125, 18.744140625, 19.428466796875, 20.11279296875, 20.797119140625, 21.4814453125, 22.165771484375, 22.85009765625, 23.534423828125, 24.21875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 6.0, 9.0, 11.0, 17.0, 14.0, 26.0, 29.0, 40.0, 31.0, 48.0, 81.0, 89.0, 114.0, 109.0, 91.0, 82.0, 49.0, 32.0, 29.0, 20.0, 22.0, 13.0, 8.0, 7.0, 6.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0028228759765625, -0.002737104892730713, -0.0026513338088989258, -0.0025655627250671387, -0.0024797916412353516, -0.0023940205574035645, -0.0023082494735717773, -0.0022224783897399902, -0.002136707305908203, -0.002050936222076416, -0.001965165138244629, -0.0018793940544128418, -0.0017936229705810547, -0.0017078518867492676, -0.0016220808029174805, -0.0015363097190856934, -0.0014505386352539062, -0.0013647675514221191, -0.001278996467590332, -0.001193225383758545, -0.0011074542999267578, -0.0010216832160949707, -0.0009359121322631836, -0.0008501410484313965, -0.0007643699645996094, -0.0006785988807678223, -0.0005928277969360352, -0.000507056713104248, -0.00042128562927246094, -0.00033551454544067383, -0.0002497434616088867, -0.0001639723777770996, -7.82012939453125e-05, 7.569789886474609e-06, 9.334087371826172e-05, 0.00017911195755004883, 0.00026488304138183594, 0.00035065412521362305, 0.00043642520904541016, 0.0005221962928771973, 0.0006079673767089844, 0.0006937384605407715, 0.0007795095443725586, 0.0008652806282043457, 0.0009510517120361328, 0.00103682279586792, 0.001122593879699707, 0.0012083649635314941, 0.0012941360473632812, 0.0013799071311950684, 0.0014656782150268555, 0.0015514492988586426, 0.0016372203826904297, 0.0017229914665222168, 0.001808762550354004, 0.001894533634185791, 0.001980304718017578, 0.0020660758018493652, 0.0021518468856811523, 0.0022376179695129395, 0.0023233890533447266, 0.0024091601371765137, 0.0024949312210083008, 0.002580702304840088, 0.002666473388671875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 3.0, 5.0, 1.0, 7.0, 10.0, 14.0, 18.0, 51.0, 97.0, 244.0, 994.0, 11301.0, 999518.0, 33933.0, 1763.0, 348.0, 123.0, 69.0, 23.0, 10.0, 4.0, 5.0, 4.0, 3.0, 4.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-32.8125, -31.98486328125, -31.1572265625, -30.32958984375, -29.501953125, -28.67431640625, -27.8466796875, -27.01904296875, -26.19140625, -25.36376953125, -24.5361328125, -23.70849609375, -22.880859375, -22.05322265625, -21.2255859375, -20.39794921875, -19.5703125, -18.74267578125, -17.9150390625, -17.08740234375, -16.259765625, -15.43212890625, -14.6044921875, -13.77685546875, -12.94921875, -12.12158203125, -11.2939453125, -10.46630859375, -9.638671875, -8.81103515625, -7.9833984375, -7.15576171875, -6.328125, -5.50048828125, -4.6728515625, -3.84521484375, -3.017578125, -2.18994140625, -1.3623046875, -0.53466796875, 0.29296875, 1.12060546875, 1.9482421875, 2.77587890625, 3.603515625, 4.43115234375, 5.2587890625, 6.08642578125, 6.9140625, 7.74169921875, 8.5693359375, 9.39697265625, 10.224609375, 11.05224609375, 11.8798828125, 12.70751953125, 13.53515625, 14.36279296875, 15.1904296875, 16.01806640625, 16.845703125, 17.67333984375, 18.5009765625, 19.32861328125, 20.15625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 1.0, 6.0, 10.0, 6.0, 14.0, 21.0, 20.0, 44.0, 52.0, 75.0, 86.0, 140.0, 120.0, 107.0, 86.0, 65.0, 46.0, 28.0, 19.0, 9.0, 8.0, 8.0, 5.0, 5.0, 6.0, 3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-9.8203125, -9.5064697265625, -9.192626953125, -8.8787841796875, -8.56494140625, -8.2510986328125, -7.937255859375, -7.6234130859375, -7.3095703125, -6.9957275390625, -6.681884765625, -6.3680419921875, -6.05419921875, -5.7403564453125, -5.426513671875, -5.1126708984375, -4.798828125, -4.4849853515625, -4.171142578125, -3.8572998046875, -3.54345703125, -3.2296142578125, -2.915771484375, -2.6019287109375, -2.2880859375, -1.9742431640625, -1.660400390625, -1.3465576171875, -1.03271484375, -0.7188720703125, -0.405029296875, -0.0911865234375, 0.22265625, 0.5364990234375, 0.850341796875, 1.1641845703125, 1.47802734375, 1.7918701171875, 2.105712890625, 2.4195556640625, 2.7333984375, 3.0472412109375, 3.361083984375, 3.6749267578125, 3.98876953125, 4.3026123046875, 4.616455078125, 4.9302978515625, 5.244140625, 5.5579833984375, 5.871826171875, 6.1856689453125, 6.49951171875, 6.8133544921875, 7.127197265625, 7.4410400390625, 7.7548828125, 8.0687255859375, 8.382568359375, 8.6964111328125, 9.01025390625, 9.3240966796875, 9.637939453125, 9.9517822265625, 10.265625]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 3.0, 11.0, 31.0, 67.0, 324.0, 455.0, 80.0, 19.0, 8.0, 2.0, 4.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1020.0196533203125, -994.6287231445312, -969.23779296875, -943.846923828125, -918.4559936523438, -893.0650634765625, -867.6741333007812, -842.283203125, -816.892333984375, -791.5014038085938, -766.1104736328125, -740.7196044921875, -715.3286743164062, -689.937744140625, -664.5468139648438, -639.1558837890625, -613.7650146484375, -588.3740844726562, -562.983154296875, -537.59228515625, -512.2013549804688, -486.8104248046875, -461.41949462890625, -436.0285949707031, -410.63763427734375, -385.2467041015625, -359.8558044433594, -334.4648742675781, -309.073974609375, -283.68304443359375, -258.2921142578125, -232.90121459960938, -207.51031494140625, -182.11940002441406, -156.72848510742188, -131.33755493164062, -105.94664764404297, -80.55573272705078, -55.16481018066406, -29.773895263671875, -4.3829803466796875, 21.007936477661133, 46.39885330200195, 71.7897720336914, 97.1806869506836, 122.57160186767578, 147.9625244140625, 173.3534393310547, 198.74435424804688, 224.13526916503906, 249.52618408203125, 274.9171142578125, 300.3080139160156, 325.6989440917969, 351.08984375, 376.48077392578125, 401.8717041015625, 427.26263427734375, 452.6535339355469, 478.0444641113281, 503.43536376953125, 528.8262939453125, 554.2172241210938, 579.608154296875, 604.9990234375]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 2.0, 8.0, 5.0, 12.0, 11.0, 7.0, 10.0, 16.0, 15.0, 13.0, 13.0, 18.0, 33.0, 62.0, 105.0, 71.0, 70.0, 60.0, 58.0, 65.0, 118.0, 51.0, 29.0, 30.0, 21.0, 14.0, 22.0, 21.0, 7.0, 7.0, 4.0, 6.0, 6.0, 3.0, 2.0, 4.0, 1.0, 4.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-309.3206787109375, -300.3393249511719, -291.35797119140625, -282.3766174316406, -273.395263671875, -264.4139099121094, -255.4325714111328, -246.4512176513672, -237.46986389160156, -228.48851013183594, -219.5071563720703, -210.5258026123047, -201.54446411132812, -192.5631103515625, -183.58175659179688, -174.60040283203125, -165.61904907226562, -156.6376953125, -147.65634155273438, -138.67498779296875, -129.69363403320312, -120.71228790283203, -111.73094177246094, -102.74958801269531, -93.76823425292969, -84.78688049316406, -75.80552673339844, -66.82418060302734, -57.84282684326172, -48.861473083496094, -39.880123138427734, -30.898773193359375, -21.917449951171875, -12.936098098754883, -3.9547462463378906, 5.026605606079102, 14.007957458496094, 22.98931121826172, 31.970661163330078, 40.95201110839844, 49.93336486816406, 58.91471862792969, 67.89607238769531, 76.8774185180664, 85.85877227783203, 94.84012603759766, 103.82147216796875, 112.80282592773438, 121.7841796875, 130.76553344726562, 139.74688720703125, 148.72824096679688, 157.7095947265625, 166.69094848632812, 175.6722869873047, 184.6536407470703, 193.63499450683594, 202.61634826660156, 211.5977020263672, 220.5790557861328, 229.56039428710938, 238.541748046875, 247.52310180664062, 256.50445556640625, 265.4858093261719]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 3.0, 4.0, 6.0, 5.0, 7.0, 10.0, 10.0, 16.0, 15.0, 23.0, 34.0, 31.0, 32.0, 30.0, 58.0, 138.0, 238.0, 59.0, 48.0, 42.0, 29.0, 33.0, 19.0, 16.0, 16.0, 18.0, 16.0, 9.0, 6.0, 6.0, 12.0, 6.0, 2.0, 4.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-25.984375, -25.178466796875, -24.37255859375, -23.566650390625, -22.7607421875, -21.954833984375, -21.14892578125, -20.343017578125, -19.537109375, -18.731201171875, -17.92529296875, -17.119384765625, -16.3134765625, -15.507568359375, -14.70166015625, -13.895751953125, -13.08984375, -12.283935546875, -11.47802734375, -10.672119140625, -9.8662109375, -9.060302734375, -8.25439453125, -7.448486328125, -6.642578125, -5.836669921875, -5.03076171875, -4.224853515625, -3.4189453125, -2.613037109375, -1.80712890625, -1.001220703125, -0.1953125, 0.610595703125, 1.41650390625, 2.222412109375, 3.0283203125, 3.834228515625, 4.64013671875, 5.446044921875, 6.251953125, 7.057861328125, 7.86376953125, 8.669677734375, 9.4755859375, 10.281494140625, 11.08740234375, 11.893310546875, 12.69921875, 13.505126953125, 14.31103515625, 15.116943359375, 15.9228515625, 16.728759765625, 17.53466796875, 18.340576171875, 19.146484375, 19.952392578125, 20.75830078125, 21.564208984375, 22.3701171875, 23.176025390625, 23.98193359375, 24.787841796875, 25.59375]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 8.0, 1.0, 4.0, 3.0, 3.0, 2.0, 5.0, 5.0, 2.0, 11.0, 10.0, 20.0, 13.0, 28.0, 48.0, 80.0, 209.0, 611.0, 3383.0, 7849317.0, 530555.0, 3227.0, 632.0, 171.0, 73.0, 32.0, 33.0, 26.0, 29.0, 13.0, 10.0, 8.0, 2.0, 5.0, 0.0, 2.0, 0.0, 0.0, 2.0, 5.0, 5.0, 0.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0], "bins": [-325.1297607421875, -313.08160400390625, -301.0334777832031, -288.9853210449219, -276.93719482421875, -264.8890380859375, -252.84091186523438, -240.79275512695312, -228.74462890625, -216.6964874267578, -204.64834594726562, -192.60020446777344, -180.55206298828125, -168.50392150878906, -156.45578002929688, -144.40762329101562, -132.35948181152344, -120.31134033203125, -108.26319885253906, -96.21505737304688, -84.16691589355469, -72.1187744140625, -60.07062530517578, -48.022483825683594, -35.974342346191406, -23.92620086669922, -11.878057479858398, 0.17008590698242188, 12.21822738647461, 24.266368865966797, 36.31451416015625, 48.36265563964844, 60.410797119140625, 72.45893859863281, 84.507080078125, 96.55522155761719, 108.60336303710938, 120.65150451660156, 132.69964599609375, 144.747802734375, 156.79592895507812, 168.8440704345703, 180.8922119140625, 192.9403533935547, 204.98849487304688, 217.03663635253906, 229.08477783203125, 241.1329345703125, 253.1810760498047, 265.2292175292969, 277.2773742675781, 289.32550048828125, 301.3736572265625, 313.4217834472656, 325.4699401855469, 337.51806640625, 349.56622314453125, 361.6143798828125, 373.6625061035156, 385.7106628417969, 397.7587890625, 409.80694580078125, 421.8550720214844, 433.9032287597656, 445.95135498046875]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 6.0, 6.0, 6.0, 8.0, 10.0, 7.0, 5.0, 5.0, 2.0, 4.0, 10.0, 8.0, 4.0, 2.0, 2.0, 3.0, 0.0, 2.0, 3.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-575.4168090820312, -561.3034057617188, -547.1900634765625, -533.07666015625, -518.9633178710938, -504.84991455078125, -490.7365417480469, -476.6231689453125, -462.509765625, -448.3963928222656, -434.28302001953125, -420.16961669921875, -406.0562438964844, -391.94287109375, -377.8294982910156, -363.71612548828125, -349.6027526855469, -335.4893798828125, -321.3760070800781, -307.26263427734375, -293.14923095703125, -279.0358581542969, -264.9224853515625, -250.80911254882812, -236.6957244873047, -222.5823516845703, -208.46896362304688, -194.3555908203125, -180.24221801757812, -166.1288299560547, -152.0154571533203, -137.90206909179688, -123.78872680664062, -109.67534637451172, -95.56196594238281, -81.44859313964844, -67.33521270751953, -53.221832275390625, -39.10845947265625, -24.995079040527344, -10.881698608398438, 3.231679916381836, 17.34505844116211, 31.45843505859375, 45.571815490722656, 59.68519592285156, 73.79856872558594, 87.91194915771484, 102.02532958984375, 116.13871002197266, 130.25209045410156, 144.36546325683594, 158.47885131835938, 172.59222412109375, 186.70559692382812, 200.8189697265625, 214.93235778808594, 229.0457305908203, 243.15911865234375, 257.2724914550781, 271.3858642578125, 285.499267578125, 299.61260986328125, 313.72601318359375, 327.8393859863281]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 4.0, 8.0, 4.0, 7.0, 15.0, 24.0, 32.0, 32.0, 46.0, 84.0, 127.0, 205.0, 364.0, 566.0, 1265.0, 2893.0, 7531.0, 21454.0, 65663.0, 179675.0, 161210.0, 55019.0, 17413.0, 6110.0, 2344.0, 1054.0, 506.0, 252.0, 151.0, 67.0, 58.0, 34.0, 10.0, 12.0, 12.0, 9.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-206.5, -200.751953125, -195.00390625, -189.255859375, -183.5078125, -177.759765625, -172.01171875, -166.263671875, -160.515625, -154.767578125, -149.01953125, -143.271484375, -137.5234375, -131.775390625, -126.02734375, -120.279296875, -114.53125, -108.783203125, -103.03515625, -97.287109375, -91.5390625, -85.791015625, -80.04296875, -74.294921875, -68.546875, -62.798828125, -57.05078125, -51.302734375, -45.5546875, -39.806640625, -34.05859375, -28.310546875, -22.5625, -16.814453125, -11.06640625, -5.318359375, 0.4296875, 6.177734375, 11.92578125, 17.673828125, 23.421875, 29.169921875, 34.91796875, 40.666015625, 46.4140625, 52.162109375, 57.91015625, 63.658203125, 69.40625, 75.154296875, 80.90234375, 86.650390625, 92.3984375, 98.146484375, 103.89453125, 109.642578125, 115.390625, 121.138671875, 126.88671875, 132.634765625, 138.3828125, 144.130859375, 149.87890625, 155.626953125, 161.375]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 5.0, 1.0, 0.0, 1.0, 2.0, 9.0, 5.0, 8.0, 10.0, 10.0, 11.0, 20.0, 7.0, 9.0, 16.0, 23.0, 23.0, 29.0, 27.0, 37.0, 37.0, 56.0, 45.0, 60.0, 65.0, 57.0, 48.0, 32.0, 45.0, 52.0, 37.0, 35.0, 30.0, 26.0, 29.0, 16.0, 22.0, 12.0, 13.0, 11.0, 7.0, 5.0, 4.0, 5.0, 1.0, 4.0, 3.0, 4.0, 0.0, 0.0, 1.0], "bins": [-27.640625, -26.92138671875, -26.2021484375, -25.48291015625, -24.763671875, -24.04443359375, -23.3251953125, -22.60595703125, -21.88671875, -21.16748046875, -20.4482421875, -19.72900390625, -19.009765625, -18.29052734375, -17.5712890625, -16.85205078125, -16.1328125, -15.41357421875, -14.6943359375, -13.97509765625, -13.255859375, -12.53662109375, -11.8173828125, -11.09814453125, -10.37890625, -9.65966796875, -8.9404296875, -8.22119140625, -7.501953125, -6.78271484375, -6.0634765625, -5.34423828125, -4.625, -3.90576171875, -3.1865234375, -2.46728515625, -1.748046875, -1.02880859375, -0.3095703125, 0.40966796875, 1.12890625, 1.84814453125, 2.5673828125, 3.28662109375, 4.005859375, 4.72509765625, 5.4443359375, 6.16357421875, 6.8828125, 7.60205078125, 8.3212890625, 9.04052734375, 9.759765625, 10.47900390625, 11.1982421875, 11.91748046875, 12.63671875, 13.35595703125, 14.0751953125, 14.79443359375, 15.513671875, 16.23291015625, 16.9521484375, 17.67138671875, 18.390625]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 6.0, 3.0, 5.0, 5.0, 6.0, 7.0, 9.0, 13.0, 22.0, 32.0, 66.0, 80.0, 104.0, 75.0, 41.0, 8.0, 6.0, 0.0, 2.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-218.3271484375, -208.95359802246094, -199.58004760742188, -190.2064971923828, -180.83294677734375, -171.45938110351562, -162.08583068847656, -152.7122802734375, -143.33872985839844, -133.96517944335938, -124.59162902832031, -115.21807098388672, -105.84452056884766, -96.4709701538086, -87.097412109375, -77.72386169433594, -68.35031127929688, -58.97676086425781, -49.603206634521484, -40.229652404785156, -30.856101989746094, -21.48255157470703, -12.108997344970703, -2.735443115234375, 6.6381072998046875, 16.011659622192383, 25.385211944580078, 34.758766174316406, 44.13231658935547, 53.50586700439453, 62.87942123413086, 72.25297546386719, 81.62652587890625, 91.00007629394531, 100.37362670898438, 109.74718475341797, 119.12073516845703, 128.49429321289062, 137.8678436279297, 147.24139404296875, 156.6149444580078, 165.98849487304688, 175.36204528808594, 184.735595703125, 194.10916137695312, 203.48269653320312, 212.85626220703125, 222.2298126220703, 231.60336303710938, 240.97691345214844, 250.3504638671875, 259.7240295410156, 269.0975646972656, 278.47113037109375, 287.84466552734375, 297.2182312011719, 306.591796875, 315.9653625488281, 325.3388977050781, 334.71246337890625, 344.08599853515625, 353.4595642089844, 362.8330993652344, 372.2066650390625, 381.5802001953125]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 0.0, 1.0, 1.0, 4.0, 3.0, 1.0, 7.0, 8.0, 4.0, 5.0, 9.0, 17.0, 17.0, 44.0, 62.0, 76.0, 91.0, 54.0, 28.0, 23.0, 4.0, 8.0, 4.0, 5.0, 3.0, 2.0, 2.0, 2.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-166.83026123046875, -161.76821899414062, -156.7061767578125, -151.64413452148438, -146.58209228515625, -141.52005004882812, -136.4580078125, -131.39596557617188, -126.33393096923828, -121.27188873291016, -116.20984649658203, -111.1478042602539, -106.08576965332031, -101.02372741699219, -95.96168518066406, -90.89964294433594, -85.83760070800781, -80.77555847167969, -75.71351623535156, -70.65147399902344, -65.58943176269531, -60.52739334106445, -55.465354919433594, -50.40331268310547, -45.341270446777344, -40.27922821044922, -35.217185974121094, -30.155147552490234, -25.09310531616211, -20.031063079833984, -14.969022750854492, -9.906982421875, -4.844940185546875, 0.2171010971069336, 5.279142379760742, 10.34118366241455, 15.40322494506836, 20.465267181396484, 25.527307510375977, 30.58934783935547, 35.651390075683594, 40.71343231201172, 45.775474548339844, 50.8375129699707, 55.89955520629883, 60.96159744262695, 66.02363586425781, 71.08567810058594, 76.14772033691406, 81.20976257324219, 86.27180480957031, 91.33384704589844, 96.39588928222656, 101.45793151855469, 106.51996612548828, 111.5820083618164, 116.64405059814453, 121.70609283447266, 126.76813507080078, 131.83016967773438, 136.8922119140625, 141.95425415039062, 147.01629638671875, 152.07833862304688, 157.140380859375]}, "eval/loss": 2.4603452682495117, "eval/wer": 0.35762049328333034, "eval/runtime": 877.6671, "eval/samples_per_second": 3.01, "eval/steps_per_second": 0.377} \ No newline at end of file +{"train/loss": 1.6379, "train/learning_rate": 1.8423990498812354e-05, "train/epoch": 8.41, "train/global_step": 7500, "_runtime": 48784, "_timestamp": 1646710023, "_step": 7504, "gradients/decoder.cls.predictions.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 38.0, 30.0, 12.0, 5.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 4.0, 3.0, 1.0, 2.0, 1.0, 4.0, 3.0, 5.0, 2.0, 19.0, 30.0, 30125.0, 172.0, 24.0, 10.0, 6.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-184.75, -180.35546875, -175.9609375, -171.56640625, -167.171875, -162.77734375, -158.3828125, -153.98828125, -149.59375, -145.19921875, -140.8046875, -136.41015625, -132.015625, -127.62109375, -123.2265625, -118.83203125, -114.4375, -110.04296875, -105.6484375, -101.25390625, -96.859375, -92.46484375, -88.0703125, -83.67578125, -79.28125, -74.88671875, -70.4921875, -66.09765625, -61.703125, -57.30859375, -52.9140625, -48.51953125, -44.125, -39.73046875, -35.3359375, -30.94140625, -26.546875, -22.15234375, -17.7578125, -13.36328125, -8.96875, -4.57421875, -0.1796875, 4.21484375, 8.609375, 13.00390625, 17.3984375, 21.79296875, 26.1875, 30.58203125, 34.9765625, 39.37109375, 43.765625, 48.16015625, 52.5546875, 56.94921875, 61.34375, 65.73828125, 70.1328125, 74.52734375, 78.921875, 83.31640625, 87.7109375, 92.10546875, 96.5]}, "gradients/decoder.cls.predictions.transform.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 7.0, 9.0, 7.0, 17.0, 15.0, 16.0, 24.0, 26.0, 18.0, 19.0, 32.0, 44.0, 45.0, 38.0, 44.0, 42.0, 47.0, 50.0, 45.0, 57.0, 46.0, 33.0, 40.0, 38.0, 42.0, 24.0, 31.0, 36.0, 24.0, 22.0, 16.0, 10.0, 9.0, 8.0, 6.0, 5.0, 0.0, 4.0, 3.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-98.5896224975586, -96.26017761230469, -93.93073272705078, -91.60128784179688, -89.27184295654297, -86.94239807128906, -84.61295318603516, -82.28350830078125, -79.95406341552734, -77.62461853027344, -75.29517364501953, -72.96572875976562, -70.63628387451172, -68.30683898925781, -65.9773941040039, -63.64794921875, -61.31850051879883, -58.98905563354492, -56.659610748291016, -54.33016586303711, -52.0007209777832, -49.6712760925293, -47.341827392578125, -45.01238250732422, -42.68293762207031, -40.353492736816406, -38.0240478515625, -35.694602966308594, -33.36515808105469, -31.03571319580078, -28.706266403198242, -26.376821517944336, -24.047378540039062, -21.717933654785156, -19.38848876953125, -17.059043884277344, -14.729598045349121, -12.400153160095215, -10.070707321166992, -7.741262435913086, -5.41181755065918, -3.0823724269866943, -0.752927303314209, 1.5765180587768555, 3.9059629440307617, 6.235407829284668, 8.56485366821289, 10.894298553466797, 13.223743438720703, 15.55318832397461, 17.882633209228516, 20.212078094482422, 22.541522979736328, 24.870967864990234, 27.200414657592773, 29.52985954284668, 31.859304428100586, 34.188751220703125, 36.51819610595703, 38.84764099121094, 41.177085876464844, 43.50653076171875, 45.835975646972656, 48.16542053222656, 50.49486541748047]}, "gradients/decoder.cls.predictions.transform.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 3.0, 4.0, 1.0, 4.0, 8.0, 6.0, 6.0, 7.0, 10.0, 15.0, 20.0, 14.0, 17.0, 27.0, 23.0, 28.0, 27.0, 34.0, 29.0, 35.0, 36.0, 37.0, 26.0, 31.0, 42.0, 45.0, 31.0, 42.0, 29.0, 34.0, 39.0, 41.0, 26.0, 23.0, 27.0, 27.0, 19.0, 20.0, 14.0, 20.0, 14.0, 13.0, 10.0, 8.0, 16.0, 3.0, 2.0, 5.0, 6.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-52.94499969482422, -51.063453674316406, -49.18190383911133, -47.300357818603516, -45.41880798339844, -43.537261962890625, -41.65571594238281, -39.774166107177734, -37.892616271972656, -36.011070251464844, -34.129520416259766, -32.24797439575195, -30.366424560546875, -28.484878540039062, -26.603330612182617, -24.721782684326172, -22.84023666381836, -20.958688735961914, -19.07714080810547, -17.195594787597656, -15.314045906066895, -13.43249797821045, -11.55095100402832, -9.669403076171875, -7.78785514831543, -5.906307220458984, -4.024759769439697, -2.14321231842041, -0.26166439056396484, 1.6198835372924805, 3.5014305114746094, 5.382978439331055, 7.2645263671875, 9.146074295043945, 11.02762222290039, 12.90916919708252, 14.790717124938965, 16.672264099121094, 18.55381202697754, 20.435359954833984, 22.31690788269043, 24.198455810546875, 26.08000373840332, 27.961551666259766, 29.843097686767578, 31.724647521972656, 33.60619354248047, 35.48773956298828, 37.36928939819336, 39.25083541870117, 41.13238525390625, 43.01393127441406, 44.89548110961914, 46.77702713012695, 48.65857696533203, 50.540122985839844, 52.421669006347656, 54.30321502685547, 56.18476486206055, 58.06631088256836, 59.94786071777344, 61.82940673828125, 63.71095275878906, 65.59249877929688, 67.47405242919922]}, "gradients/decoder.cls.predictions.transform.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 10.0, 4.0, 25.0, 26.0, 34.0, 75.0, 108.0, 164.0, 252.0, 359.0, 637.0, 936.0, 1393.0, 2143.0, 3381.0, 4875.0, 7100.0, 10366.0, 14597.0, 20231.0, 27437.0, 36079.0, 46093.0, 57539.0, 67906.0, 77964.0, 87831.0, 111764.0, 88175.0, 78217.0, 68250.0, 57502.0, 46304.0, 35992.0, 27674.0, 20321.0, 14680.0, 10416.0, 7275.0, 4897.0, 3327.0, 2176.0, 1463.0, 955.0, 558.0, 371.0, 255.0, 179.0, 84.0, 60.0, 41.0, 26.0, 15.0, 5.0, 10.0, 4.0, 7.0, 1.0, 2.0], "bins": [-172.125, -166.830078125, -161.53515625, -156.240234375, -150.9453125, -145.650390625, -140.35546875, -135.060546875, -129.765625, -124.470703125, -119.17578125, -113.880859375, -108.5859375, -103.291015625, -97.99609375, -92.701171875, -87.40625, -82.111328125, -76.81640625, -71.521484375, -66.2265625, -60.931640625, -55.63671875, -50.341796875, -45.046875, -39.751953125, -34.45703125, -29.162109375, -23.8671875, -18.572265625, -13.27734375, -7.982421875, -2.6875, 2.607421875, 7.90234375, 13.197265625, 18.4921875, 23.787109375, 29.08203125, 34.376953125, 39.671875, 44.966796875, 50.26171875, 55.556640625, 60.8515625, 66.146484375, 71.44140625, 76.736328125, 82.03125, 87.326171875, 92.62109375, 97.916015625, 103.2109375, 108.505859375, 113.80078125, 119.095703125, 124.390625, 129.685546875, 134.98046875, 140.275390625, 145.5703125, 150.865234375, 156.16015625, 161.455078125, 166.75]}, "gradients/decoder.cls.predictions.transform.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 3.0, 7.0, 14.0, 10.0, 21.0, 18.0, 25.0, 15.0, 23.0, 18.0, 28.0, 33.0, 27.0, 37.0, 39.0, 37.0, 30.0, 43.0, 57.0, 54.0, 49.0, 37.0, 28.0, 39.0, 37.0, 30.0, 36.0, 27.0, 32.0, 19.0, 23.0, 15.0, 16.0, 17.0, 10.0, 10.0, 10.0, 5.0, 4.0, 5.0, 3.0, 4.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-84.8125, -82.091796875, -79.37109375, -76.650390625, -73.9296875, -71.208984375, -68.48828125, -65.767578125, -63.046875, -60.326171875, -57.60546875, -54.884765625, -52.1640625, -49.443359375, -46.72265625, -44.001953125, -41.28125, -38.560546875, -35.83984375, -33.119140625, -30.3984375, -27.677734375, -24.95703125, -22.236328125, -19.515625, -16.794921875, -14.07421875, -11.353515625, -8.6328125, -5.912109375, -3.19140625, -0.470703125, 2.25, 4.970703125, 7.69140625, 10.412109375, 13.1328125, 15.853515625, 18.57421875, 21.294921875, 24.015625, 26.736328125, 29.45703125, 32.177734375, 34.8984375, 37.619140625, 40.33984375, 43.060546875, 45.78125, 48.501953125, 51.22265625, 53.943359375, 56.6640625, 59.384765625, 62.10546875, 64.826171875, 67.546875, 70.267578125, 72.98828125, 75.708984375, 78.4296875, 81.150390625, 83.87109375, 86.591796875, 89.3125]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 5.0, 3.0, 2.0, 2.0, 6.0, 6.0, 9.0, 4.0, 8.0, 9.0, 18.0, 10.0, 17.0, 27.0, 20.0, 16.0, 24.0, 32.0, 32.0, 41.0, 33.0, 50.0, 41.0, 39.0, 44.0, 37.0, 49.0, 40.0, 36.0, 41.0, 41.0, 28.0, 26.0, 25.0, 23.0, 27.0, 18.0, 17.0, 14.0, 12.0, 16.0, 12.0, 9.0, 9.0, 9.0, 4.0, 4.0, 2.0, 5.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.109832763671875, -52.39028549194336, -50.67073440551758, -48.95118713378906, -47.23163604736328, -45.512088775634766, -43.79254150390625, -42.07299041748047, -40.35343933105469, -38.63389205932617, -36.91434097290039, -35.194793701171875, -33.475242614746094, -31.755695343017578, -30.03614616394043, -28.31659698486328, -26.597049713134766, -24.877500534057617, -23.15795135498047, -21.438404083251953, -19.718852996826172, -17.999305725097656, -16.279756546020508, -14.56020736694336, -12.840658187866211, -11.121109008789062, -9.401559829711914, -7.682011604309082, -5.962462425231934, -4.242913246154785, -2.523365020751953, -0.8038158416748047, 0.9157333374023438, 2.635282278060913, 4.354831218719482, 6.074379920959473, 7.793929100036621, 9.51347827911377, 11.233026504516602, 12.95257568359375, 14.672124862670898, 16.391674041748047, 18.111223220825195, 19.830772399902344, 21.55031967163086, 23.26987075805664, 24.989418029785156, 26.708967208862305, 28.428516387939453, 30.1480655670166, 31.86761474609375, 33.587162017822266, 35.30671310424805, 37.02626037597656, 38.745811462402344, 40.46535873413086, 42.184906005859375, 43.90445327758789, 45.62400436401367, 47.34355163574219, 49.06310272216797, 50.782649993896484, 52.502197265625, 54.22174835205078, 55.94129943847656]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 8.0, 6.0, 8.0, 11.0, 12.0, 10.0, 21.0, 21.0, 23.0, 17.0, 25.0, 35.0, 25.0, 34.0, 25.0, 30.0, 30.0, 41.0, 48.0, 42.0, 35.0, 35.0, 37.0, 31.0, 39.0, 38.0, 28.0, 30.0, 30.0, 33.0, 25.0, 20.0, 27.0, 20.0, 19.0, 22.0, 12.0, 10.0, 9.0, 6.0, 6.0, 5.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-53.5904541015625, -51.90418243408203, -50.21791458129883, -48.53164291381836, -46.84537124633789, -45.15910339355469, -43.47283172607422, -41.78656005859375, -40.10028839111328, -38.41401672363281, -36.72774887084961, -35.04147720336914, -33.35520553588867, -31.668935775756836, -29.982666015625, -28.29639434814453, -26.610124588012695, -24.92385482788086, -23.23758316040039, -21.551313400268555, -19.865041732788086, -18.17877197265625, -16.49250030517578, -14.806230545043945, -13.119959831237793, -11.43368911743164, -9.747418403625488, -8.061147689819336, -6.374877452850342, -4.688607215881348, -3.0023365020751953, -1.316065788269043, 0.3702049255371094, 2.0564756393432617, 3.742746114730835, 5.429016590118408, 7.1152873039245605, 8.801557540893555, 10.487828254699707, 12.17409896850586, 13.860369682312012, 15.546640396118164, 17.23291015625, 18.91918182373047, 20.605451583862305, 22.29172134399414, 23.97799301147461, 25.664264678955078, 27.350534439086914, 29.03680419921875, 30.72307586669922, 32.40934753417969, 34.09561538696289, 35.78188705444336, 37.46815872192383, 39.15442657470703, 40.8406982421875, 42.52696990966797, 44.21323776245117, 45.89950942993164, 47.58578109741211, 49.27204895019531, 50.95832061767578, 52.64459228515625, 54.33086395263672]}, "gradients/decoder.bert.encoder.layer.23.output.dense.weight": {"_type": "histogram", "values": [4.0, 0.0, 4.0, 6.0, 6.0, 8.0, 11.0, 22.0, 36.0, 54.0, 80.0, 127.0, 200.0, 287.0, 474.0, 846.0, 1230.0, 1915.0, 2945.0, 4591.0, 7448.0, 11754.0, 19222.0, 30270.0, 49367.0, 79329.0, 126941.0, 200365.0, 309601.0, 450199.0, 588116.0, 635145.0, 546627.0, 400777.0, 268323.0, 172091.0, 108125.0, 67521.0, 41891.0, 25520.0, 15823.0, 9958.0, 6165.0, 3954.0, 2463.0, 1575.0, 1063.0, 623.0, 429.0, 257.0, 176.0, 117.0, 80.0, 45.0, 22.0, 29.0, 14.0, 12.0, 8.0, 9.0, 3.0, 0.0, 0.0, 1.0], "bins": [-67.6875, -65.5263671875, -63.365234375, -61.2041015625, -59.04296875, -56.8818359375, -54.720703125, -52.5595703125, -50.3984375, -48.2373046875, -46.076171875, -43.9150390625, -41.75390625, -39.5927734375, -37.431640625, -35.2705078125, -33.109375, -30.9482421875, -28.787109375, -26.6259765625, -24.46484375, -22.3037109375, -20.142578125, -17.9814453125, -15.8203125, -13.6591796875, -11.498046875, -9.3369140625, -7.17578125, -5.0146484375, -2.853515625, -0.6923828125, 1.46875, 3.6298828125, 5.791015625, 7.9521484375, 10.11328125, 12.2744140625, 14.435546875, 16.5966796875, 18.7578125, 20.9189453125, 23.080078125, 25.2412109375, 27.40234375, 29.5634765625, 31.724609375, 33.8857421875, 36.046875, 38.2080078125, 40.369140625, 42.5302734375, 44.69140625, 46.8525390625, 49.013671875, 51.1748046875, 53.3359375, 55.4970703125, 57.658203125, 59.8193359375, 61.98046875, 64.1416015625, 66.302734375, 68.4638671875, 70.625]}, "gradients/decoder.bert.encoder.layer.23.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 4.0, 1.0, 3.0, 3.0, 2.0, 9.0, 8.0, 13.0, 10.0, 14.0, 17.0, 21.0, 23.0, 30.0, 29.0, 34.0, 34.0, 41.0, 25.0, 37.0, 39.0, 43.0, 46.0, 47.0, 45.0, 39.0, 49.0, 37.0, 31.0, 33.0, 31.0, 33.0, 27.0, 26.0, 23.0, 18.0, 18.0, 13.0, 16.0, 13.0, 6.0, 6.0, 3.0, 6.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.5625, -44.056640625, -42.55078125, -41.044921875, -39.5390625, -38.033203125, -36.52734375, -35.021484375, -33.515625, -32.009765625, -30.50390625, -28.998046875, -27.4921875, -25.986328125, -24.48046875, -22.974609375, -21.46875, -19.962890625, -18.45703125, -16.951171875, -15.4453125, -13.939453125, -12.43359375, -10.927734375, -9.421875, -7.916015625, -6.41015625, -4.904296875, -3.3984375, -1.892578125, -0.38671875, 1.119140625, 2.625, 4.130859375, 5.63671875, 7.142578125, 8.6484375, 10.154296875, 11.66015625, 13.166015625, 14.671875, 16.177734375, 17.68359375, 19.189453125, 20.6953125, 22.201171875, 23.70703125, 25.212890625, 26.71875, 28.224609375, 29.73046875, 31.236328125, 32.7421875, 34.248046875, 35.75390625, 37.259765625, 38.765625, 40.271484375, 41.77734375, 43.283203125, 44.7890625, 46.294921875, 47.80078125, 49.306640625, 50.8125]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 15.0, 26.0, 36.0, 58.0, 98.0, 114.0, 254.0, 419.0, 739.0, 1170.0, 1915.0, 3335.0, 5685.0, 9387.0, 16166.0, 26921.0, 45970.0, 76018.0, 122962.0, 193065.0, 291067.0, 407141.0, 516534.0, 577411.0, 544352.0, 443818.0, 324793.0, 220704.0, 143147.0, 88735.0, 53801.0, 32082.0, 18991.0, 11098.0, 6609.0, 3927.0, 2233.0, 1428.0, 817.0, 491.0, 294.0, 184.0, 106.0, 59.0, 39.0, 25.0, 23.0, 10.0, 6.0, 4.0, 2.0, 2.0], "bins": [-58.65625, -57.01123046875, -55.3662109375, -53.72119140625, -52.076171875, -50.43115234375, -48.7861328125, -47.14111328125, -45.49609375, -43.85107421875, -42.2060546875, -40.56103515625, -38.916015625, -37.27099609375, -35.6259765625, -33.98095703125, -32.3359375, -30.69091796875, -29.0458984375, -27.40087890625, -25.755859375, -24.11083984375, -22.4658203125, -20.82080078125, -19.17578125, -17.53076171875, -15.8857421875, -14.24072265625, -12.595703125, -10.95068359375, -9.3056640625, -7.66064453125, -6.015625, -4.37060546875, -2.7255859375, -1.08056640625, 0.564453125, 2.20947265625, 3.8544921875, 5.49951171875, 7.14453125, 8.78955078125, 10.4345703125, 12.07958984375, 13.724609375, 15.36962890625, 17.0146484375, 18.65966796875, 20.3046875, 21.94970703125, 23.5947265625, 25.23974609375, 26.884765625, 28.52978515625, 30.1748046875, 31.81982421875, 33.46484375, 35.10986328125, 36.7548828125, 38.39990234375, 40.044921875, 41.68994140625, 43.3349609375, 44.97998046875, 46.625]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 10.0, 5.0, 8.0, 13.0, 18.0, 21.0, 33.0, 45.0, 54.0, 63.0, 91.0, 96.0, 144.0, 187.0, 189.0, 218.0, 242.0, 234.0, 248.0, 243.0, 268.0, 250.0, 232.0, 203.0, 176.0, 165.0, 124.0, 117.0, 96.0, 66.0, 56.0, 35.0, 41.0, 26.0, 13.0, 20.0, 11.0, 9.0, 4.0, 6.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.4375, -25.593017578125, -24.74853515625, -23.904052734375, -23.0595703125, -22.215087890625, -21.37060546875, -20.526123046875, -19.681640625, -18.837158203125, -17.99267578125, -17.148193359375, -16.3037109375, -15.459228515625, -14.61474609375, -13.770263671875, -12.92578125, -12.081298828125, -11.23681640625, -10.392333984375, -9.5478515625, -8.703369140625, -7.85888671875, -7.014404296875, -6.169921875, -5.325439453125, -4.48095703125, -3.636474609375, -2.7919921875, -1.947509765625, -1.10302734375, -0.258544921875, 0.5859375, 1.430419921875, 2.27490234375, 3.119384765625, 3.9638671875, 4.808349609375, 5.65283203125, 6.497314453125, 7.341796875, 8.186279296875, 9.03076171875, 9.875244140625, 10.7197265625, 11.564208984375, 12.40869140625, 13.253173828125, 14.09765625, 14.942138671875, 15.78662109375, 16.631103515625, 17.4755859375, 18.320068359375, 19.16455078125, 20.009033203125, 20.853515625, 21.697998046875, 22.54248046875, 23.386962890625, 24.2314453125, 25.075927734375, 25.92041015625, 26.764892578125, 27.609375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 4.0, 7.0, 6.0, 9.0, 11.0, 13.0, 13.0, 13.0, 21.0, 22.0, 21.0, 27.0, 31.0, 29.0, 25.0, 35.0, 43.0, 38.0, 31.0, 42.0, 40.0, 41.0, 53.0, 52.0, 49.0, 32.0, 30.0, 28.0, 28.0, 27.0, 34.0, 23.0, 23.0, 17.0, 15.0, 15.0, 9.0, 8.0, 6.0, 8.0, 4.0, 5.0, 5.0, 3.0, 2.0, 0.0, 2.0, 3.0, 0.0, 3.0, 0.0, 1.0, 3.0], "bins": [-52.2464485168457, -50.6294059753418, -49.012359619140625, -47.39531707763672, -45.77827072143555, -44.16122817993164, -42.54418182373047, -40.92713928222656, -39.310096740722656, -37.69305419921875, -36.07600784301758, -34.45896530151367, -32.8419189453125, -31.224876403808594, -29.607831954956055, -27.990787506103516, -26.373741149902344, -24.756696701049805, -23.139652252197266, -21.52260971069336, -19.905563354492188, -18.28852081298828, -16.671476364135742, -15.054431915283203, -13.437387466430664, -11.820343017578125, -10.203298568725586, -8.586255073547363, -6.969210624694824, -5.352166175842285, -3.7351226806640625, -2.1180782318115234, -0.5010337829589844, 1.1160104274749756, 2.7330546379089355, 4.350098609924316, 5.9671430587768555, 7.5841875076293945, 9.201231002807617, 10.818275451660156, 12.435319900512695, 14.052364349365234, 15.669408798217773, 17.286453247070312, 18.90349578857422, 20.52054214477539, 22.137584686279297, 23.754629135131836, 25.371673583984375, 26.988718032836914, 28.605762481689453, 30.22280502319336, 31.83985137939453, 33.45689392089844, 35.073936462402344, 36.690982818603516, 38.30802917480469, 39.925071716308594, 41.542118072509766, 43.15916061401367, 44.776206970214844, 46.39324951171875, 48.010292053222656, 49.62733840942383, 51.244380950927734]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 6.0, 3.0, 2.0, 11.0, 8.0, 16.0, 12.0, 14.0, 22.0, 23.0, 30.0, 32.0, 24.0, 20.0, 29.0, 36.0, 38.0, 51.0, 46.0, 37.0, 41.0, 46.0, 25.0, 47.0, 38.0, 47.0, 37.0, 35.0, 32.0, 30.0, 29.0, 28.0, 12.0, 19.0, 20.0, 13.0, 9.0, 11.0, 12.0, 5.0, 1.0, 3.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-56.34663772583008, -54.58415222167969, -52.82167053222656, -51.05918502807617, -49.29670333862305, -47.534217834472656, -45.77173614501953, -44.00925064086914, -42.246768951416016, -40.484283447265625, -38.7218017578125, -36.95931625366211, -35.196834564208984, -33.434349060058594, -31.67186737060547, -29.909381866455078, -28.14689826965332, -26.384414672851562, -24.621931076049805, -22.859447479248047, -21.09696388244629, -19.33448028564453, -17.57199478149414, -15.8095121383667, -14.047028541564941, -12.284544944763184, -10.522061347961426, -8.759576797485352, -6.997093677520752, -5.234609603881836, -3.472126007080078, -1.7096424102783203, 0.0528411865234375, 1.8153249025344849, 3.5778086185455322, 5.340292453765869, 7.102776050567627, 8.865260124206543, 10.6277437210083, 12.390227317810059, 14.152710914611816, 15.915194511413574, 17.67767906188965, 19.440162658691406, 21.202646255493164, 22.965129852294922, 24.72761344909668, 26.490097045898438, 28.252580642700195, 30.015064239501953, 31.77754783630371, 33.54003143310547, 35.30251693725586, 37.064998626708984, 38.827484130859375, 40.5899658203125, 42.35245132446289, 44.11493682861328, 45.877418518066406, 47.6399040222168, 49.40238571166992, 51.16487121582031, 52.92735290527344, 54.68983840942383, 56.45232009887695]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 3.0, 6.0, 2.0, 13.0, 19.0, 23.0, 48.0, 60.0, 97.0, 125.0, 212.0, 299.0, 456.0, 683.0, 937.0, 1483.0, 2086.0, 3401.0, 5321.0, 8041.0, 12287.0, 19897.0, 31296.0, 49889.0, 81316.0, 127738.0, 173978.0, 174695.0, 130790.0, 83273.0, 51188.0, 31910.0, 20259.0, 12882.0, 8175.0, 5301.0, 3517.0, 2328.0, 1482.0, 969.0, 717.0, 460.0, 290.0, 193.0, 144.0, 91.0, 63.0, 43.0, 21.0, 20.0, 14.0, 10.0, 7.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-76.0625, -73.529296875, -70.99609375, -68.462890625, -65.9296875, -63.396484375, -60.86328125, -58.330078125, -55.796875, -53.263671875, -50.73046875, -48.197265625, -45.6640625, -43.130859375, -40.59765625, -38.064453125, -35.53125, -32.998046875, -30.46484375, -27.931640625, -25.3984375, -22.865234375, -20.33203125, -17.798828125, -15.265625, -12.732421875, -10.19921875, -7.666015625, -5.1328125, -2.599609375, -0.06640625, 2.466796875, 5.0, 7.533203125, 10.06640625, 12.599609375, 15.1328125, 17.666015625, 20.19921875, 22.732421875, 25.265625, 27.798828125, 30.33203125, 32.865234375, 35.3984375, 37.931640625, 40.46484375, 42.998046875, 45.53125, 48.064453125, 50.59765625, 53.130859375, 55.6640625, 58.197265625, 60.73046875, 63.263671875, 65.796875, 68.330078125, 70.86328125, 73.396484375, 75.9296875, 78.462890625, 80.99609375, 83.529296875, 86.0625]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 1.0, 4.0, 5.0, 4.0, 9.0, 7.0, 12.0, 13.0, 22.0, 18.0, 22.0, 22.0, 26.0, 16.0, 27.0, 29.0, 28.0, 38.0, 34.0, 44.0, 46.0, 39.0, 38.0, 44.0, 45.0, 41.0, 29.0, 43.0, 26.0, 31.0, 31.0, 28.0, 31.0, 28.0, 23.0, 13.0, 16.0, 9.0, 16.0, 10.0, 4.0, 10.0, 3.0, 5.0, 2.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-45.875, -44.4375, -43.0, -41.5625, -40.125, -38.6875, -37.25, -35.8125, -34.375, -32.9375, -31.5, -30.0625, -28.625, -27.1875, -25.75, -24.3125, -22.875, -21.4375, -20.0, -18.5625, -17.125, -15.6875, -14.25, -12.8125, -11.375, -9.9375, -8.5, -7.0625, -5.625, -4.1875, -2.75, -1.3125, 0.125, 1.5625, 3.0, 4.4375, 5.875, 7.3125, 8.75, 10.1875, 11.625, 13.0625, 14.5, 15.9375, 17.375, 18.8125, 20.25, 21.6875, 23.125, 24.5625, 26.0, 27.4375, 28.875, 30.3125, 31.75, 33.1875, 34.625, 36.0625, 37.5, 38.9375, 40.375, 41.8125, 43.25, 44.6875, 46.125]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 3.0, 4.0, 2.0, 5.0, 6.0, 13.0, 21.0, 32.0, 39.0, 48.0, 84.0, 112.0, 147.0, 200.0, 308.0, 457.0, 664.0, 1015.0, 1468.0, 2189.0, 3403.0, 5330.0, 8411.0, 13663.0, 22780.0, 39208.0, 71391.0, 139218.0, 247155.0, 223172.0, 118152.0, 61702.0, 34229.0, 20196.0, 12151.0, 7604.0, 4691.0, 3073.0, 2030.0, 1317.0, 898.0, 634.0, 401.0, 266.0, 206.0, 151.0, 103.0, 65.0, 53.0, 28.0, 19.0, 17.0, 9.0, 12.0, 5.0, 4.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-103.625, -100.1572265625, -96.689453125, -93.2216796875, -89.75390625, -86.2861328125, -82.818359375, -79.3505859375, -75.8828125, -72.4150390625, -68.947265625, -65.4794921875, -62.01171875, -58.5439453125, -55.076171875, -51.6083984375, -48.140625, -44.6728515625, -41.205078125, -37.7373046875, -34.26953125, -30.8017578125, -27.333984375, -23.8662109375, -20.3984375, -16.9306640625, -13.462890625, -9.9951171875, -6.52734375, -3.0595703125, 0.408203125, 3.8759765625, 7.34375, 10.8115234375, 14.279296875, 17.7470703125, 21.21484375, 24.6826171875, 28.150390625, 31.6181640625, 35.0859375, 38.5537109375, 42.021484375, 45.4892578125, 48.95703125, 52.4248046875, 55.892578125, 59.3603515625, 62.828125, 66.2958984375, 69.763671875, 73.2314453125, 76.69921875, 80.1669921875, 83.634765625, 87.1025390625, 90.5703125, 94.0380859375, 97.505859375, 100.9736328125, 104.44140625, 107.9091796875, 111.376953125, 114.8447265625, 118.3125]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 3.0, 5.0, 4.0, 2.0, 10.0, 11.0, 15.0, 26.0, 25.0, 22.0, 21.0, 24.0, 31.0, 33.0, 46.0, 31.0, 50.0, 44.0, 40.0, 46.0, 40.0, 49.0, 47.0, 40.0, 48.0, 44.0, 34.0, 28.0, 31.0, 20.0, 25.0, 24.0, 16.0, 21.0, 11.0, 9.0, 2.0, 8.0, 7.0, 2.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-37.4375, -36.22998046875, -35.0224609375, -33.81494140625, -32.607421875, -31.39990234375, -30.1923828125, -28.98486328125, -27.77734375, -26.56982421875, -25.3623046875, -24.15478515625, -22.947265625, -21.73974609375, -20.5322265625, -19.32470703125, -18.1171875, -16.90966796875, -15.7021484375, -14.49462890625, -13.287109375, -12.07958984375, -10.8720703125, -9.66455078125, -8.45703125, -7.24951171875, -6.0419921875, -4.83447265625, -3.626953125, -2.41943359375, -1.2119140625, -0.00439453125, 1.203125, 2.41064453125, 3.6181640625, 4.82568359375, 6.033203125, 7.24072265625, 8.4482421875, 9.65576171875, 10.86328125, 12.07080078125, 13.2783203125, 14.48583984375, 15.693359375, 16.90087890625, 18.1083984375, 19.31591796875, 20.5234375, 21.73095703125, 22.9384765625, 24.14599609375, 25.353515625, 26.56103515625, 27.7685546875, 28.97607421875, 30.18359375, 31.39111328125, 32.5986328125, 33.80615234375, 35.013671875, 36.22119140625, 37.4287109375, 38.63623046875, 39.84375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 6.0, 3.0, 12.0, 14.0, 18.0, 20.0, 35.0, 53.0, 77.0, 123.0, 167.0, 258.0, 339.0, 550.0, 894.0, 1401.0, 2701.0, 5400.0, 12858.0, 40344.0, 174405.0, 527516.0, 207391.0, 46538.0, 14437.0, 5888.0, 2948.0, 1551.0, 912.0, 551.0, 365.0, 241.0, 169.0, 107.0, 84.0, 56.0, 37.0, 30.0, 11.0, 12.0, 10.0, 11.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-102.6875, -99.212890625, -95.73828125, -92.263671875, -88.7890625, -85.314453125, -81.83984375, -78.365234375, -74.890625, -71.416015625, -67.94140625, -64.466796875, -60.9921875, -57.517578125, -54.04296875, -50.568359375, -47.09375, -43.619140625, -40.14453125, -36.669921875, -33.1953125, -29.720703125, -26.24609375, -22.771484375, -19.296875, -15.822265625, -12.34765625, -8.873046875, -5.3984375, -1.923828125, 1.55078125, 5.025390625, 8.5, 11.974609375, 15.44921875, 18.923828125, 22.3984375, 25.873046875, 29.34765625, 32.822265625, 36.296875, 39.771484375, 43.24609375, 46.720703125, 50.1953125, 53.669921875, 57.14453125, 60.619140625, 64.09375, 67.568359375, 71.04296875, 74.517578125, 77.9921875, 81.466796875, 84.94140625, 88.416015625, 91.890625, 95.365234375, 98.83984375, 102.314453125, 105.7890625, 109.263671875, 112.73828125, 116.212890625, 119.6875]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 6.0, 3.0, 6.0, 11.0, 6.0, 9.0, 11.0, 30.0, 27.0, 35.0, 86.0, 137.0, 158.0, 146.0, 112.0, 67.0, 37.0, 31.0, 21.0, 10.0, 10.0, 8.0, 5.0, 8.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00617218017578125, -0.005971193313598633, -0.005770206451416016, -0.0055692195892333984, -0.005368232727050781, -0.005167245864868164, -0.004966259002685547, -0.00476527214050293, -0.0045642852783203125, -0.004363298416137695, -0.004162311553955078, -0.003961324691772461, -0.0037603378295898438, -0.0035593509674072266, -0.0033583641052246094, -0.003157377243041992, -0.002956390380859375, -0.002755403518676758, -0.0025544166564941406, -0.0023534297943115234, -0.0021524429321289062, -0.001951456069946289, -0.0017504692077636719, -0.0015494823455810547, -0.0013484954833984375, -0.0011475086212158203, -0.0009465217590332031, -0.0007455348968505859, -0.0005445480346679688, -0.00034356117248535156, -0.00014257431030273438, 5.841255187988281e-05, 0.0002593994140625, 0.0004603862762451172, 0.0006613731384277344, 0.0008623600006103516, 0.0010633468627929688, 0.001264333724975586, 0.0014653205871582031, 0.0016663074493408203, 0.0018672943115234375, 0.0020682811737060547, 0.002269268035888672, 0.002470254898071289, 0.0026712417602539062, 0.0028722286224365234, 0.0030732154846191406, 0.003274202346801758, 0.003475189208984375, 0.003676176071166992, 0.0038771629333496094, 0.0040781497955322266, 0.004279136657714844, 0.004480123519897461, 0.004681110382080078, 0.004882097244262695, 0.0050830841064453125, 0.00528407096862793, 0.005485057830810547, 0.005686044692993164, 0.005887031555175781, 0.0060880184173583984, 0.006289005279541016, 0.006489992141723633, 0.00669097900390625]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 11.0, 4.0, 13.0, 15.0, 28.0, 29.0, 39.0, 90.0, 123.0, 185.0, 289.0, 468.0, 714.0, 1193.0, 2169.0, 3946.0, 7946.0, 19047.0, 52993.0, 164292.0, 372703.0, 273114.0, 93358.0, 30938.0, 12122.0, 5626.0, 2860.0, 1650.0, 945.0, 611.0, 388.0, 189.0, 150.0, 104.0, 63.0, 43.0, 38.0, 15.0, 14.0, 7.0, 3.0, 7.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-110.125, -106.9560546875, -103.787109375, -100.6181640625, -97.44921875, -94.2802734375, -91.111328125, -87.9423828125, -84.7734375, -81.6044921875, -78.435546875, -75.2666015625, -72.09765625, -68.9287109375, -65.759765625, -62.5908203125, -59.421875, -56.2529296875, -53.083984375, -49.9150390625, -46.74609375, -43.5771484375, -40.408203125, -37.2392578125, -34.0703125, -30.9013671875, -27.732421875, -24.5634765625, -21.39453125, -18.2255859375, -15.056640625, -11.8876953125, -8.71875, -5.5498046875, -2.380859375, 0.7880859375, 3.95703125, 7.1259765625, 10.294921875, 13.4638671875, 16.6328125, 19.8017578125, 22.970703125, 26.1396484375, 29.30859375, 32.4775390625, 35.646484375, 38.8154296875, 41.984375, 45.1533203125, 48.322265625, 51.4912109375, 54.66015625, 57.8291015625, 60.998046875, 64.1669921875, 67.3359375, 70.5048828125, 73.673828125, 76.8427734375, 80.01171875, 83.1806640625, 86.349609375, 89.5185546875, 92.6875]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 5.0, 1.0, 1.0, 5.0, 5.0, 10.0, 6.0, 6.0, 9.0, 17.0, 24.0, 27.0, 41.0, 50.0, 56.0, 67.0, 97.0, 109.0, 92.0, 74.0, 66.0, 43.0, 42.0, 33.0, 33.0, 27.0, 16.0, 8.0, 10.0, 6.0, 6.0, 2.0, 2.0, 3.0, 4.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.1875, -24.33837890625, -23.4892578125, -22.64013671875, -21.791015625, -20.94189453125, -20.0927734375, -19.24365234375, -18.39453125, -17.54541015625, -16.6962890625, -15.84716796875, -14.998046875, -14.14892578125, -13.2998046875, -12.45068359375, -11.6015625, -10.75244140625, -9.9033203125, -9.05419921875, -8.205078125, -7.35595703125, -6.5068359375, -5.65771484375, -4.80859375, -3.95947265625, -3.1103515625, -2.26123046875, -1.412109375, -0.56298828125, 0.2861328125, 1.13525390625, 1.984375, 2.83349609375, 3.6826171875, 4.53173828125, 5.380859375, 6.22998046875, 7.0791015625, 7.92822265625, 8.77734375, 9.62646484375, 10.4755859375, 11.32470703125, 12.173828125, 13.02294921875, 13.8720703125, 14.72119140625, 15.5703125, 16.41943359375, 17.2685546875, 18.11767578125, 18.966796875, 19.81591796875, 20.6650390625, 21.51416015625, 22.36328125, 23.21240234375, 24.0615234375, 24.91064453125, 25.759765625, 26.60888671875, 27.4580078125, 28.30712890625, 29.15625]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 1.0, 7.0, 4.0, 4.0, 4.0, 1.0, 8.0, 13.0, 17.0, 17.0, 17.0, 27.0, 27.0, 30.0, 26.0, 25.0, 30.0, 25.0, 48.0, 43.0, 35.0, 55.0, 40.0, 34.0, 40.0, 44.0, 46.0, 38.0, 30.0, 36.0, 30.0, 40.0, 22.0, 24.0, 22.0, 23.0, 18.0, 7.0, 11.0, 10.0, 4.0, 8.0, 3.0, 4.0, 1.0, 1.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-47.84823226928711, -46.39822006225586, -44.948211669921875, -43.498199462890625, -42.048187255859375, -40.59817886352539, -39.14816665649414, -37.698158264160156, -36.248146057128906, -34.798133850097656, -33.34812545776367, -31.898113250732422, -30.448102951049805, -28.998092651367188, -27.548080444335938, -26.09807014465332, -24.648059844970703, -23.198049545288086, -21.74803924560547, -20.29802703857422, -18.8480167388916, -17.398006439208984, -15.94799518585205, -14.497983932495117, -13.0479736328125, -11.597963333129883, -10.14795207977295, -8.697940826416016, -7.247930526733398, -5.797919750213623, -4.347908973693848, -2.897897720336914, -1.4478836059570312, 0.0021271705627441406, 1.4521379470825195, 2.902148723602295, 4.35215950012207, 5.802170276641846, 7.252181053161621, 8.702192306518555, 10.152202606201172, 11.602212905883789, 13.052224159240723, 14.502235412597656, 15.952245712280273, 17.40225601196289, 18.85226821899414, 20.302278518676758, 21.752288818359375, 23.202299118041992, 24.65230941772461, 26.10232162475586, 27.552331924438477, 29.002342224121094, 30.452354431152344, 31.90236473083496, 33.35237503051758, 34.80238723754883, 36.25239562988281, 37.70240783691406, 39.15242004394531, 40.6024284362793, 42.05244064331055, 43.50244903564453, 44.95246124267578]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 2.0, 8.0, 11.0, 11.0, 15.0, 19.0, 18.0, 13.0, 25.0, 20.0, 28.0, 30.0, 25.0, 33.0, 29.0, 37.0, 54.0, 44.0, 26.0, 47.0, 42.0, 45.0, 37.0, 32.0, 39.0, 39.0, 32.0, 32.0, 36.0, 31.0, 24.0, 17.0, 16.0, 18.0, 15.0, 13.0, 6.0, 3.0, 9.0, 4.0, 2.0, 3.0, 3.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-49.483909606933594, -47.978050231933594, -46.472190856933594, -44.966331481933594, -43.46047592163086, -41.95461654663086, -40.44875717163086, -38.94289779663086, -37.437042236328125, -35.931182861328125, -34.425323486328125, -32.919464111328125, -31.41360855102539, -29.90774917602539, -28.40188980102539, -26.89603042602539, -25.39017105102539, -23.88431167602539, -22.378454208374023, -20.872594833374023, -19.366737365722656, -17.860877990722656, -16.355018615722656, -14.849160194396973, -13.343301773071289, -11.837443351745605, -10.331584930419922, -8.825725555419922, -7.319867134094238, -5.814008712768555, -4.308149337768555, -2.802290916442871, -1.2964286804199219, 0.20942997932434082, 1.7152886390686035, 3.2211475372314453, 4.727005958557129, 6.2328643798828125, 7.7387237548828125, 9.244582176208496, 10.75044059753418, 12.256299018859863, 13.762157440185547, 15.268016815185547, 16.773876190185547, 18.279733657836914, 19.785593032836914, 21.29145050048828, 22.79730987548828, 24.30316925048828, 25.80902671813965, 27.31488609313965, 28.820743560791016, 30.326602935791016, 31.832462310791016, 33.338321685791016, 34.84417724609375, 36.35003662109375, 37.85589599609375, 39.36175537109375, 40.867610931396484, 42.373470306396484, 43.879329681396484, 45.385189056396484, 46.891048431396484]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 4.0, 6.0, 4.0, 13.0, 19.0, 35.0, 46.0, 69.0, 115.0, 173.0, 263.0, 354.0, 592.0, 844.0, 1235.0, 1982.0, 2799.0, 4226.0, 6164.0, 9035.0, 13362.0, 18758.0, 26362.0, 36131.0, 48386.0, 62113.0, 76318.0, 88627.0, 97208.0, 98599.0, 93876.0, 83877.0, 70547.0, 56349.0, 43364.0, 31791.0, 23264.0, 16529.0, 11366.0, 7701.0, 5288.0, 3577.0, 2354.0, 1607.0, 1104.0, 732.0, 476.0, 337.0, 218.0, 136.0, 77.0, 57.0, 28.0, 25.0, 16.0, 13.0, 7.0, 5.0, 6.0, 1.0], "bins": [-40.9375, -39.7080078125, -38.478515625, -37.2490234375, -36.01953125, -34.7900390625, -33.560546875, -32.3310546875, -31.1015625, -29.8720703125, -28.642578125, -27.4130859375, -26.18359375, -24.9541015625, -23.724609375, -22.4951171875, -21.265625, -20.0361328125, -18.806640625, -17.5771484375, -16.34765625, -15.1181640625, -13.888671875, -12.6591796875, -11.4296875, -10.2001953125, -8.970703125, -7.7412109375, -6.51171875, -5.2822265625, -4.052734375, -2.8232421875, -1.59375, -0.3642578125, 0.865234375, 2.0947265625, 3.32421875, 4.5537109375, 5.783203125, 7.0126953125, 8.2421875, 9.4716796875, 10.701171875, 11.9306640625, 13.16015625, 14.3896484375, 15.619140625, 16.8486328125, 18.078125, 19.3076171875, 20.537109375, 21.7666015625, 22.99609375, 24.2255859375, 25.455078125, 26.6845703125, 27.9140625, 29.1435546875, 30.373046875, 31.6025390625, 32.83203125, 34.0615234375, 35.291015625, 36.5205078125, 37.75]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 7.0, 10.0, 8.0, 12.0, 18.0, 14.0, 21.0, 25.0, 22.0, 20.0, 31.0, 24.0, 32.0, 27.0, 41.0, 41.0, 36.0, 45.0, 48.0, 39.0, 51.0, 41.0, 44.0, 52.0, 30.0, 46.0, 29.0, 29.0, 22.0, 31.0, 15.0, 16.0, 19.0, 16.0, 8.0, 9.0, 7.0, 4.0, 3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-49.0625, -47.541015625, -46.01953125, -44.498046875, -42.9765625, -41.455078125, -39.93359375, -38.412109375, -36.890625, -35.369140625, -33.84765625, -32.326171875, -30.8046875, -29.283203125, -27.76171875, -26.240234375, -24.71875, -23.197265625, -21.67578125, -20.154296875, -18.6328125, -17.111328125, -15.58984375, -14.068359375, -12.546875, -11.025390625, -9.50390625, -7.982421875, -6.4609375, -4.939453125, -3.41796875, -1.896484375, -0.375, 1.146484375, 2.66796875, 4.189453125, 5.7109375, 7.232421875, 8.75390625, 10.275390625, 11.796875, 13.318359375, 14.83984375, 16.361328125, 17.8828125, 19.404296875, 20.92578125, 22.447265625, 23.96875, 25.490234375, 27.01171875, 28.533203125, 30.0546875, 31.576171875, 33.09765625, 34.619140625, 36.140625, 37.662109375, 39.18359375, 40.705078125, 42.2265625, 43.748046875, 45.26953125, 46.791015625, 48.3125]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 6.0, 10.0, 7.0, 17.0, 34.0, 69.0, 89.0, 136.0, 216.0, 356.0, 558.0, 797.0, 1312.0, 1869.0, 2958.0, 4437.0, 6553.0, 9599.0, 13836.0, 19813.0, 27833.0, 37867.0, 50341.0, 63886.0, 76330.0, 88633.0, 95609.0, 97124.0, 91998.0, 81987.0, 69448.0, 55707.0, 43182.0, 31940.0, 23086.0, 16518.0, 11230.0, 7673.0, 5336.0, 3573.0, 2249.0, 1519.0, 1018.0, 630.0, 438.0, 255.0, 175.0, 115.0, 86.0, 40.0, 21.0, 22.0, 6.0, 5.0, 6.0, 5.0, 2.0, 2.0], "bins": [-41.75, -40.4931640625, -39.236328125, -37.9794921875, -36.72265625, -35.4658203125, -34.208984375, -32.9521484375, -31.6953125, -30.4384765625, -29.181640625, -27.9248046875, -26.66796875, -25.4111328125, -24.154296875, -22.8974609375, -21.640625, -20.3837890625, -19.126953125, -17.8701171875, -16.61328125, -15.3564453125, -14.099609375, -12.8427734375, -11.5859375, -10.3291015625, -9.072265625, -7.8154296875, -6.55859375, -5.3017578125, -4.044921875, -2.7880859375, -1.53125, -0.2744140625, 0.982421875, 2.2392578125, 3.49609375, 4.7529296875, 6.009765625, 7.2666015625, 8.5234375, 9.7802734375, 11.037109375, 12.2939453125, 13.55078125, 14.8076171875, 16.064453125, 17.3212890625, 18.578125, 19.8349609375, 21.091796875, 22.3486328125, 23.60546875, 24.8623046875, 26.119140625, 27.3759765625, 28.6328125, 29.8896484375, 31.146484375, 32.4033203125, 33.66015625, 34.9169921875, 36.173828125, 37.4306640625, 38.6875]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 3.0, 8.0, 5.0, 10.0, 7.0, 9.0, 16.0, 9.0, 18.0, 20.0, 18.0, 24.0, 29.0, 28.0, 30.0, 29.0, 32.0, 37.0, 29.0, 47.0, 29.0, 29.0, 31.0, 37.0, 33.0, 47.0, 36.0, 34.0, 37.0, 25.0, 32.0, 34.0, 22.0, 20.0, 23.0, 17.0, 16.0, 15.0, 8.0, 14.0, 11.0, 5.0, 7.0, 11.0, 4.0, 5.0, 5.0, 7.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-27.65625, -26.785888671875, -25.91552734375, -25.045166015625, -24.1748046875, -23.304443359375, -22.43408203125, -21.563720703125, -20.693359375, -19.822998046875, -18.95263671875, -18.082275390625, -17.2119140625, -16.341552734375, -15.47119140625, -14.600830078125, -13.73046875, -12.860107421875, -11.98974609375, -11.119384765625, -10.2490234375, -9.378662109375, -8.50830078125, -7.637939453125, -6.767578125, -5.897216796875, -5.02685546875, -4.156494140625, -3.2861328125, -2.415771484375, -1.54541015625, -0.675048828125, 0.1953125, 1.065673828125, 1.93603515625, 2.806396484375, 3.6767578125, 4.547119140625, 5.41748046875, 6.287841796875, 7.158203125, 8.028564453125, 8.89892578125, 9.769287109375, 10.6396484375, 11.510009765625, 12.38037109375, 13.250732421875, 14.12109375, 14.991455078125, 15.86181640625, 16.732177734375, 17.6025390625, 18.472900390625, 19.34326171875, 20.213623046875, 21.083984375, 21.954345703125, 22.82470703125, 23.695068359375, 24.5654296875, 25.435791015625, 26.30615234375, 27.176513671875, 28.046875]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 5.0, 7.0, 15.0, 19.0, 27.0, 42.0, 56.0, 91.0, 161.0, 198.0, 334.0, 552.0, 813.0, 1319.0, 2192.0, 3677.0, 6190.0, 9864.0, 15910.0, 25625.0, 40412.0, 60657.0, 85116.0, 111055.0, 130686.0, 133723.0, 120799.0, 96881.0, 70602.0, 48291.0, 31646.0, 19770.0, 12305.0, 7684.0, 4415.0, 2796.0, 1678.0, 1070.0, 646.0, 453.0, 289.0, 174.0, 105.0, 83.0, 31.0, 28.0, 20.0, 17.0, 13.0, 7.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-15.109375, -14.573974609375, -14.03857421875, -13.503173828125, -12.9677734375, -12.432373046875, -11.89697265625, -11.361572265625, -10.826171875, -10.290771484375, -9.75537109375, -9.219970703125, -8.6845703125, -8.149169921875, -7.61376953125, -7.078369140625, -6.54296875, -6.007568359375, -5.47216796875, -4.936767578125, -4.4013671875, -3.865966796875, -3.33056640625, -2.795166015625, -2.259765625, -1.724365234375, -1.18896484375, -0.653564453125, -0.1181640625, 0.417236328125, 0.95263671875, 1.488037109375, 2.0234375, 2.558837890625, 3.09423828125, 3.629638671875, 4.1650390625, 4.700439453125, 5.23583984375, 5.771240234375, 6.306640625, 6.842041015625, 7.37744140625, 7.912841796875, 8.4482421875, 8.983642578125, 9.51904296875, 10.054443359375, 10.58984375, 11.125244140625, 11.66064453125, 12.196044921875, 12.7314453125, 13.266845703125, 13.80224609375, 14.337646484375, 14.873046875, 15.408447265625, 15.94384765625, 16.479248046875, 17.0146484375, 17.550048828125, 18.08544921875, 18.620849609375, 19.15625]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 3.0, 4.0, 5.0, 6.0, 6.0, 8.0, 11.0, 25.0, 15.0, 17.0, 23.0, 29.0, 30.0, 50.0, 52.0, 51.0, 52.0, 52.0, 60.0, 57.0, 55.0, 53.0, 51.0, 41.0, 46.0, 28.0, 42.0, 32.0, 21.0, 14.0, 19.0, 6.0, 7.0, 9.0, 6.0, 1.0, 3.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.0024433135986328125, -0.002374202013015747, -0.0023050904273986816, -0.002235978841781616, -0.0021668672561645508, -0.0020977556705474854, -0.00202864408493042, -0.0019595324993133545, -0.001890420913696289, -0.0018213093280792236, -0.0017521977424621582, -0.0016830861568450928, -0.0016139745712280273, -0.001544862985610962, -0.0014757513999938965, -0.001406639814376831, -0.0013375282287597656, -0.0012684166431427002, -0.0011993050575256348, -0.0011301934719085693, -0.001061081886291504, -0.0009919703006744385, -0.000922858715057373, -0.0008537471294403076, -0.0007846355438232422, -0.0007155239582061768, -0.0006464123725891113, -0.0005773007869720459, -0.0005081892013549805, -0.00043907761573791504, -0.0003699660301208496, -0.0003008544445037842, -0.00023174285888671875, -0.00016263127326965332, -9.351968765258789e-05, -2.440810203552246e-05, 4.470348358154297e-05, 0.0001138150691986084, 0.00018292665481567383, 0.00025203824043273926, 0.0003211498260498047, 0.0003902614116668701, 0.00045937299728393555, 0.000528484582901001, 0.0005975961685180664, 0.0006667077541351318, 0.0007358193397521973, 0.0008049309253692627, 0.0008740425109863281, 0.0009431540966033936, 0.001012265682220459, 0.0010813772678375244, 0.0011504888534545898, 0.0012196004390716553, 0.0012887120246887207, 0.0013578236103057861, 0.0014269351959228516, 0.001496046781539917, 0.0015651583671569824, 0.0016342699527740479, 0.0017033815383911133, 0.0017724931240081787, 0.0018416047096252441, 0.0019107162952423096, 0.001979827880859375]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 5.0, 2.0, 7.0, 2.0, 13.0, 9.0, 25.0, 25.0, 38.0, 56.0, 82.0, 143.0, 185.0, 288.0, 403.0, 596.0, 922.0, 1465.0, 2178.0, 3343.0, 5183.0, 8440.0, 13430.0, 21589.0, 33610.0, 51462.0, 74978.0, 101099.0, 124328.0, 134845.0, 128163.0, 106508.0, 79719.0, 55442.0, 36448.0, 23413.0, 14537.0, 9229.0, 5731.0, 3714.0, 2355.0, 1599.0, 988.0, 616.0, 404.0, 313.0, 217.0, 143.0, 100.0, 51.0, 38.0, 26.0, 24.0, 14.0, 11.0, 5.0, 1.0, 6.0, 0.0, 2.0, 2.0], "bins": [-16.734375, -16.220947265625, -15.70751953125, -15.194091796875, -14.6806640625, -14.167236328125, -13.65380859375, -13.140380859375, -12.626953125, -12.113525390625, -11.60009765625, -11.086669921875, -10.5732421875, -10.059814453125, -9.54638671875, -9.032958984375, -8.51953125, -8.006103515625, -7.49267578125, -6.979248046875, -6.4658203125, -5.952392578125, -5.43896484375, -4.925537109375, -4.412109375, -3.898681640625, -3.38525390625, -2.871826171875, -2.3583984375, -1.844970703125, -1.33154296875, -0.818115234375, -0.3046875, 0.208740234375, 0.72216796875, 1.235595703125, 1.7490234375, 2.262451171875, 2.77587890625, 3.289306640625, 3.802734375, 4.316162109375, 4.82958984375, 5.343017578125, 5.8564453125, 6.369873046875, 6.88330078125, 7.396728515625, 7.91015625, 8.423583984375, 8.93701171875, 9.450439453125, 9.9638671875, 10.477294921875, 10.99072265625, 11.504150390625, 12.017578125, 12.531005859375, 13.04443359375, 13.557861328125, 14.0712890625, 14.584716796875, 15.09814453125, 15.611572265625, 16.125]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 4.0, 8.0, 4.0, 10.0, 14.0, 14.0, 20.0, 21.0, 36.0, 38.0, 45.0, 46.0, 45.0, 65.0, 56.0, 37.0, 59.0, 64.0, 59.0, 46.0, 43.0, 41.0, 32.0, 39.0, 42.0, 25.0, 23.0, 12.0, 10.0, 15.0, 6.0, 3.0, 4.0, 5.0, 3.0, 2.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.85546875, -7.6187744140625, -7.382080078125, -7.1453857421875, -6.90869140625, -6.6719970703125, -6.435302734375, -6.1986083984375, -5.9619140625, -5.7252197265625, -5.488525390625, -5.2518310546875, -5.01513671875, -4.7784423828125, -4.541748046875, -4.3050537109375, -4.068359375, -3.8316650390625, -3.594970703125, -3.3582763671875, -3.12158203125, -2.8848876953125, -2.648193359375, -2.4114990234375, -2.1748046875, -1.9381103515625, -1.701416015625, -1.4647216796875, -1.22802734375, -0.9913330078125, -0.754638671875, -0.5179443359375, -0.28125, -0.0445556640625, 0.192138671875, 0.4288330078125, 0.66552734375, 0.9022216796875, 1.138916015625, 1.3756103515625, 1.6123046875, 1.8489990234375, 2.085693359375, 2.3223876953125, 2.55908203125, 2.7957763671875, 3.032470703125, 3.2691650390625, 3.505859375, 3.7425537109375, 3.979248046875, 4.2159423828125, 4.45263671875, 4.6893310546875, 4.926025390625, 5.1627197265625, 5.3994140625, 5.6361083984375, 5.872802734375, 6.1094970703125, 6.34619140625, 6.5828857421875, 6.819580078125, 7.0562744140625, 7.29296875]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 0.0, 10.0, 4.0, 10.0, 10.0, 8.0, 13.0, 13.0, 15.0, 28.0, 7.0, 21.0, 15.0, 40.0, 31.0, 30.0, 30.0, 35.0, 32.0, 43.0, 39.0, 39.0, 43.0, 34.0, 43.0, 32.0, 37.0, 40.0, 39.0, 39.0, 26.0, 24.0, 18.0, 20.0, 17.0, 17.0, 22.0, 19.0, 10.0, 12.0, 8.0, 6.0, 2.0, 5.0, 4.0, 2.0, 3.0, 3.0, 2.0, 3.0, 4.0, 0.0, 0.0, 2.0], "bins": [-42.086856842041016, -40.794960021972656, -39.50306701660156, -38.2111701965332, -36.91927719116211, -35.62738037109375, -34.335487365722656, -33.0435905456543, -31.75169563293457, -30.459800720214844, -29.167905807495117, -27.87601089477539, -26.58411407470703, -25.292221069335938, -24.000324249267578, -22.70842933654785, -21.416534423828125, -20.1246395111084, -18.832744598388672, -17.540849685668945, -16.24895477294922, -14.957058906555176, -13.665163040161133, -12.373268127441406, -11.08137321472168, -9.789478302001953, -8.497583389282227, -7.205687522888184, -5.913792610168457, -4.6218976974487305, -3.3300023078918457, -2.038106918334961, -0.7462081909179688, 0.5456869602203369, 1.8375821113586426, 3.1294772624969482, 4.421372413635254, 5.7132673263549805, 7.005162715911865, 8.29705810546875, 9.588953018188477, 10.880847930908203, 12.17274284362793, 13.464638710021973, 14.7565336227417, 16.04842758178711, 17.34032440185547, 18.632219314575195, 19.924114227294922, 21.21600914001465, 22.507904052734375, 23.7997989654541, 25.091693878173828, 26.383590698242188, 27.675485610961914, 28.96738052368164, 30.259275436401367, 31.551170349121094, 32.84306716918945, 34.13496017456055, 35.426856994628906, 36.71875, 38.01064682006836, 39.30254364013672, 40.59443664550781]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 8.0, 13.0, 6.0, 10.0, 13.0, 8.0, 13.0, 19.0, 12.0, 27.0, 31.0, 24.0, 35.0, 35.0, 42.0, 44.0, 36.0, 42.0, 39.0, 38.0, 50.0, 48.0, 52.0, 40.0, 24.0, 37.0, 35.0, 35.0, 31.0, 24.0, 22.0, 23.0, 14.0, 13.0, 14.0, 13.0, 8.0, 4.0, 3.0, 5.0, 7.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-58.25493240356445, -56.65818786621094, -55.06144332885742, -53.464698791503906, -51.867958068847656, -50.27121353149414, -48.674468994140625, -47.07772445678711, -45.480979919433594, -43.88423538208008, -42.28749084472656, -40.69074630737305, -39.09400177001953, -37.49726104736328, -35.900516510009766, -34.30377197265625, -32.707027435302734, -31.11028289794922, -29.513538360595703, -27.91679573059082, -26.320051193237305, -24.72330665588379, -23.126564025878906, -21.52981948852539, -19.933074951171875, -18.33633041381836, -16.739585876464844, -15.142843246459961, -13.546098709106445, -11.94935417175293, -10.35261058807373, -8.755867004394531, -7.159122467041016, -5.562378406524658, -3.965634346008301, -2.3688902854919434, -0.7721462249755859, 0.8245978355407715, 2.421341896057129, 4.018085479736328, 5.614830017089844, 7.211574077606201, 8.808318138122559, 10.405061721801758, 12.001806259155273, 13.598550796508789, 15.195294380187988, 16.792037963867188, 18.388782501220703, 19.98552703857422, 21.582271575927734, 23.179014205932617, 24.775758743286133, 26.37250328063965, 27.96924591064453, 29.565990447998047, 31.162734985351562, 32.75947952270508, 34.356224060058594, 35.95296859741211, 37.549713134765625, 39.146453857421875, 40.74319839477539, 42.339942932128906, 43.93668746948242]}, "gradients/decoder.bert.encoder.layer.22.output.dense.weight": {"_type": "histogram", "values": [3.0, 3.0, 4.0, 2.0, 2.0, 11.0, 7.0, 13.0, 29.0, 34.0, 62.0, 104.0, 161.0, 222.0, 370.0, 595.0, 976.0, 1451.0, 2424.0, 3887.0, 6531.0, 10429.0, 17306.0, 28355.0, 46386.0, 76422.0, 128248.0, 209125.0, 337596.0, 513991.0, 671174.0, 681434.0, 533696.0, 356481.0, 224188.0, 135712.0, 81766.0, 49235.0, 29561.0, 18142.0, 10901.0, 6501.0, 4103.0, 2452.0, 1571.0, 1000.0, 604.0, 387.0, 234.0, 152.0, 95.0, 66.0, 39.0, 19.0, 14.0, 13.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-51.09375, -49.44775390625, -47.8017578125, -46.15576171875, -44.509765625, -42.86376953125, -41.2177734375, -39.57177734375, -37.92578125, -36.27978515625, -34.6337890625, -32.98779296875, -31.341796875, -29.69580078125, -28.0498046875, -26.40380859375, -24.7578125, -23.11181640625, -21.4658203125, -19.81982421875, -18.173828125, -16.52783203125, -14.8818359375, -13.23583984375, -11.58984375, -9.94384765625, -8.2978515625, -6.65185546875, -5.005859375, -3.35986328125, -1.7138671875, -0.06787109375, 1.578125, 3.22412109375, 4.8701171875, 6.51611328125, 8.162109375, 9.80810546875, 11.4541015625, 13.10009765625, 14.74609375, 16.39208984375, 18.0380859375, 19.68408203125, 21.330078125, 22.97607421875, 24.6220703125, 26.26806640625, 27.9140625, 29.56005859375, 31.2060546875, 32.85205078125, 34.498046875, 36.14404296875, 37.7900390625, 39.43603515625, 41.08203125, 42.72802734375, 44.3740234375, 46.02001953125, 47.666015625, 49.31201171875, 50.9580078125, 52.60400390625, 54.25]}, "gradients/decoder.bert.encoder.layer.22.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 5.0, 3.0, 7.0, 11.0, 10.0, 10.0, 16.0, 11.0, 16.0, 10.0, 31.0, 19.0, 29.0, 25.0, 29.0, 38.0, 39.0, 48.0, 27.0, 43.0, 38.0, 44.0, 60.0, 34.0, 43.0, 52.0, 42.0, 34.0, 25.0, 32.0, 24.0, 21.0, 20.0, 21.0, 18.0, 16.0, 13.0, 10.0, 7.0, 8.0, 2.0, 3.0, 1.0, 6.0, 3.0, 2.0, 2.0, 1.0], "bins": [-40.625, -39.530517578125, -38.43603515625, -37.341552734375, -36.2470703125, -35.152587890625, -34.05810546875, -32.963623046875, -31.869140625, -30.774658203125, -29.68017578125, -28.585693359375, -27.4912109375, -26.396728515625, -25.30224609375, -24.207763671875, -23.11328125, -22.018798828125, -20.92431640625, -19.829833984375, -18.7353515625, -17.640869140625, -16.54638671875, -15.451904296875, -14.357421875, -13.262939453125, -12.16845703125, -11.073974609375, -9.9794921875, -8.885009765625, -7.79052734375, -6.696044921875, -5.6015625, -4.507080078125, -3.41259765625, -2.318115234375, -1.2236328125, -0.129150390625, 0.96533203125, 2.059814453125, 3.154296875, 4.248779296875, 5.34326171875, 6.437744140625, 7.5322265625, 8.626708984375, 9.72119140625, 10.815673828125, 11.91015625, 13.004638671875, 14.09912109375, 15.193603515625, 16.2880859375, 17.382568359375, 18.47705078125, 19.571533203125, 20.666015625, 21.760498046875, 22.85498046875, 23.949462890625, 25.0439453125, 26.138427734375, 27.23291015625, 28.327392578125, 29.421875]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 4.0, 13.0, 11.0, 24.0, 46.0, 72.0, 97.0, 169.0, 258.0, 416.0, 690.0, 1103.0, 1836.0, 3141.0, 5510.0, 9456.0, 15887.0, 26961.0, 46692.0, 77030.0, 126569.0, 199136.0, 301734.0, 425777.0, 540502.0, 592568.0, 545126.0, 433472.0, 308703.0, 204701.0, 129944.0, 80104.0, 47745.0, 28232.0, 16808.0, 9688.0, 5677.0, 3338.0, 2050.0, 1178.0, 717.0, 432.0, 277.0, 152.0, 84.0, 58.0, 36.0, 25.0, 15.0, 7.0, 8.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-39.96875, -38.701171875, -37.43359375, -36.166015625, -34.8984375, -33.630859375, -32.36328125, -31.095703125, -29.828125, -28.560546875, -27.29296875, -26.025390625, -24.7578125, -23.490234375, -22.22265625, -20.955078125, -19.6875, -18.419921875, -17.15234375, -15.884765625, -14.6171875, -13.349609375, -12.08203125, -10.814453125, -9.546875, -8.279296875, -7.01171875, -5.744140625, -4.4765625, -3.208984375, -1.94140625, -0.673828125, 0.59375, 1.861328125, 3.12890625, 4.396484375, 5.6640625, 6.931640625, 8.19921875, 9.466796875, 10.734375, 12.001953125, 13.26953125, 14.537109375, 15.8046875, 17.072265625, 18.33984375, 19.607421875, 20.875, 22.142578125, 23.41015625, 24.677734375, 25.9453125, 27.212890625, 28.48046875, 29.748046875, 31.015625, 32.283203125, 33.55078125, 34.818359375, 36.0859375, 37.353515625, 38.62109375, 39.888671875, 41.15625]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 5.0, 5.0, 9.0, 10.0, 15.0, 18.0, 23.0, 37.0, 37.0, 47.0, 49.0, 63.0, 86.0, 93.0, 120.0, 133.0, 135.0, 152.0, 178.0, 220.0, 210.0, 210.0, 221.0, 194.0, 201.0, 217.0, 227.0, 190.0, 149.0, 124.0, 113.0, 103.0, 94.0, 68.0, 60.0, 59.0, 43.0, 45.0, 27.0, 17.0, 14.0, 17.0, 10.0, 9.0, 9.0, 5.0, 4.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-18.6875, -18.1328125, -17.578125, -17.0234375, -16.46875, -15.9140625, -15.359375, -14.8046875, -14.25, -13.6953125, -13.140625, -12.5859375, -12.03125, -11.4765625, -10.921875, -10.3671875, -9.8125, -9.2578125, -8.703125, -8.1484375, -7.59375, -7.0390625, -6.484375, -5.9296875, -5.375, -4.8203125, -4.265625, -3.7109375, -3.15625, -2.6015625, -2.046875, -1.4921875, -0.9375, -0.3828125, 0.171875, 0.7265625, 1.28125, 1.8359375, 2.390625, 2.9453125, 3.5, 4.0546875, 4.609375, 5.1640625, 5.71875, 6.2734375, 6.828125, 7.3828125, 7.9375, 8.4921875, 9.046875, 9.6015625, 10.15625, 10.7109375, 11.265625, 11.8203125, 12.375, 12.9296875, 13.484375, 14.0390625, 14.59375, 15.1484375, 15.703125, 16.2578125, 16.8125]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 9.0, 6.0, 8.0, 7.0, 8.0, 11.0, 12.0, 14.0, 24.0, 15.0, 22.0, 51.0, 26.0, 34.0, 38.0, 23.0, 45.0, 46.0, 38.0, 46.0, 44.0, 46.0, 45.0, 33.0, 45.0, 32.0, 37.0, 33.0, 31.0, 34.0, 36.0, 20.0, 21.0, 11.0, 11.0, 9.0, 10.0, 9.0, 9.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0], "bins": [-47.67994689941406, -46.33475875854492, -44.98957061767578, -43.644386291503906, -42.299198150634766, -40.954010009765625, -39.608821868896484, -38.263633728027344, -36.91844940185547, -35.57326126098633, -34.22807312011719, -32.88288879394531, -31.537700653076172, -30.19251251220703, -28.84732437133789, -27.502138137817383, -26.156949996948242, -24.8117618560791, -23.466575622558594, -22.121387481689453, -20.776201248168945, -19.431013107299805, -18.085826873779297, -16.740638732910156, -15.395451545715332, -14.050264358520508, -12.705077171325684, -11.35988998413086, -10.014701843261719, -8.669515609741211, -7.32432746887207, -5.979140281677246, -4.633953094482422, -3.2887659072875977, -1.9435784816741943, -0.598391056060791, 0.7467961311340332, 2.0919833183288574, 3.43717098236084, 4.782358169555664, 6.127545356750488, 7.4727325439453125, 8.817919731140137, 10.163106918334961, 11.508295059204102, 12.85348129272461, 14.19866943359375, 15.543856620788574, 16.8890438079834, 18.23423194885254, 19.579418182373047, 20.924606323242188, 22.269792556762695, 23.614980697631836, 24.960166931152344, 26.305355072021484, 27.650543212890625, 28.995731353759766, 30.340917587280273, 31.686105728149414, 33.03129196166992, 34.37648010253906, 35.7216682434082, 37.066856384277344, 38.41204071044922]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 5.0, 6.0, 3.0, 7.0, 10.0, 8.0, 10.0, 19.0, 16.0, 19.0, 30.0, 28.0, 38.0, 34.0, 44.0, 59.0, 57.0, 40.0, 43.0, 40.0, 60.0, 46.0, 50.0, 47.0, 29.0, 39.0, 37.0, 32.0, 31.0, 29.0, 15.0, 16.0, 15.0, 15.0, 7.0, 6.0, 3.0, 4.0, 3.0, 8.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.05451583862305, -57.33771896362305, -55.62091827392578, -53.90412139892578, -52.187320709228516, -50.470523834228516, -48.75372314453125, -47.03692626953125, -45.320125579833984, -43.603328704833984, -41.88652801513672, -40.16973114013672, -38.45293045043945, -36.73613357543945, -35.01933288574219, -33.30253601074219, -31.585737228393555, -29.868938446044922, -28.15213966369629, -26.435340881347656, -24.718542098999023, -23.00174331665039, -21.28494644165039, -19.568145751953125, -17.851348876953125, -16.134550094604492, -14.41775131225586, -12.700952529907227, -10.984153747558594, -9.267355918884277, -7.5505571365356445, -5.833758354187012, -4.1169586181640625, -2.4001598358154297, -0.683361291885376, 1.0334372520446777, 2.7502360343933105, 4.467034339904785, 6.183833122253418, 7.900631904602051, 9.617430686950684, 11.334229469299316, 13.05102825164795, 14.767826080322266, 16.4846248626709, 18.20142364501953, 19.918222427368164, 21.635021209716797, 23.35181999206543, 25.068618774414062, 26.785417556762695, 28.502216339111328, 30.21901512145996, 31.935813903808594, 33.652610778808594, 35.36941146850586, 37.08620834350586, 38.80300521850586, 40.519805908203125, 42.236602783203125, 43.95340347290039, 45.67020034790039, 47.387001037597656, 49.103797912597656, 50.82059860229492]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 6.0, 6.0, 6.0, 12.0, 23.0, 21.0, 53.0, 60.0, 87.0, 138.0, 197.0, 321.0, 447.0, 669.0, 1007.0, 1525.0, 2241.0, 3511.0, 5507.0, 8363.0, 12873.0, 20183.0, 30674.0, 45925.0, 66058.0, 92021.0, 117101.0, 131885.0, 130848.0, 110826.0, 84863.0, 60452.0, 41655.0, 27718.0, 17894.0, 11627.0, 7462.0, 4890.0, 3252.0, 2108.0, 1308.0, 919.0, 592.0, 418.0, 258.0, 197.0, 123.0, 94.0, 50.0, 35.0, 20.0, 11.0, 8.0, 9.0, 3.0, 7.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-76.25, -73.7802734375, -71.310546875, -68.8408203125, -66.37109375, -63.9013671875, -61.431640625, -58.9619140625, -56.4921875, -54.0224609375, -51.552734375, -49.0830078125, -46.61328125, -44.1435546875, -41.673828125, -39.2041015625, -36.734375, -34.2646484375, -31.794921875, -29.3251953125, -26.85546875, -24.3857421875, -21.916015625, -19.4462890625, -16.9765625, -14.5068359375, -12.037109375, -9.5673828125, -7.09765625, -4.6279296875, -2.158203125, 0.3115234375, 2.78125, 5.2509765625, 7.720703125, 10.1904296875, 12.66015625, 15.1298828125, 17.599609375, 20.0693359375, 22.5390625, 25.0087890625, 27.478515625, 29.9482421875, 32.41796875, 34.8876953125, 37.357421875, 39.8271484375, 42.296875, 44.7666015625, 47.236328125, 49.7060546875, 52.17578125, 54.6455078125, 57.115234375, 59.5849609375, 62.0546875, 64.5244140625, 66.994140625, 69.4638671875, 71.93359375, 74.4033203125, 76.873046875, 79.3427734375, 81.8125]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 2.0, 2.0, 2.0, 2.0, 7.0, 9.0, 8.0, 14.0, 12.0, 13.0, 13.0, 27.0, 26.0, 25.0, 38.0, 38.0, 47.0, 40.0, 43.0, 46.0, 56.0, 46.0, 44.0, 40.0, 46.0, 39.0, 43.0, 34.0, 32.0, 32.0, 36.0, 26.0, 22.0, 18.0, 15.0, 14.0, 9.0, 12.0, 7.0, 6.0, 1.0, 9.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.78125, -37.67138671875, -36.5615234375, -35.45166015625, -34.341796875, -33.23193359375, -32.1220703125, -31.01220703125, -29.90234375, -28.79248046875, -27.6826171875, -26.57275390625, -25.462890625, -24.35302734375, -23.2431640625, -22.13330078125, -21.0234375, -19.91357421875, -18.8037109375, -17.69384765625, -16.583984375, -15.47412109375, -14.3642578125, -13.25439453125, -12.14453125, -11.03466796875, -9.9248046875, -8.81494140625, -7.705078125, -6.59521484375, -5.4853515625, -4.37548828125, -3.265625, -2.15576171875, -1.0458984375, 0.06396484375, 1.173828125, 2.28369140625, 3.3935546875, 4.50341796875, 5.61328125, 6.72314453125, 7.8330078125, 8.94287109375, 10.052734375, 11.16259765625, 12.2724609375, 13.38232421875, 14.4921875, 15.60205078125, 16.7119140625, 17.82177734375, 18.931640625, 20.04150390625, 21.1513671875, 22.26123046875, 23.37109375, 24.48095703125, 25.5908203125, 26.70068359375, 27.810546875, 28.92041015625, 30.0302734375, 31.14013671875, 32.25]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 7.0, 3.0, 9.0, 10.0, 10.0, 32.0, 34.0, 50.0, 87.0, 109.0, 162.0, 221.0, 334.0, 470.0, 734.0, 1050.0, 1539.0, 2203.0, 3243.0, 4901.0, 7394.0, 11344.0, 17376.0, 26985.0, 42444.0, 66733.0, 103795.0, 149501.0, 174983.0, 146980.0, 101672.0, 65806.0, 41333.0, 26726.0, 16982.0, 10958.0, 7361.0, 4839.0, 3184.0, 2239.0, 1479.0, 1019.0, 687.0, 501.0, 305.0, 226.0, 147.0, 117.0, 66.0, 55.0, 36.0, 21.0, 22.0, 19.0, 9.0, 6.0, 4.0, 2.0, 5.0, 0.0, 2.0], "bins": [-90.125, -87.26171875, -84.3984375, -81.53515625, -78.671875, -75.80859375, -72.9453125, -70.08203125, -67.21875, -64.35546875, -61.4921875, -58.62890625, -55.765625, -52.90234375, -50.0390625, -47.17578125, -44.3125, -41.44921875, -38.5859375, -35.72265625, -32.859375, -29.99609375, -27.1328125, -24.26953125, -21.40625, -18.54296875, -15.6796875, -12.81640625, -9.953125, -7.08984375, -4.2265625, -1.36328125, 1.5, 4.36328125, 7.2265625, 10.08984375, 12.953125, 15.81640625, 18.6796875, 21.54296875, 24.40625, 27.26953125, 30.1328125, 32.99609375, 35.859375, 38.72265625, 41.5859375, 44.44921875, 47.3125, 50.17578125, 53.0390625, 55.90234375, 58.765625, 61.62890625, 64.4921875, 67.35546875, 70.21875, 73.08203125, 75.9453125, 78.80859375, 81.671875, 84.53515625, 87.3984375, 90.26171875, 93.125]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 4.0, 9.0, 9.0, 8.0, 14.0, 8.0, 11.0, 24.0, 36.0, 23.0, 24.0, 41.0, 35.0, 55.0, 54.0, 56.0, 54.0, 54.0, 51.0, 51.0, 39.0, 36.0, 44.0, 30.0, 32.0, 32.0, 22.0, 23.0, 19.0, 13.0, 16.0, 9.0, 16.0, 14.0, 10.0, 7.0, 6.0, 6.0, 1.0, 0.0, 5.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.40625, -33.3271484375, -32.248046875, -31.1689453125, -30.08984375, -29.0107421875, -27.931640625, -26.8525390625, -25.7734375, -24.6943359375, -23.615234375, -22.5361328125, -21.45703125, -20.3779296875, -19.298828125, -18.2197265625, -17.140625, -16.0615234375, -14.982421875, -13.9033203125, -12.82421875, -11.7451171875, -10.666015625, -9.5869140625, -8.5078125, -7.4287109375, -6.349609375, -5.2705078125, -4.19140625, -3.1123046875, -2.033203125, -0.9541015625, 0.125, 1.2041015625, 2.283203125, 3.3623046875, 4.44140625, 5.5205078125, 6.599609375, 7.6787109375, 8.7578125, 9.8369140625, 10.916015625, 11.9951171875, 13.07421875, 14.1533203125, 15.232421875, 16.3115234375, 17.390625, 18.4697265625, 19.548828125, 20.6279296875, 21.70703125, 22.7861328125, 23.865234375, 24.9443359375, 26.0234375, 27.1025390625, 28.181640625, 29.2607421875, 30.33984375, 31.4189453125, 32.498046875, 33.5771484375, 34.65625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 3.0, 2.0, 0.0, 4.0, 10.0, 11.0, 9.0, 10.0, 20.0, 26.0, 40.0, 55.0, 60.0, 105.0, 148.0, 215.0, 310.0, 475.0, 757.0, 1200.0, 1915.0, 3130.0, 5109.0, 9308.0, 18804.0, 49264.0, 245537.0, 560406.0, 93092.0, 28316.0, 12812.0, 6815.0, 3853.0, 2377.0, 1516.0, 907.0, 617.0, 377.0, 279.0, 172.0, 136.0, 93.0, 70.0, 62.0, 35.0, 30.0, 15.0, 20.0, 12.0, 7.0, 4.0, 5.0, 5.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-229.125, -221.546875, -213.96875, -206.390625, -198.8125, -191.234375, -183.65625, -176.078125, -168.5, -160.921875, -153.34375, -145.765625, -138.1875, -130.609375, -123.03125, -115.453125, -107.875, -100.296875, -92.71875, -85.140625, -77.5625, -69.984375, -62.40625, -54.828125, -47.25, -39.671875, -32.09375, -24.515625, -16.9375, -9.359375, -1.78125, 5.796875, 13.375, 20.953125, 28.53125, 36.109375, 43.6875, 51.265625, 58.84375, 66.421875, 74.0, 81.578125, 89.15625, 96.734375, 104.3125, 111.890625, 119.46875, 127.046875, 134.625, 142.203125, 149.78125, 157.359375, 164.9375, 172.515625, 180.09375, 187.671875, 195.25, 202.828125, 210.40625, 217.984375, 225.5625, 233.140625, 240.71875, 248.296875, 255.875]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 5.0, 2.0, 2.0, 1.0, 5.0, 6.0, 6.0, 2.0, 12.0, 13.0, 18.0, 26.0, 37.0, 78.0, 113.0, 249.0, 184.0, 87.0, 45.0, 25.0, 18.0, 13.0, 7.0, 6.0, 6.0, 5.0, 7.0, 5.0, 5.0, 5.0, 4.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0269317626953125, -0.0261077880859375, -0.0252838134765625, -0.0244598388671875, -0.0236358642578125, -0.0228118896484375, -0.0219879150390625, -0.0211639404296875, -0.0203399658203125, -0.0195159912109375, -0.0186920166015625, -0.0178680419921875, -0.0170440673828125, -0.0162200927734375, -0.0153961181640625, -0.0145721435546875, -0.0137481689453125, -0.0129241943359375, -0.0121002197265625, -0.0112762451171875, -0.0104522705078125, -0.0096282958984375, -0.0088043212890625, -0.0079803466796875, -0.0071563720703125, -0.0063323974609375, -0.0055084228515625, -0.0046844482421875, -0.0038604736328125, -0.0030364990234375, -0.0022125244140625, -0.0013885498046875, -0.0005645751953125, 0.0002593994140625, 0.0010833740234375, 0.0019073486328125, 0.0027313232421875, 0.0035552978515625, 0.0043792724609375, 0.0052032470703125, 0.0060272216796875, 0.0068511962890625, 0.0076751708984375, 0.0084991455078125, 0.0093231201171875, 0.0101470947265625, 0.0109710693359375, 0.0117950439453125, 0.0126190185546875, 0.0134429931640625, 0.0142669677734375, 0.0150909423828125, 0.0159149169921875, 0.0167388916015625, 0.0175628662109375, 0.0183868408203125, 0.0192108154296875, 0.0200347900390625, 0.0208587646484375, 0.0216827392578125, 0.0225067138671875, 0.0233306884765625, 0.0241546630859375, 0.0249786376953125, 0.0258026123046875]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 5.0, 1.0, 5.0, 3.0, 6.0, 10.0, 13.0, 15.0, 15.0, 24.0, 29.0, 38.0, 57.0, 82.0, 85.0, 140.0, 187.0, 344.0, 498.0, 713.0, 1180.0, 1937.0, 3321.0, 5838.0, 10296.0, 20913.0, 54306.0, 232150.0, 503320.0, 137855.0, 37972.0, 16500.0, 8458.0, 4762.0, 2828.0, 1622.0, 1013.0, 628.0, 415.0, 248.0, 204.0, 118.0, 94.0, 75.0, 58.0, 50.0, 36.0, 33.0, 20.0, 10.0, 11.0, 10.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-154.875, -150.0859375, -145.296875, -140.5078125, -135.71875, -130.9296875, -126.140625, -121.3515625, -116.5625, -111.7734375, -106.984375, -102.1953125, -97.40625, -92.6171875, -87.828125, -83.0390625, -78.25, -73.4609375, -68.671875, -63.8828125, -59.09375, -54.3046875, -49.515625, -44.7265625, -39.9375, -35.1484375, -30.359375, -25.5703125, -20.78125, -15.9921875, -11.203125, -6.4140625, -1.625, 3.1640625, 7.953125, 12.7421875, 17.53125, 22.3203125, 27.109375, 31.8984375, 36.6875, 41.4765625, 46.265625, 51.0546875, 55.84375, 60.6328125, 65.421875, 70.2109375, 75.0, 79.7890625, 84.578125, 89.3671875, 94.15625, 98.9453125, 103.734375, 108.5234375, 113.3125, 118.1015625, 122.890625, 127.6796875, 132.46875, 137.2578125, 142.046875, 146.8359375, 151.625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 2.0, 6.0, 4.0, 8.0, 3.0, 11.0, 15.0, 29.0, 27.0, 53.0, 72.0, 119.0, 138.0, 144.0, 140.0, 83.0, 37.0, 34.0, 19.0, 7.0, 10.0, 3.0, 7.0, 7.0, 4.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.09375, -40.63623046875, -39.1787109375, -37.72119140625, -36.263671875, -34.80615234375, -33.3486328125, -31.89111328125, -30.43359375, -28.97607421875, -27.5185546875, -26.06103515625, -24.603515625, -23.14599609375, -21.6884765625, -20.23095703125, -18.7734375, -17.31591796875, -15.8583984375, -14.40087890625, -12.943359375, -11.48583984375, -10.0283203125, -8.57080078125, -7.11328125, -5.65576171875, -4.1982421875, -2.74072265625, -1.283203125, 0.17431640625, 1.6318359375, 3.08935546875, 4.546875, 6.00439453125, 7.4619140625, 8.91943359375, 10.376953125, 11.83447265625, 13.2919921875, 14.74951171875, 16.20703125, 17.66455078125, 19.1220703125, 20.57958984375, 22.037109375, 23.49462890625, 24.9521484375, 26.40966796875, 27.8671875, 29.32470703125, 30.7822265625, 32.23974609375, 33.697265625, 35.15478515625, 36.6123046875, 38.06982421875, 39.52734375, 40.98486328125, 42.4423828125, 43.89990234375, 45.357421875, 46.81494140625, 48.2724609375, 49.72998046875, 51.1875]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 1.0, 4.0, 7.0, 4.0, 7.0, 4.0, 9.0, 10.0, 8.0, 13.0, 12.0, 23.0, 19.0, 27.0, 28.0, 15.0, 29.0, 29.0, 29.0, 37.0, 32.0, 51.0, 56.0, 44.0, 42.0, 35.0, 38.0, 42.0, 34.0, 44.0, 38.0, 30.0, 26.0, 27.0, 20.0, 19.0, 19.0, 19.0, 14.0, 8.0, 10.0, 15.0, 7.0, 7.0, 4.0, 2.0, 5.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-38.12268829345703, -36.99401092529297, -35.865333557128906, -34.736656188964844, -33.60797882080078, -32.479305267333984, -31.350627899169922, -30.22195053100586, -29.093273162841797, -27.964595794677734, -26.835918426513672, -25.707242965698242, -24.57856559753418, -23.449888229370117, -22.321212768554688, -21.192535400390625, -20.063858032226562, -18.9351806640625, -17.806503295898438, -16.677827835083008, -15.549150466918945, -14.420473098754883, -13.291796684265137, -12.16312026977539, -11.034442901611328, -9.905765533447266, -8.77708911895752, -7.648412227630615, -6.519735336303711, -5.391058444976807, -4.262381553649902, -3.133704662322998, -2.0050277709960938, -0.8763508796691895, 0.25232601165771484, 1.3810029029846191, 2.5096797943115234, 3.6383566856384277, 4.767033576965332, 5.895710468292236, 7.024387359619141, 8.153064727783203, 9.28174114227295, 10.410417556762695, 11.539094924926758, 12.66777229309082, 13.796448707580566, 14.925125122070312, 16.053802490234375, 17.182479858398438, 18.3111572265625, 19.43983268737793, 20.568510055541992, 21.697187423706055, 22.825862884521484, 23.954540252685547, 25.08321762084961, 26.211894989013672, 27.340572357177734, 28.469247817993164, 29.597925186157227, 30.72660255432129, 31.85527801513672, 32.98395538330078, 34.112632751464844]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 6.0, 6.0, 5.0, 9.0, 6.0, 11.0, 16.0, 11.0, 15.0, 26.0, 20.0, 23.0, 29.0, 30.0, 37.0, 27.0, 37.0, 36.0, 57.0, 40.0, 43.0, 33.0, 42.0, 37.0, 45.0, 36.0, 35.0, 30.0, 36.0, 33.0, 28.0, 21.0, 22.0, 19.0, 13.0, 14.0, 11.0, 8.0, 14.0, 6.0, 7.0, 5.0, 6.0, 7.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.17087936401367, -41.873294830322266, -40.57571029663086, -39.27812194824219, -37.98053741455078, -36.682952880859375, -35.38536834716797, -34.08778381347656, -32.790199279785156, -31.49261474609375, -30.19502830505371, -28.897443771362305, -27.5998592376709, -26.30227279663086, -25.004688262939453, -23.707103729248047, -22.409517288208008, -21.1119327545166, -19.814346313476562, -18.516761779785156, -17.21917724609375, -15.921591758728027, -14.624006271362305, -13.326421737670898, -12.028836250305176, -10.731250762939453, -9.433666229248047, -8.136080741882324, -6.83849573135376, -5.540910720825195, -4.243325233459473, -2.9457406997680664, -1.6481552124023438, -0.35057008266448975, 0.9470150470733643, 2.244600296020508, 3.5421853065490723, 4.839770317077637, 6.137355804443359, 7.434940338134766, 8.732525825500488, 10.030111312866211, 11.327695846557617, 12.62528133392334, 13.922866821289062, 15.220451354980469, 16.518035888671875, 17.81562042236328, 19.11320686340332, 20.410791397094727, 21.708377838134766, 23.005962371826172, 24.303546905517578, 25.601131439208984, 26.898717880249023, 28.19630241394043, 29.49388885498047, 30.791473388671875, 32.08905792236328, 33.38664245605469, 34.68423080444336, 35.981815338134766, 37.27939987182617, 38.57698440551758, 39.874568939208984]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 7.0, 8.0, 11.0, 16.0, 43.0, 67.0, 100.0, 143.0, 210.0, 368.0, 535.0, 830.0, 1268.0, 2081.0, 3343.0, 5485.0, 8729.0, 13417.0, 20871.0, 32038.0, 47567.0, 68939.0, 93928.0, 118754.0, 133239.0, 128714.0, 109672.0, 83704.0, 59499.0, 40590.0, 26528.0, 17427.0, 11077.0, 7131.0, 4478.0, 2888.0, 1840.0, 1098.0, 709.0, 457.0, 268.0, 169.0, 110.0, 76.0, 43.0, 17.0, 30.0, 18.0, 10.0, 10.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-40.65625, -39.41650390625, -38.1767578125, -36.93701171875, -35.697265625, -34.45751953125, -33.2177734375, -31.97802734375, -30.73828125, -29.49853515625, -28.2587890625, -27.01904296875, -25.779296875, -24.53955078125, -23.2998046875, -22.06005859375, -20.8203125, -19.58056640625, -18.3408203125, -17.10107421875, -15.861328125, -14.62158203125, -13.3818359375, -12.14208984375, -10.90234375, -9.66259765625, -8.4228515625, -7.18310546875, -5.943359375, -4.70361328125, -3.4638671875, -2.22412109375, -0.984375, 0.25537109375, 1.4951171875, 2.73486328125, 3.974609375, 5.21435546875, 6.4541015625, 7.69384765625, 8.93359375, 10.17333984375, 11.4130859375, 12.65283203125, 13.892578125, 15.13232421875, 16.3720703125, 17.61181640625, 18.8515625, 20.09130859375, 21.3310546875, 22.57080078125, 23.810546875, 25.05029296875, 26.2900390625, 27.52978515625, 28.76953125, 30.00927734375, 31.2490234375, 32.48876953125, 33.728515625, 34.96826171875, 36.2080078125, 37.44775390625, 38.6875]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 3.0, 4.0, 1.0, 6.0, 4.0, 4.0, 5.0, 9.0, 8.0, 9.0, 8.0, 17.0, 8.0, 20.0, 16.0, 16.0, 21.0, 27.0, 29.0, 39.0, 32.0, 34.0, 39.0, 43.0, 38.0, 44.0, 40.0, 36.0, 37.0, 48.0, 33.0, 32.0, 39.0, 34.0, 32.0, 28.0, 23.0, 25.0, 19.0, 16.0, 14.0, 5.0, 10.0, 9.0, 12.0, 6.0, 6.0, 8.0, 4.0, 5.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.8125, -33.67333984375, -32.5341796875, -31.39501953125, -30.255859375, -29.11669921875, -27.9775390625, -26.83837890625, -25.69921875, -24.56005859375, -23.4208984375, -22.28173828125, -21.142578125, -20.00341796875, -18.8642578125, -17.72509765625, -16.5859375, -15.44677734375, -14.3076171875, -13.16845703125, -12.029296875, -10.89013671875, -9.7509765625, -8.61181640625, -7.47265625, -6.33349609375, -5.1943359375, -4.05517578125, -2.916015625, -1.77685546875, -0.6376953125, 0.50146484375, 1.640625, 2.77978515625, 3.9189453125, 5.05810546875, 6.197265625, 7.33642578125, 8.4755859375, 9.61474609375, 10.75390625, 11.89306640625, 13.0322265625, 14.17138671875, 15.310546875, 16.44970703125, 17.5888671875, 18.72802734375, 19.8671875, 21.00634765625, 22.1455078125, 23.28466796875, 24.423828125, 25.56298828125, 26.7021484375, 27.84130859375, 28.98046875, 30.11962890625, 31.2587890625, 32.39794921875, 33.537109375, 34.67626953125, 35.8154296875, 36.95458984375, 38.09375]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 2.0, 5.0, 3.0, 11.0, 17.0, 39.0, 36.0, 62.0, 72.0, 122.0, 164.0, 282.0, 428.0, 668.0, 948.0, 1495.0, 2425.0, 3888.0, 6124.0, 9848.0, 16087.0, 25477.0, 41435.0, 64684.0, 96704.0, 132190.0, 154375.0, 147142.0, 117589.0, 82336.0, 53832.0, 33945.0, 21146.0, 13017.0, 8030.0, 5036.0, 3226.0, 2042.0, 1304.0, 816.0, 527.0, 325.0, 245.0, 123.0, 119.0, 48.0, 48.0, 35.0, 12.0, 14.0, 9.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-49.6875, -48.07373046875, -46.4599609375, -44.84619140625, -43.232421875, -41.61865234375, -40.0048828125, -38.39111328125, -36.77734375, -35.16357421875, -33.5498046875, -31.93603515625, -30.322265625, -28.70849609375, -27.0947265625, -25.48095703125, -23.8671875, -22.25341796875, -20.6396484375, -19.02587890625, -17.412109375, -15.79833984375, -14.1845703125, -12.57080078125, -10.95703125, -9.34326171875, -7.7294921875, -6.11572265625, -4.501953125, -2.88818359375, -1.2744140625, 0.33935546875, 1.953125, 3.56689453125, 5.1806640625, 6.79443359375, 8.408203125, 10.02197265625, 11.6357421875, 13.24951171875, 14.86328125, 16.47705078125, 18.0908203125, 19.70458984375, 21.318359375, 22.93212890625, 24.5458984375, 26.15966796875, 27.7734375, 29.38720703125, 31.0009765625, 32.61474609375, 34.228515625, 35.84228515625, 37.4560546875, 39.06982421875, 40.68359375, 42.29736328125, 43.9111328125, 45.52490234375, 47.138671875, 48.75244140625, 50.3662109375, 51.97998046875, 53.59375]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 3.0, 2.0, 8.0, 6.0, 10.0, 8.0, 13.0, 8.0, 13.0, 15.0, 14.0, 18.0, 24.0, 21.0, 28.0, 32.0, 35.0, 33.0, 32.0, 33.0, 36.0, 36.0, 44.0, 25.0, 33.0, 37.0, 26.0, 26.0, 30.0, 42.0, 35.0, 36.0, 26.0, 25.0, 19.0, 24.0, 23.0, 22.0, 16.0, 19.0, 13.0, 9.0, 10.0, 7.0, 5.0, 2.0, 4.0, 3.0, 4.0, 6.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-29.1875, -28.245361328125, -27.30322265625, -26.361083984375, -25.4189453125, -24.476806640625, -23.53466796875, -22.592529296875, -21.650390625, -20.708251953125, -19.76611328125, -18.823974609375, -17.8818359375, -16.939697265625, -15.99755859375, -15.055419921875, -14.11328125, -13.171142578125, -12.22900390625, -11.286865234375, -10.3447265625, -9.402587890625, -8.46044921875, -7.518310546875, -6.576171875, -5.634033203125, -4.69189453125, -3.749755859375, -2.8076171875, -1.865478515625, -0.92333984375, 0.018798828125, 0.9609375, 1.903076171875, 2.84521484375, 3.787353515625, 4.7294921875, 5.671630859375, 6.61376953125, 7.555908203125, 8.498046875, 9.440185546875, 10.38232421875, 11.324462890625, 12.2666015625, 13.208740234375, 14.15087890625, 15.093017578125, 16.03515625, 16.977294921875, 17.91943359375, 18.861572265625, 19.8037109375, 20.745849609375, 21.68798828125, 22.630126953125, 23.572265625, 24.514404296875, 25.45654296875, 26.398681640625, 27.3408203125, 28.282958984375, 29.22509765625, 30.167236328125, 31.109375]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 3.0, 5.0, 5.0, 7.0, 12.0, 8.0, 17.0, 15.0, 39.0, 53.0, 73.0, 162.0, 247.0, 458.0, 762.0, 1312.0, 2303.0, 3946.0, 7176.0, 13656.0, 27950.0, 60659.0, 141105.0, 288252.0, 268641.0, 124656.0, 54262.0, 25063.0, 12608.0, 6632.0, 3596.0, 1996.0, 1191.0, 660.0, 357.0, 234.0, 151.0, 110.0, 63.0, 41.0, 28.0, 16.0, 13.0, 6.0, 4.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-77.8125, -75.0263671875, -72.240234375, -69.4541015625, -66.66796875, -63.8818359375, -61.095703125, -58.3095703125, -55.5234375, -52.7373046875, -49.951171875, -47.1650390625, -44.37890625, -41.5927734375, -38.806640625, -36.0205078125, -33.234375, -30.4482421875, -27.662109375, -24.8759765625, -22.08984375, -19.3037109375, -16.517578125, -13.7314453125, -10.9453125, -8.1591796875, -5.373046875, -2.5869140625, 0.19921875, 2.9853515625, 5.771484375, 8.5576171875, 11.34375, 14.1298828125, 16.916015625, 19.7021484375, 22.48828125, 25.2744140625, 28.060546875, 30.8466796875, 33.6328125, 36.4189453125, 39.205078125, 41.9912109375, 44.77734375, 47.5634765625, 50.349609375, 53.1357421875, 55.921875, 58.7080078125, 61.494140625, 64.2802734375, 67.06640625, 69.8525390625, 72.638671875, 75.4248046875, 78.2109375, 80.9970703125, 83.783203125, 86.5693359375, 89.35546875, 92.1416015625, 94.927734375, 97.7138671875, 100.5]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 9.0, 10.0, 8.0, 11.0, 12.0, 26.0, 19.0, 38.0, 56.0, 72.0, 118.0, 115.0, 128.0, 98.0, 82.0, 57.0, 41.0, 25.0, 22.0, 15.0, 9.0, 8.0, 7.0, 9.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01080322265625, -0.010485291481018066, -0.010167360305786133, -0.0098494291305542, -0.009531497955322266, -0.009213566780090332, -0.008895635604858398, -0.008577704429626465, -0.008259773254394531, -0.007941842079162598, -0.007623910903930664, -0.0073059797286987305, -0.006988048553466797, -0.006670117378234863, -0.00635218620300293, -0.006034255027770996, -0.0057163238525390625, -0.005398392677307129, -0.005080461502075195, -0.004762530326843262, -0.004444599151611328, -0.0041266679763793945, -0.003808736801147461, -0.0034908056259155273, -0.0031728744506835938, -0.00285494327545166, -0.0025370121002197266, -0.002219080924987793, -0.0019011497497558594, -0.0015832185745239258, -0.0012652873992919922, -0.0009473562240600586, -0.000629425048828125, -0.0003114938735961914, 6.4373016357421875e-06, 0.0003243684768676758, 0.0006422996520996094, 0.000960230827331543, 0.0012781620025634766, 0.0015960931777954102, 0.0019140243530273438, 0.0022319555282592773, 0.002549886703491211, 0.0028678178787231445, 0.003185749053955078, 0.0035036802291870117, 0.0038216114044189453, 0.004139542579650879, 0.0044574737548828125, 0.004775404930114746, 0.00509333610534668, 0.005411267280578613, 0.005729198455810547, 0.0060471296310424805, 0.006365060806274414, 0.006682991981506348, 0.007000923156738281, 0.007318854331970215, 0.0076367855072021484, 0.007954716682434082, 0.008272647857666016, 0.00859057903289795, 0.008908510208129883, 0.009226441383361816, 0.00954437255859375]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 5.0, 10.0, 15.0, 20.0, 21.0, 35.0, 54.0, 87.0, 121.0, 175.0, 265.0, 407.0, 500.0, 889.0, 1311.0, 2162.0, 3348.0, 5500.0, 9192.0, 16093.0, 28831.0, 53235.0, 97763.0, 167476.0, 218424.0, 186226.0, 114077.0, 62559.0, 33630.0, 18642.0, 10578.0, 6267.0, 3852.0, 2362.0, 1478.0, 1006.0, 636.0, 430.0, 277.0, 202.0, 127.0, 93.0, 43.0, 45.0, 31.0, 18.0, 14.0, 13.0, 1.0, 4.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 3.0], "bins": [-54.78125, -53.04931640625, -51.3173828125, -49.58544921875, -47.853515625, -46.12158203125, -44.3896484375, -42.65771484375, -40.92578125, -39.19384765625, -37.4619140625, -35.72998046875, -33.998046875, -32.26611328125, -30.5341796875, -28.80224609375, -27.0703125, -25.33837890625, -23.6064453125, -21.87451171875, -20.142578125, -18.41064453125, -16.6787109375, -14.94677734375, -13.21484375, -11.48291015625, -9.7509765625, -8.01904296875, -6.287109375, -4.55517578125, -2.8232421875, -1.09130859375, 0.640625, 2.37255859375, 4.1044921875, 5.83642578125, 7.568359375, 9.30029296875, 11.0322265625, 12.76416015625, 14.49609375, 16.22802734375, 17.9599609375, 19.69189453125, 21.423828125, 23.15576171875, 24.8876953125, 26.61962890625, 28.3515625, 30.08349609375, 31.8154296875, 33.54736328125, 35.279296875, 37.01123046875, 38.7431640625, 40.47509765625, 42.20703125, 43.93896484375, 45.6708984375, 47.40283203125, 49.134765625, 50.86669921875, 52.5986328125, 54.33056640625, 56.0625]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 7.0, 4.0, 9.0, 7.0, 9.0, 6.0, 9.0, 15.0, 21.0, 17.0, 26.0, 23.0, 28.0, 39.0, 32.0, 44.0, 52.0, 65.0, 46.0, 62.0, 66.0, 51.0, 55.0, 58.0, 33.0, 32.0, 22.0, 23.0, 29.0, 23.0, 20.0, 6.0, 10.0, 11.0, 9.0, 5.0, 4.0, 7.0, 2.0, 3.0, 1.0, 1.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0], "bins": [-15.84375, -15.30517578125, -14.7666015625, -14.22802734375, -13.689453125, -13.15087890625, -12.6123046875, -12.07373046875, -11.53515625, -10.99658203125, -10.4580078125, -9.91943359375, -9.380859375, -8.84228515625, -8.3037109375, -7.76513671875, -7.2265625, -6.68798828125, -6.1494140625, -5.61083984375, -5.072265625, -4.53369140625, -3.9951171875, -3.45654296875, -2.91796875, -2.37939453125, -1.8408203125, -1.30224609375, -0.763671875, -0.22509765625, 0.3134765625, 0.85205078125, 1.390625, 1.92919921875, 2.4677734375, 3.00634765625, 3.544921875, 4.08349609375, 4.6220703125, 5.16064453125, 5.69921875, 6.23779296875, 6.7763671875, 7.31494140625, 7.853515625, 8.39208984375, 8.9306640625, 9.46923828125, 10.0078125, 10.54638671875, 11.0849609375, 11.62353515625, 12.162109375, 12.70068359375, 13.2392578125, 13.77783203125, 14.31640625, 14.85498046875, 15.3935546875, 15.93212890625, 16.470703125, 17.00927734375, 17.5478515625, 18.08642578125, 18.625]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 4.0, 3.0, 6.0, 5.0, 11.0, 8.0, 9.0, 8.0, 13.0, 14.0, 16.0, 24.0, 27.0, 27.0, 36.0, 33.0, 39.0, 49.0, 48.0, 47.0, 58.0, 57.0, 51.0, 41.0, 38.0, 51.0, 34.0, 31.0, 35.0, 31.0, 23.0, 21.0, 21.0, 18.0, 15.0, 10.0, 11.0, 14.0, 5.0, 2.0, 2.0, 5.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-48.93859100341797, -47.61852264404297, -46.298458099365234, -44.978389739990234, -43.658321380615234, -42.3382568359375, -41.0181884765625, -39.6981201171875, -38.378055572509766, -37.057987213134766, -35.73792266845703, -34.41785430908203, -33.09778594970703, -31.777721405029297, -30.457653045654297, -29.13758659362793, -27.81751823425293, -26.497451782226562, -25.177383422851562, -23.857316970825195, -22.537250518798828, -21.217182159423828, -19.89711570739746, -18.577049255371094, -17.256980895996094, -15.93691349029541, -14.616847038269043, -13.29677963256836, -11.976713180541992, -10.656645774841309, -9.336578369140625, -8.016511917114258, -6.696445465087891, -5.376378536224365, -4.05631160736084, -2.7362442016601562, -1.4161772727966309, -0.09611034393310547, 1.2239570617675781, 2.5440235137939453, 3.864090919494629, 5.184157848358154, 6.50422477722168, 7.824292182922363, 9.144359588623047, 10.464426040649414, 11.784493446350098, 13.104559898376465, 14.424627304077148, 15.744694709777832, 17.064762115478516, 18.384828567504883, 19.70489501953125, 21.02496337890625, 22.345029830932617, 23.665096282958984, 24.985164642333984, 26.30523109436035, 27.62529945373535, 28.94536590576172, 30.265432357788086, 31.585498809814453, 32.90556716918945, 34.22563171386719, 35.54570007324219]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 9.0, 6.0, 4.0, 3.0, 4.0, 10.0, 5.0, 11.0, 13.0, 16.0, 13.0, 15.0, 19.0, 26.0, 21.0, 29.0, 30.0, 35.0, 28.0, 33.0, 35.0, 36.0, 40.0, 44.0, 34.0, 48.0, 42.0, 43.0, 42.0, 35.0, 24.0, 28.0, 33.0, 27.0, 29.0, 33.0, 18.0, 19.0, 17.0, 11.0, 8.0, 7.0, 6.0, 4.0, 2.0, 6.0, 4.0, 2.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-44.25529861450195, -42.876625061035156, -41.49795150756836, -40.11927795410156, -38.74060821533203, -37.361934661865234, -35.98326110839844, -34.60458755493164, -33.225914001464844, -31.847240447998047, -30.46856689453125, -29.089895248413086, -27.71122169494629, -26.332548141479492, -24.953876495361328, -23.57520294189453, -22.196529388427734, -20.817855834960938, -19.43918228149414, -18.060510635375977, -16.68183708190918, -15.303163528442383, -13.924490928649902, -12.545818328857422, -11.167144775390625, -9.788471221923828, -8.409798622131348, -7.031125545501709, -5.65245246887207, -4.273779392242432, -2.895106315612793, -1.5164337158203125, -0.13775634765625, 1.2409167289733887, 2.6195898056030273, 3.998262882232666, 5.376935958862305, 6.755609035491943, 8.134282112121582, 9.512954711914062, 10.89162826538086, 12.270301818847656, 13.648974418640137, 15.027647018432617, 16.406320571899414, 17.78499412536621, 19.163665771484375, 20.542339324951172, 21.92101287841797, 23.299686431884766, 24.678359985351562, 26.057031631469727, 27.435705184936523, 28.81437873840332, 30.193050384521484, 31.57172393798828, 32.95039749145508, 34.329071044921875, 35.70774459838867, 37.08641815185547, 38.465087890625, 39.8437614440918, 41.222434997558594, 42.60110855102539, 43.97978210449219]}, "gradients/decoder.bert.encoder.layer.21.output.dense.weight": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 9.0, 11.0, 17.0, 18.0, 46.0, 57.0, 98.0, 161.0, 221.0, 380.0, 569.0, 847.0, 1502.0, 2150.0, 3361.0, 5321.0, 8639.0, 13993.0, 22869.0, 38204.0, 63980.0, 111489.0, 189345.0, 318325.0, 492108.0, 654207.0, 695152.0, 581064.0, 399426.0, 244820.0, 142485.0, 82469.0, 48044.0, 28412.0, 17145.0, 10351.0, 6374.0, 3952.0, 2514.0, 1543.0, 998.0, 584.0, 381.0, 234.0, 136.0, 96.0, 56.0, 53.0, 29.0, 14.0, 14.0, 9.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-29.5, -28.4912109375, -27.482421875, -26.4736328125, -25.46484375, -24.4560546875, -23.447265625, -22.4384765625, -21.4296875, -20.4208984375, -19.412109375, -18.4033203125, -17.39453125, -16.3857421875, -15.376953125, -14.3681640625, -13.359375, -12.3505859375, -11.341796875, -10.3330078125, -9.32421875, -8.3154296875, -7.306640625, -6.2978515625, -5.2890625, -4.2802734375, -3.271484375, -2.2626953125, -1.25390625, -0.2451171875, 0.763671875, 1.7724609375, 2.78125, 3.7900390625, 4.798828125, 5.8076171875, 6.81640625, 7.8251953125, 8.833984375, 9.8427734375, 10.8515625, 11.8603515625, 12.869140625, 13.8779296875, 14.88671875, 15.8955078125, 16.904296875, 17.9130859375, 18.921875, 19.9306640625, 20.939453125, 21.9482421875, 22.95703125, 23.9658203125, 24.974609375, 25.9833984375, 26.9921875, 28.0009765625, 29.009765625, 30.0185546875, 31.02734375, 32.0361328125, 33.044921875, 34.0537109375, 35.0625]}, "gradients/decoder.bert.encoder.layer.21.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 3.0, 3.0, 12.0, 12.0, 11.0, 7.0, 15.0, 11.0, 13.0, 17.0, 12.0, 28.0, 16.0, 24.0, 35.0, 27.0, 30.0, 31.0, 33.0, 42.0, 32.0, 41.0, 48.0, 38.0, 49.0, 41.0, 39.0, 42.0, 32.0, 42.0, 36.0, 26.0, 25.0, 19.0, 20.0, 17.0, 14.0, 8.0, 11.0, 9.0, 9.0, 4.0, 6.0, 4.0, 3.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-32.03125, -31.046142578125, -30.06103515625, -29.075927734375, -28.0908203125, -27.105712890625, -26.12060546875, -25.135498046875, -24.150390625, -23.165283203125, -22.18017578125, -21.195068359375, -20.2099609375, -19.224853515625, -18.23974609375, -17.254638671875, -16.26953125, -15.284423828125, -14.29931640625, -13.314208984375, -12.3291015625, -11.343994140625, -10.35888671875, -9.373779296875, -8.388671875, -7.403564453125, -6.41845703125, -5.433349609375, -4.4482421875, -3.463134765625, -2.47802734375, -1.492919921875, -0.5078125, 0.477294921875, 1.46240234375, 2.447509765625, 3.4326171875, 4.417724609375, 5.40283203125, 6.387939453125, 7.373046875, 8.358154296875, 9.34326171875, 10.328369140625, 11.3134765625, 12.298583984375, 13.28369140625, 14.268798828125, 15.25390625, 16.239013671875, 17.22412109375, 18.209228515625, 19.1943359375, 20.179443359375, 21.16455078125, 22.149658203125, 23.134765625, 24.119873046875, 25.10498046875, 26.090087890625, 27.0751953125, 28.060302734375, 29.04541015625, 30.030517578125, 31.015625]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 5.0, 3.0, 12.0, 5.0, 20.0, 21.0, 49.0, 61.0, 110.0, 133.0, 232.0, 343.0, 531.0, 809.0, 1422.0, 2251.0, 3559.0, 6007.0, 9805.0, 16358.0, 27565.0, 46567.0, 79256.0, 133870.0, 222727.0, 354968.0, 519008.0, 652719.0, 656145.0, 528263.0, 362655.0, 228872.0, 138571.0, 81516.0, 47978.0, 28516.0, 17006.0, 10081.0, 6113.0, 3815.0, 2347.0, 1448.0, 929.0, 586.0, 368.0, 245.0, 174.0, 88.0, 53.0, 43.0, 23.0, 15.0, 16.0, 1.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0], "bins": [-33.9375, -32.84375, -31.75, -30.65625, -29.5625, -28.46875, -27.375, -26.28125, -25.1875, -24.09375, -23.0, -21.90625, -20.8125, -19.71875, -18.625, -17.53125, -16.4375, -15.34375, -14.25, -13.15625, -12.0625, -10.96875, -9.875, -8.78125, -7.6875, -6.59375, -5.5, -4.40625, -3.3125, -2.21875, -1.125, -0.03125, 1.0625, 2.15625, 3.25, 4.34375, 5.4375, 6.53125, 7.625, 8.71875, 9.8125, 10.90625, 12.0, 13.09375, 14.1875, 15.28125, 16.375, 17.46875, 18.5625, 19.65625, 20.75, 21.84375, 22.9375, 24.03125, 25.125, 26.21875, 27.3125, 28.40625, 29.5, 30.59375, 31.6875, 32.78125, 33.875, 34.96875, 36.0625]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 3.0, 7.0, 8.0, 4.0, 9.0, 17.0, 25.0, 23.0, 35.0, 35.0, 51.0, 57.0, 80.0, 96.0, 101.0, 151.0, 174.0, 168.0, 201.0, 231.0, 266.0, 229.0, 282.0, 251.0, 242.0, 230.0, 203.0, 165.0, 175.0, 122.0, 92.0, 82.0, 67.0, 39.0, 42.0, 28.0, 25.0, 16.0, 11.0, 12.0, 7.0, 4.0, 2.0, 2.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-15.9609375, -15.4556884765625, -14.950439453125, -14.4451904296875, -13.93994140625, -13.4346923828125, -12.929443359375, -12.4241943359375, -11.9189453125, -11.4136962890625, -10.908447265625, -10.4031982421875, -9.89794921875, -9.3927001953125, -8.887451171875, -8.3822021484375, -7.876953125, -7.3717041015625, -6.866455078125, -6.3612060546875, -5.85595703125, -5.3507080078125, -4.845458984375, -4.3402099609375, -3.8349609375, -3.3297119140625, -2.824462890625, -2.3192138671875, -1.81396484375, -1.3087158203125, -0.803466796875, -0.2982177734375, 0.20703125, 0.7122802734375, 1.217529296875, 1.7227783203125, 2.22802734375, 2.7332763671875, 3.238525390625, 3.7437744140625, 4.2490234375, 4.7542724609375, 5.259521484375, 5.7647705078125, 6.27001953125, 6.7752685546875, 7.280517578125, 7.7857666015625, 8.291015625, 8.7962646484375, 9.301513671875, 9.8067626953125, 10.31201171875, 10.8172607421875, 11.322509765625, 11.8277587890625, 12.3330078125, 12.8382568359375, 13.343505859375, 13.8487548828125, 14.35400390625, 14.8592529296875, 15.364501953125, 15.8697509765625, 16.375]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 6.0, 2.0, 3.0, 5.0, 7.0, 11.0, 18.0, 15.0, 16.0, 18.0, 24.0, 23.0, 29.0, 33.0, 40.0, 49.0, 36.0, 43.0, 53.0, 50.0, 41.0, 61.0, 48.0, 52.0, 49.0, 40.0, 28.0, 30.0, 35.0, 32.0, 15.0, 15.0, 20.0, 14.0, 12.0, 5.0, 8.0, 8.0, 3.0, 4.0, 5.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.03864288330078, -37.804527282714844, -36.57040786743164, -35.3362922668457, -34.102176666259766, -32.86805725097656, -31.633941650390625, -30.399824142456055, -29.165706634521484, -27.931589126586914, -26.697473526000977, -25.463356018066406, -24.229238510131836, -22.995121002197266, -21.761005401611328, -20.526887893676758, -19.29277229309082, -18.05865478515625, -16.824539184570312, -15.590421676635742, -14.356304168701172, -13.122187614440918, -11.888071060180664, -10.653953552246094, -9.41983699798584, -8.185720443725586, -6.951602935791016, -5.717486381530762, -4.48336935043335, -3.2492523193359375, -2.0151357650756836, -0.7810182571411133, 0.4530982971191406, 1.6872152090072632, 2.9213321208953857, 4.155448913574219, 5.389565944671631, 6.623682975769043, 7.857799530029297, 9.091917037963867, 10.326033592224121, 11.560150146484375, 12.794267654418945, 14.0283842086792, 15.262500762939453, 16.496618270874023, 17.730735778808594, 18.96485137939453, 20.1989688873291, 21.433086395263672, 22.66720199584961, 23.90131950378418, 25.13543701171875, 26.369552612304688, 27.603670120239258, 28.837787628173828, 30.071903228759766, 31.306020736694336, 32.540138244628906, 33.774253845214844, 35.00836944580078, 36.242488861083984, 37.47660446166992, 38.710723876953125, 39.94483947753906]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 3.0, 8.0, 8.0, 8.0, 7.0, 13.0, 11.0, 16.0, 12.0, 20.0, 25.0, 22.0, 23.0, 21.0, 33.0, 32.0, 37.0, 33.0, 38.0, 32.0, 40.0, 48.0, 49.0, 32.0, 39.0, 40.0, 36.0, 38.0, 31.0, 31.0, 31.0, 24.0, 22.0, 24.0, 17.0, 14.0, 11.0, 14.0, 15.0, 9.0, 6.0, 9.0, 5.0, 4.0, 2.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-42.00522232055664, -40.75437927246094, -39.50353240966797, -38.252689361572266, -37.0018424987793, -35.750999450683594, -34.500152587890625, -33.24930953979492, -31.998464584350586, -30.74761962890625, -29.496774673461914, -28.245929718017578, -26.995086669921875, -25.744239807128906, -24.493396759033203, -23.242551803588867, -21.99170684814453, -20.740861892700195, -19.49001693725586, -18.239171981811523, -16.988327026367188, -15.737483024597168, -14.486639022827148, -13.235794067382812, -11.984949111938477, -10.73410415649414, -9.483259201049805, -8.232415199279785, -6.981570243835449, -5.730725288391113, -4.4798808097839355, -3.229036331176758, -1.9781875610351562, -0.7273428440093994, 0.5235018730163574, 1.7743465900421143, 3.025191307067871, 4.276036262512207, 5.526880741119385, 6.7777252197265625, 8.028570175170898, 9.279415130615234, 10.53026008605957, 11.78110408782959, 13.031949043273926, 14.282793998718262, 15.533638000488281, 16.784482955932617, 18.035327911376953, 19.28617286682129, 20.537017822265625, 21.78786277770996, 23.038707733154297, 24.28955078125, 25.540395736694336, 26.791240692138672, 28.042085647583008, 29.292930603027344, 30.54377555847168, 31.794620513916016, 33.04546356201172, 34.29631042480469, 35.54715347290039, 36.797996520996094, 38.04884338378906]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 7.0, 11.0, 6.0, 23.0, 21.0, 54.0, 71.0, 130.0, 176.0, 238.0, 382.0, 599.0, 908.0, 1510.0, 2364.0, 3697.0, 6280.0, 10685.0, 17968.0, 31192.0, 53554.0, 92898.0, 150284.0, 201318.0, 181379.0, 120789.0, 71360.0, 41252.0, 24273.0, 13918.0, 8257.0, 4938.0, 2915.0, 1874.0, 1088.0, 721.0, 494.0, 316.0, 193.0, 135.0, 95.0, 58.0, 39.0, 36.0, 23.0, 16.0, 3.0, 6.0, 6.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-99.875, -96.6279296875, -93.380859375, -90.1337890625, -86.88671875, -83.6396484375, -80.392578125, -77.1455078125, -73.8984375, -70.6513671875, -67.404296875, -64.1572265625, -60.91015625, -57.6630859375, -54.416015625, -51.1689453125, -47.921875, -44.6748046875, -41.427734375, -38.1806640625, -34.93359375, -31.6865234375, -28.439453125, -25.1923828125, -21.9453125, -18.6982421875, -15.451171875, -12.2041015625, -8.95703125, -5.7099609375, -2.462890625, 0.7841796875, 4.03125, 7.2783203125, 10.525390625, 13.7724609375, 17.01953125, 20.2666015625, 23.513671875, 26.7607421875, 30.0078125, 33.2548828125, 36.501953125, 39.7490234375, 42.99609375, 46.2431640625, 49.490234375, 52.7373046875, 55.984375, 59.2314453125, 62.478515625, 65.7255859375, 68.97265625, 72.2197265625, 75.466796875, 78.7138671875, 81.9609375, 85.2080078125, 88.455078125, 91.7021484375, 94.94921875, 98.1962890625, 101.443359375, 104.6904296875, 107.9375]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 4.0, 9.0, 19.0, 9.0, 7.0, 13.0, 26.0, 21.0, 15.0, 25.0, 19.0, 28.0, 32.0, 33.0, 28.0, 47.0, 40.0, 45.0, 44.0, 41.0, 54.0, 39.0, 34.0, 56.0, 27.0, 38.0, 40.0, 46.0, 25.0, 20.0, 18.0, 19.0, 21.0, 10.0, 13.0, 7.0, 5.0, 5.0, 8.0, 6.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-39.21875, -38.0830078125, -36.947265625, -35.8115234375, -34.67578125, -33.5400390625, -32.404296875, -31.2685546875, -30.1328125, -28.9970703125, -27.861328125, -26.7255859375, -25.58984375, -24.4541015625, -23.318359375, -22.1826171875, -21.046875, -19.9111328125, -18.775390625, -17.6396484375, -16.50390625, -15.3681640625, -14.232421875, -13.0966796875, -11.9609375, -10.8251953125, -9.689453125, -8.5537109375, -7.41796875, -6.2822265625, -5.146484375, -4.0107421875, -2.875, -1.7392578125, -0.603515625, 0.5322265625, 1.66796875, 2.8037109375, 3.939453125, 5.0751953125, 6.2109375, 7.3466796875, 8.482421875, 9.6181640625, 10.75390625, 11.8896484375, 13.025390625, 14.1611328125, 15.296875, 16.4326171875, 17.568359375, 18.7041015625, 19.83984375, 20.9755859375, 22.111328125, 23.2470703125, 24.3828125, 25.5185546875, 26.654296875, 27.7900390625, 28.92578125, 30.0615234375, 31.197265625, 32.3330078125, 33.46875]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 4.0, 4.0, 8.0, 4.0, 7.0, 14.0, 24.0, 13.0, 27.0, 49.0, 65.0, 97.0, 144.0, 226.0, 330.0, 473.0, 785.0, 1232.0, 1914.0, 3184.0, 5048.0, 8205.0, 14403.0, 24622.0, 44123.0, 81585.0, 155605.0, 250278.0, 206517.0, 111523.0, 59229.0, 32343.0, 18436.0, 10794.0, 6501.0, 3933.0, 2373.0, 1521.0, 1014.0, 646.0, 434.0, 282.0, 171.0, 122.0, 77.0, 54.0, 38.0, 25.0, 17.0, 11.0, 12.0, 12.0, 6.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-107.3125, -103.931640625, -100.55078125, -97.169921875, -93.7890625, -90.408203125, -87.02734375, -83.646484375, -80.265625, -76.884765625, -73.50390625, -70.123046875, -66.7421875, -63.361328125, -59.98046875, -56.599609375, -53.21875, -49.837890625, -46.45703125, -43.076171875, -39.6953125, -36.314453125, -32.93359375, -29.552734375, -26.171875, -22.791015625, -19.41015625, -16.029296875, -12.6484375, -9.267578125, -5.88671875, -2.505859375, 0.875, 4.255859375, 7.63671875, 11.017578125, 14.3984375, 17.779296875, 21.16015625, 24.541015625, 27.921875, 31.302734375, 34.68359375, 38.064453125, 41.4453125, 44.826171875, 48.20703125, 51.587890625, 54.96875, 58.349609375, 61.73046875, 65.111328125, 68.4921875, 71.873046875, 75.25390625, 78.634765625, 82.015625, 85.396484375, 88.77734375, 92.158203125, 95.5390625, 98.919921875, 102.30078125, 105.681640625, 109.0625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 3.0, 6.0, 4.0, 3.0, 10.0, 8.0, 7.0, 13.0, 10.0, 14.0, 19.0, 21.0, 18.0, 38.0, 41.0, 35.0, 36.0, 47.0, 45.0, 49.0, 62.0, 45.0, 49.0, 43.0, 45.0, 40.0, 39.0, 48.0, 38.0, 29.0, 23.0, 19.0, 14.0, 18.0, 15.0, 13.0, 9.0, 8.0, 3.0, 5.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-38.25, -37.095703125, -35.94140625, -34.787109375, -33.6328125, -32.478515625, -31.32421875, -30.169921875, -29.015625, -27.861328125, -26.70703125, -25.552734375, -24.3984375, -23.244140625, -22.08984375, -20.935546875, -19.78125, -18.626953125, -17.47265625, -16.318359375, -15.1640625, -14.009765625, -12.85546875, -11.701171875, -10.546875, -9.392578125, -8.23828125, -7.083984375, -5.9296875, -4.775390625, -3.62109375, -2.466796875, -1.3125, -0.158203125, 0.99609375, 2.150390625, 3.3046875, 4.458984375, 5.61328125, 6.767578125, 7.921875, 9.076171875, 10.23046875, 11.384765625, 12.5390625, 13.693359375, 14.84765625, 16.001953125, 17.15625, 18.310546875, 19.46484375, 20.619140625, 21.7734375, 22.927734375, 24.08203125, 25.236328125, 26.390625, 27.544921875, 28.69921875, 29.853515625, 31.0078125, 32.162109375, 33.31640625, 34.470703125, 35.625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 5.0, 5.0, 11.0, 11.0, 22.0, 26.0, 33.0, 61.0, 89.0, 104.0, 165.0, 243.0, 438.0, 584.0, 859.0, 1329.0, 2279.0, 3914.0, 6922.0, 12930.0, 28766.0, 91515.0, 509640.0, 286823.0, 56391.0, 20963.0, 10324.0, 5548.0, 3194.0, 1897.0, 1149.0, 777.0, 511.0, 336.0, 220.0, 158.0, 86.0, 74.0, 31.0, 31.0, 32.0, 23.0, 13.0, 10.0, 11.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-168.875, -163.568359375, -158.26171875, -152.955078125, -147.6484375, -142.341796875, -137.03515625, -131.728515625, -126.421875, -121.115234375, -115.80859375, -110.501953125, -105.1953125, -99.888671875, -94.58203125, -89.275390625, -83.96875, -78.662109375, -73.35546875, -68.048828125, -62.7421875, -57.435546875, -52.12890625, -46.822265625, -41.515625, -36.208984375, -30.90234375, -25.595703125, -20.2890625, -14.982421875, -9.67578125, -4.369140625, 0.9375, 6.244140625, 11.55078125, 16.857421875, 22.1640625, 27.470703125, 32.77734375, 38.083984375, 43.390625, 48.697265625, 54.00390625, 59.310546875, 64.6171875, 69.923828125, 75.23046875, 80.537109375, 85.84375, 91.150390625, 96.45703125, 101.763671875, 107.0703125, 112.376953125, 117.68359375, 122.990234375, 128.296875, 133.603515625, 138.91015625, 144.216796875, 149.5234375, 154.830078125, 160.13671875, 165.443359375, 170.75]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 1.0, 1.0, 5.0, 4.0, 6.0, 6.0, 5.0, 8.0, 4.0, 10.0, 12.0, 24.0, 37.0, 93.0, 254.0, 273.0, 135.0, 40.0, 17.0, 16.0, 9.0, 11.0, 9.0, 1.0, 4.0, 3.0, 5.0, 1.0, 5.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01345062255859375, -0.012841343879699707, -0.012232065200805664, -0.011622786521911621, -0.011013507843017578, -0.010404229164123535, -0.009794950485229492, -0.00918567180633545, -0.008576393127441406, -0.007967114448547363, -0.00735783576965332, -0.006748557090759277, -0.006139278411865234, -0.005529999732971191, -0.0049207210540771484, -0.0043114423751831055, -0.0037021636962890625, -0.0030928850173950195, -0.0024836063385009766, -0.0018743276596069336, -0.0012650489807128906, -0.0006557703018188477, -4.649162292480469e-05, 0.0005627870559692383, 0.0011720657348632812, 0.0017813444137573242, 0.002390623092651367, 0.00299990177154541, 0.003609180450439453, 0.004218459129333496, 0.004827737808227539, 0.005437016487121582, 0.006046295166015625, 0.006655573844909668, 0.007264852523803711, 0.007874131202697754, 0.008483409881591797, 0.00909268856048584, 0.009701967239379883, 0.010311245918273926, 0.010920524597167969, 0.011529803276062012, 0.012139081954956055, 0.012748360633850098, 0.01335763931274414, 0.013966917991638184, 0.014576196670532227, 0.01518547534942627, 0.015794754028320312, 0.016404032707214355, 0.0170133113861084, 0.01762259006500244, 0.018231868743896484, 0.018841147422790527, 0.01945042610168457, 0.020059704780578613, 0.020668983459472656, 0.0212782621383667, 0.021887540817260742, 0.022496819496154785, 0.023106098175048828, 0.02371537685394287, 0.024324655532836914, 0.024933934211730957, 0.025543212890625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 4.0, 1.0, 1.0, 3.0, 3.0, 9.0, 8.0, 12.0, 18.0, 18.0, 31.0, 44.0, 84.0, 95.0, 159.0, 218.0, 351.0, 493.0, 708.0, 1189.0, 1754.0, 2822.0, 4835.0, 8622.0, 16749.0, 36116.0, 94364.0, 290421.0, 366502.0, 130392.0, 46690.0, 20761.0, 10336.0, 5500.0, 3320.0, 2094.0, 1313.0, 827.0, 551.0, 357.0, 250.0, 173.0, 111.0, 71.0, 60.0, 32.0, 28.0, 15.0, 13.0, 15.0, 11.0, 7.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-97.0, -93.982421875, -90.96484375, -87.947265625, -84.9296875, -81.912109375, -78.89453125, -75.876953125, -72.859375, -69.841796875, -66.82421875, -63.806640625, -60.7890625, -57.771484375, -54.75390625, -51.736328125, -48.71875, -45.701171875, -42.68359375, -39.666015625, -36.6484375, -33.630859375, -30.61328125, -27.595703125, -24.578125, -21.560546875, -18.54296875, -15.525390625, -12.5078125, -9.490234375, -6.47265625, -3.455078125, -0.4375, 2.580078125, 5.59765625, 8.615234375, 11.6328125, 14.650390625, 17.66796875, 20.685546875, 23.703125, 26.720703125, 29.73828125, 32.755859375, 35.7734375, 38.791015625, 41.80859375, 44.826171875, 47.84375, 50.861328125, 53.87890625, 56.896484375, 59.9140625, 62.931640625, 65.94921875, 68.966796875, 71.984375, 75.001953125, 78.01953125, 81.037109375, 84.0546875, 87.072265625, 90.08984375, 93.107421875, 96.125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 2.0, 1.0, 4.0, 6.0, 5.0, 10.0, 11.0, 12.0, 14.0, 21.0, 25.0, 33.0, 52.0, 83.0, 83.0, 111.0, 117.0, 110.0, 58.0, 70.0, 45.0, 32.0, 23.0, 11.0, 18.0, 6.0, 8.0, 8.0, 3.0, 5.0, 7.0, 1.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-29.359375, -28.350830078125, -27.34228515625, -26.333740234375, -25.3251953125, -24.316650390625, -23.30810546875, -22.299560546875, -21.291015625, -20.282470703125, -19.27392578125, -18.265380859375, -17.2568359375, -16.248291015625, -15.23974609375, -14.231201171875, -13.22265625, -12.214111328125, -11.20556640625, -10.197021484375, -9.1884765625, -8.179931640625, -7.17138671875, -6.162841796875, -5.154296875, -4.145751953125, -3.13720703125, -2.128662109375, -1.1201171875, -0.111572265625, 0.89697265625, 1.905517578125, 2.9140625, 3.922607421875, 4.93115234375, 5.939697265625, 6.9482421875, 7.956787109375, 8.96533203125, 9.973876953125, 10.982421875, 11.990966796875, 12.99951171875, 14.008056640625, 15.0166015625, 16.025146484375, 17.03369140625, 18.042236328125, 19.05078125, 20.059326171875, 21.06787109375, 22.076416015625, 23.0849609375, 24.093505859375, 25.10205078125, 26.110595703125, 27.119140625, 28.127685546875, 29.13623046875, 30.144775390625, 31.1533203125, 32.161865234375, 33.17041015625, 34.178955078125, 35.1875]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 9.0, 3.0, 3.0, 2.0, 5.0, 10.0, 10.0, 19.0, 22.0, 39.0, 46.0, 52.0, 53.0, 60.0, 78.0, 69.0, 82.0, 79.0, 66.0, 65.0, 52.0, 59.0, 36.0, 25.0, 21.0, 13.0, 13.0, 10.0, 4.0, 2.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.76567840576172, -58.00718688964844, -56.248695373535156, -54.490203857421875, -52.73171615600586, -50.97322463989258, -49.2147331237793, -47.456241607666016, -45.69775390625, -43.93926239013672, -42.18077087402344, -40.422279357910156, -38.66379165649414, -36.90530014038086, -35.14680862426758, -33.3883171081543, -31.629825592041016, -29.871334075927734, -28.112844467163086, -26.354352951049805, -24.595863342285156, -22.837371826171875, -21.078880310058594, -19.320388793945312, -17.561899185180664, -15.8034086227417, -14.044918060302734, -12.286426544189453, -10.527935981750488, -8.769445419311523, -7.010953903198242, -5.252463340759277, -3.4939727783203125, -1.7354819774627686, 0.02300882339477539, 1.7814998626708984, 3.5399904251098633, 5.298480987548828, 7.056972503662109, 8.815463066101074, 10.573953628540039, 12.332444190979004, 14.090934753417969, 15.84942626953125, 17.60791778564453, 19.36640739440918, 21.12489891052246, 22.88338851928711, 24.64188003540039, 26.400371551513672, 28.15886116027832, 29.9173526763916, 31.67584228515625, 33.43433380126953, 35.19282531738281, 36.951316833496094, 38.709808349609375, 40.468299865722656, 42.22679138183594, 43.98528289794922, 45.743770599365234, 47.502262115478516, 49.2607536315918, 51.01924514770508, 52.777732849121094]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 5.0, 5.0, 4.0, 9.0, 6.0, 8.0, 6.0, 14.0, 10.0, 17.0, 25.0, 16.0, 20.0, 21.0, 25.0, 35.0, 28.0, 40.0, 28.0, 36.0, 40.0, 45.0, 50.0, 41.0, 43.0, 56.0, 31.0, 41.0, 43.0, 29.0, 37.0, 32.0, 22.0, 21.0, 17.0, 12.0, 21.0, 12.0, 12.0, 10.0, 10.0, 10.0, 6.0, 1.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0], "bins": [-38.17616271972656, -37.085914611816406, -35.99566650390625, -34.905418395996094, -33.81517028808594, -32.72492218017578, -31.634674072265625, -30.54442596435547, -29.454177856445312, -28.363929748535156, -27.273681640625, -26.183433532714844, -25.093185424804688, -24.00293731689453, -22.912689208984375, -21.82244110107422, -20.732192993164062, -19.641944885253906, -18.55169677734375, -17.461448669433594, -16.371200561523438, -15.280952453613281, -14.190704345703125, -13.100456237792969, -12.010208129882812, -10.919960021972656, -9.8297119140625, -8.739463806152344, -7.6492156982421875, -6.558967590332031, -5.468719482421875, -4.378471374511719, -3.2882232666015625, -2.1979751586914062, -1.10772705078125, -0.01747894287109375, 1.0727691650390625, 2.1630172729492188, 3.253265380859375, 4.343513488769531, 5.4337615966796875, 6.524009704589844, 7.6142578125, 8.704505920410156, 9.794754028320312, 10.885002136230469, 11.975250244140625, 13.065498352050781, 14.155746459960938, 15.245994567871094, 16.33624267578125, 17.426490783691406, 18.516738891601562, 19.60698699951172, 20.697235107421875, 21.78748321533203, 22.877731323242188, 23.967979431152344, 25.0582275390625, 26.148475646972656, 27.238723754882812, 28.32897186279297, 29.419219970703125, 30.50946807861328, 31.599716186523438]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 7.0, 8.0, 10.0, 14.0, 10.0, 30.0, 40.0, 74.0, 104.0, 141.0, 247.0, 380.0, 654.0, 1104.0, 1799.0, 3010.0, 4872.0, 8127.0, 13810.0, 22678.0, 37410.0, 58916.0, 89870.0, 125935.0, 152498.0, 152429.0, 126917.0, 91198.0, 60201.0, 37756.0, 23140.0, 14043.0, 8329.0, 5025.0, 3059.0, 1823.0, 1126.0, 631.0, 420.0, 271.0, 166.0, 104.0, 63.0, 40.0, 31.0, 16.0, 11.0, 9.0, 3.0, 1.0, 4.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-34.78125, -33.62255859375, -32.4638671875, -31.30517578125, -30.146484375, -28.98779296875, -27.8291015625, -26.67041015625, -25.51171875, -24.35302734375, -23.1943359375, -22.03564453125, -20.876953125, -19.71826171875, -18.5595703125, -17.40087890625, -16.2421875, -15.08349609375, -13.9248046875, -12.76611328125, -11.607421875, -10.44873046875, -9.2900390625, -8.13134765625, -6.97265625, -5.81396484375, -4.6552734375, -3.49658203125, -2.337890625, -1.17919921875, -0.0205078125, 1.13818359375, 2.296875, 3.45556640625, 4.6142578125, 5.77294921875, 6.931640625, 8.09033203125, 9.2490234375, 10.40771484375, 11.56640625, 12.72509765625, 13.8837890625, 15.04248046875, 16.201171875, 17.35986328125, 18.5185546875, 19.67724609375, 20.8359375, 21.99462890625, 23.1533203125, 24.31201171875, 25.470703125, 26.62939453125, 27.7880859375, 28.94677734375, 30.10546875, 31.26416015625, 32.4228515625, 33.58154296875, 34.740234375, 35.89892578125, 37.0576171875, 38.21630859375, 39.375]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 6.0, 6.0, 5.0, 10.0, 5.0, 9.0, 17.0, 10.0, 28.0, 23.0, 29.0, 27.0, 36.0, 30.0, 36.0, 32.0, 43.0, 45.0, 49.0, 44.0, 48.0, 48.0, 39.0, 51.0, 23.0, 44.0, 33.0, 31.0, 33.0, 22.0, 26.0, 19.0, 16.0, 15.0, 15.0, 10.0, 8.0, 5.0, 4.0, 7.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.125, -33.05029296875, -31.9755859375, -30.90087890625, -29.826171875, -28.75146484375, -27.6767578125, -26.60205078125, -25.52734375, -24.45263671875, -23.3779296875, -22.30322265625, -21.228515625, -20.15380859375, -19.0791015625, -18.00439453125, -16.9296875, -15.85498046875, -14.7802734375, -13.70556640625, -12.630859375, -11.55615234375, -10.4814453125, -9.40673828125, -8.33203125, -7.25732421875, -6.1826171875, -5.10791015625, -4.033203125, -2.95849609375, -1.8837890625, -0.80908203125, 0.265625, 1.34033203125, 2.4150390625, 3.48974609375, 4.564453125, 5.63916015625, 6.7138671875, 7.78857421875, 8.86328125, 9.93798828125, 11.0126953125, 12.08740234375, 13.162109375, 14.23681640625, 15.3115234375, 16.38623046875, 17.4609375, 18.53564453125, 19.6103515625, 20.68505859375, 21.759765625, 22.83447265625, 23.9091796875, 24.98388671875, 26.05859375, 27.13330078125, 28.2080078125, 29.28271484375, 30.357421875, 31.43212890625, 32.5068359375, 33.58154296875, 34.65625]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 13.0, 9.0, 9.0, 37.0, 42.0, 45.0, 74.0, 101.0, 166.0, 255.0, 394.0, 538.0, 847.0, 1286.0, 1987.0, 3116.0, 5041.0, 7895.0, 12785.0, 20858.0, 33337.0, 53256.0, 83517.0, 117936.0, 147524.0, 154227.0, 132663.0, 97661.0, 64362.0, 41185.0, 25328.0, 15701.0, 9714.0, 5928.0, 3737.0, 2421.0, 1606.0, 950.0, 660.0, 457.0, 303.0, 189.0, 134.0, 83.0, 50.0, 44.0, 27.0, 19.0, 15.0, 7.0, 7.0, 5.0, 4.0, 4.0, 1.0, 3.0, 1.0], "bins": [-32.34375, -31.339599609375, -30.33544921875, -29.331298828125, -28.3271484375, -27.322998046875, -26.31884765625, -25.314697265625, -24.310546875, -23.306396484375, -22.30224609375, -21.298095703125, -20.2939453125, -19.289794921875, -18.28564453125, -17.281494140625, -16.27734375, -15.273193359375, -14.26904296875, -13.264892578125, -12.2607421875, -11.256591796875, -10.25244140625, -9.248291015625, -8.244140625, -7.239990234375, -6.23583984375, -5.231689453125, -4.2275390625, -3.223388671875, -2.21923828125, -1.215087890625, -0.2109375, 0.793212890625, 1.79736328125, 2.801513671875, 3.8056640625, 4.809814453125, 5.81396484375, 6.818115234375, 7.822265625, 8.826416015625, 9.83056640625, 10.834716796875, 11.8388671875, 12.843017578125, 13.84716796875, 14.851318359375, 15.85546875, 16.859619140625, 17.86376953125, 18.867919921875, 19.8720703125, 20.876220703125, 21.88037109375, 22.884521484375, 23.888671875, 24.892822265625, 25.89697265625, 26.901123046875, 27.9052734375, 28.909423828125, 29.91357421875, 30.917724609375, 31.921875]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 5.0, 5.0, 7.0, 5.0, 7.0, 9.0, 11.0, 13.0, 12.0, 9.0, 13.0, 26.0, 23.0, 17.0, 28.0, 28.0, 37.0, 30.0, 32.0, 41.0, 37.0, 42.0, 41.0, 35.0, 41.0, 34.0, 47.0, 45.0, 38.0, 41.0, 29.0, 29.0, 22.0, 26.0, 15.0, 9.0, 19.0, 17.0, 15.0, 9.0, 13.0, 6.0, 9.0, 4.0, 6.0, 3.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-19.578125, -18.93505859375, -18.2919921875, -17.64892578125, -17.005859375, -16.36279296875, -15.7197265625, -15.07666015625, -14.43359375, -13.79052734375, -13.1474609375, -12.50439453125, -11.861328125, -11.21826171875, -10.5751953125, -9.93212890625, -9.2890625, -8.64599609375, -8.0029296875, -7.35986328125, -6.716796875, -6.07373046875, -5.4306640625, -4.78759765625, -4.14453125, -3.50146484375, -2.8583984375, -2.21533203125, -1.572265625, -0.92919921875, -0.2861328125, 0.35693359375, 1.0, 1.64306640625, 2.2861328125, 2.92919921875, 3.572265625, 4.21533203125, 4.8583984375, 5.50146484375, 6.14453125, 6.78759765625, 7.4306640625, 8.07373046875, 8.716796875, 9.35986328125, 10.0029296875, 10.64599609375, 11.2890625, 11.93212890625, 12.5751953125, 13.21826171875, 13.861328125, 14.50439453125, 15.1474609375, 15.79052734375, 16.43359375, 17.07666015625, 17.7197265625, 18.36279296875, 19.005859375, 19.64892578125, 20.2919921875, 20.93505859375, 21.578125]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 4.0, 4.0, 18.0, 27.0, 22.0, 45.0, 58.0, 90.0, 138.0, 192.0, 258.0, 362.0, 617.0, 932.0, 1439.0, 2204.0, 3421.0, 5687.0, 9233.0, 16196.0, 29476.0, 55572.0, 106962.0, 193126.0, 242858.0, 173729.0, 93689.0, 48854.0, 26392.0, 14607.0, 8472.0, 4930.0, 3152.0, 1930.0, 1304.0, 841.0, 567.0, 352.0, 250.0, 159.0, 128.0, 91.0, 52.0, 43.0, 25.0, 24.0, 9.0, 9.0, 8.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-66.75, -64.8095703125, -62.869140625, -60.9287109375, -58.98828125, -57.0478515625, -55.107421875, -53.1669921875, -51.2265625, -49.2861328125, -47.345703125, -45.4052734375, -43.46484375, -41.5244140625, -39.583984375, -37.6435546875, -35.703125, -33.7626953125, -31.822265625, -29.8818359375, -27.94140625, -26.0009765625, -24.060546875, -22.1201171875, -20.1796875, -18.2392578125, -16.298828125, -14.3583984375, -12.41796875, -10.4775390625, -8.537109375, -6.5966796875, -4.65625, -2.7158203125, -0.775390625, 1.1650390625, 3.10546875, 5.0458984375, 6.986328125, 8.9267578125, 10.8671875, 12.8076171875, 14.748046875, 16.6884765625, 18.62890625, 20.5693359375, 22.509765625, 24.4501953125, 26.390625, 28.3310546875, 30.271484375, 32.2119140625, 34.15234375, 36.0927734375, 38.033203125, 39.9736328125, 41.9140625, 43.8544921875, 45.794921875, 47.7353515625, 49.67578125, 51.6162109375, 53.556640625, 55.4970703125, 57.4375]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 8.0, 5.0, 3.0, 8.0, 5.0, 8.0, 12.0, 11.0, 18.0, 25.0, 22.0, 33.0, 38.0, 47.0, 53.0, 56.0, 67.0, 62.0, 73.0, 68.0, 70.0, 51.0, 56.0, 41.0, 38.0, 26.0, 20.0, 11.0, 19.0, 14.0, 10.0, 14.0, 7.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.006725311279296875, -0.0065577030181884766, -0.006390094757080078, -0.00622248649597168, -0.006054878234863281, -0.005887269973754883, -0.005719661712646484, -0.005552053451538086, -0.0053844451904296875, -0.005216836929321289, -0.005049228668212891, -0.004881620407104492, -0.004714012145996094, -0.004546403884887695, -0.004378795623779297, -0.0042111873626708984, -0.0040435791015625, -0.0038759708404541016, -0.003708362579345703, -0.0035407543182373047, -0.0033731460571289062, -0.003205537796020508, -0.0030379295349121094, -0.002870321273803711, -0.0027027130126953125, -0.002535104751586914, -0.0023674964904785156, -0.002199888229370117, -0.0020322799682617188, -0.0018646717071533203, -0.0016970634460449219, -0.0015294551849365234, -0.001361846923828125, -0.0011942386627197266, -0.0010266304016113281, -0.0008590221405029297, -0.0006914138793945312, -0.0005238056182861328, -0.0003561973571777344, -0.00018858909606933594, -2.09808349609375e-05, 0.00014662742614746094, 0.0003142356872558594, 0.0004818439483642578, 0.0006494522094726562, 0.0008170604705810547, 0.0009846687316894531, 0.0011522769927978516, 0.00131988525390625, 0.0014874935150146484, 0.0016551017761230469, 0.0018227100372314453, 0.0019903182983398438, 0.002157926559448242, 0.0023255348205566406, 0.002493143081665039, 0.0026607513427734375, 0.002828359603881836, 0.0029959678649902344, 0.003163576126098633, 0.0033311843872070312, 0.0034987926483154297, 0.003666400909423828, 0.0038340091705322266, 0.004001617431640625]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 5.0, 5.0, 9.0, 10.0, 10.0, 13.0, 22.0, 32.0, 46.0, 62.0, 102.0, 162.0, 250.0, 296.0, 534.0, 831.0, 1376.0, 2217.0, 3630.0, 5872.0, 10034.0, 17823.0, 32282.0, 61299.0, 115437.0, 199101.0, 233773.0, 164843.0, 90334.0, 47462.0, 25528.0, 14288.0, 8113.0, 4857.0, 2942.0, 1771.0, 1114.0, 733.0, 484.0, 289.0, 186.0, 125.0, 84.0, 53.0, 51.0, 27.0, 18.0, 13.0, 8.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.5, -51.67431640625, -49.8486328125, -48.02294921875, -46.197265625, -44.37158203125, -42.5458984375, -40.72021484375, -38.89453125, -37.06884765625, -35.2431640625, -33.41748046875, -31.591796875, -29.76611328125, -27.9404296875, -26.11474609375, -24.2890625, -22.46337890625, -20.6376953125, -18.81201171875, -16.986328125, -15.16064453125, -13.3349609375, -11.50927734375, -9.68359375, -7.85791015625, -6.0322265625, -4.20654296875, -2.380859375, -0.55517578125, 1.2705078125, 3.09619140625, 4.921875, 6.74755859375, 8.5732421875, 10.39892578125, 12.224609375, 14.05029296875, 15.8759765625, 17.70166015625, 19.52734375, 21.35302734375, 23.1787109375, 25.00439453125, 26.830078125, 28.65576171875, 30.4814453125, 32.30712890625, 34.1328125, 35.95849609375, 37.7841796875, 39.60986328125, 41.435546875, 43.26123046875, 45.0869140625, 46.91259765625, 48.73828125, 50.56396484375, 52.3896484375, 54.21533203125, 56.041015625, 57.86669921875, 59.6923828125, 61.51806640625, 63.34375]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 1.0, 4.0, 2.0, 3.0, 3.0, 6.0, 7.0, 15.0, 20.0, 12.0, 14.0, 15.0, 23.0, 25.0, 42.0, 33.0, 45.0, 53.0, 46.0, 58.0, 56.0, 63.0, 60.0, 47.0, 45.0, 51.0, 42.0, 39.0, 28.0, 25.0, 30.0, 21.0, 12.0, 11.0, 4.0, 4.0, 15.0, 4.0, 4.0, 8.0, 6.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-17.09375, -16.593505859375, -16.09326171875, -15.593017578125, -15.0927734375, -14.592529296875, -14.09228515625, -13.592041015625, -13.091796875, -12.591552734375, -12.09130859375, -11.591064453125, -11.0908203125, -10.590576171875, -10.09033203125, -9.590087890625, -9.08984375, -8.589599609375, -8.08935546875, -7.589111328125, -7.0888671875, -6.588623046875, -6.08837890625, -5.588134765625, -5.087890625, -4.587646484375, -4.08740234375, -3.587158203125, -3.0869140625, -2.586669921875, -2.08642578125, -1.586181640625, -1.0859375, -0.585693359375, -0.08544921875, 0.414794921875, 0.9150390625, 1.415283203125, 1.91552734375, 2.415771484375, 2.916015625, 3.416259765625, 3.91650390625, 4.416748046875, 4.9169921875, 5.417236328125, 5.91748046875, 6.417724609375, 6.91796875, 7.418212890625, 7.91845703125, 8.418701171875, 8.9189453125, 9.419189453125, 9.91943359375, 10.419677734375, 10.919921875, 11.420166015625, 11.92041015625, 12.420654296875, 12.9208984375, 13.421142578125, 13.92138671875, 14.421630859375, 14.921875]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 2.0, 6.0, 8.0, 7.0, 16.0, 15.0, 19.0, 30.0, 26.0, 33.0, 42.0, 35.0, 49.0, 53.0, 45.0, 58.0, 56.0, 39.0, 58.0, 54.0, 47.0, 52.0, 46.0, 41.0, 37.0, 17.0, 20.0, 18.0, 13.0, 14.0, 9.0, 10.0, 9.0, 4.0, 4.0, 6.0, 2.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.76057434082031, -41.48890686035156, -40.21723937988281, -38.94557189941406, -37.67390441894531, -36.40223693847656, -35.13056945800781, -33.85890197753906, -32.58723449707031, -31.315567016601562, -30.043899536132812, -28.772232055664062, -27.500564575195312, -26.228897094726562, -24.957229614257812, -23.685562133789062, -22.413894653320312, -21.142227172851562, -19.870559692382812, -18.598892211914062, -17.327224731445312, -16.055557250976562, -14.783889770507812, -13.512222290039062, -12.240554809570312, -10.968887329101562, -9.697219848632812, -8.425552368164062, -7.1538848876953125, -5.8822174072265625, -4.6105499267578125, -3.3388824462890625, -2.067218780517578, -0.7955513000488281, 0.4761161804199219, 1.7477836608886719, 3.019451141357422, 4.291118621826172, 5.562786102294922, 6.834453582763672, 8.106121063232422, 9.377788543701172, 10.649456024169922, 11.921123504638672, 13.192790985107422, 14.464458465576172, 15.736125946044922, 17.007793426513672, 18.279460906982422, 19.551128387451172, 20.822795867919922, 22.094463348388672, 23.366130828857422, 24.637798309326172, 25.909465789794922, 27.181133270263672, 28.452800750732422, 29.724468231201172, 30.996135711669922, 32.26780319213867, 33.53947067260742, 34.81113815307617, 36.08280563354492, 37.35447311401367, 38.62614059448242]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 5.0, 3.0, 2.0, 3.0, 3.0, 5.0, 8.0, 9.0, 5.0, 10.0, 9.0, 20.0, 20.0, 25.0, 31.0, 26.0, 25.0, 26.0, 40.0, 45.0, 43.0, 27.0, 47.0, 42.0, 41.0, 43.0, 31.0, 47.0, 43.0, 42.0, 36.0, 29.0, 29.0, 19.0, 32.0, 20.0, 26.0, 19.0, 15.0, 11.0, 9.0, 10.0, 4.0, 10.0, 5.0, 5.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-37.21701431274414, -36.13599395751953, -35.05497741699219, -33.97395706176758, -32.89293670654297, -31.811920166015625, -30.730899810791016, -29.64988136291504, -28.568862915039062, -27.487844467163086, -26.406824111938477, -25.3258056640625, -24.244787216186523, -23.163768768310547, -22.082748413085938, -21.00172996520996, -19.92070960998535, -18.839691162109375, -17.758670806884766, -16.67765235900879, -15.596633911132812, -14.51561450958252, -13.434595108032227, -12.35357666015625, -11.272557258605957, -10.191537857055664, -9.110519409179688, -8.029500007629395, -6.94848108291626, -5.867462158203125, -4.786442756652832, -3.7054238319396973, -2.6244029998779297, -1.5433839559555054, -0.46236491203308105, 0.6186542510986328, 1.6996731758117676, 2.7806921005249023, 3.8617115020751953, 4.94273042678833, 6.023749351501465, 7.1047682762146, 8.185787200927734, 9.266806602478027, 10.34782600402832, 11.428844451904297, 12.50986385345459, 13.590883255004883, 14.67190170288086, 15.752921104431152, 16.833940505981445, 17.914958953857422, 18.9959774017334, 20.076995849609375, 21.158016204833984, 22.23903465270996, 23.320053100585938, 24.401071548461914, 25.482091903686523, 26.5631103515625, 27.644128799438477, 28.725147247314453, 29.806167602539062, 30.88718605041504, 31.96820640563965]}, "gradients/decoder.bert.encoder.layer.20.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 7.0, 3.0, 4.0, 10.0, 28.0, 37.0, 59.0, 80.0, 157.0, 219.0, 350.0, 579.0, 885.0, 1332.0, 2007.0, 3386.0, 5594.0, 9021.0, 15080.0, 25606.0, 43902.0, 77720.0, 137253.0, 243803.0, 415192.0, 630088.0, 759345.0, 681891.0, 474132.0, 285032.0, 162666.0, 91290.0, 52115.0, 30113.0, 17991.0, 10729.0, 6430.0, 3834.0, 2393.0, 1461.0, 914.0, 574.0, 359.0, 234.0, 132.0, 94.0, 65.0, 43.0, 25.0, 15.0, 9.0, 5.0, 4.0, 1.0], "bins": [-30.359375, -29.531005859375, -28.70263671875, -27.874267578125, -27.0458984375, -26.217529296875, -25.38916015625, -24.560791015625, -23.732421875, -22.904052734375, -22.07568359375, -21.247314453125, -20.4189453125, -19.590576171875, -18.76220703125, -17.933837890625, -17.10546875, -16.277099609375, -15.44873046875, -14.620361328125, -13.7919921875, -12.963623046875, -12.13525390625, -11.306884765625, -10.478515625, -9.650146484375, -8.82177734375, -7.993408203125, -7.1650390625, -6.336669921875, -5.50830078125, -4.679931640625, -3.8515625, -3.023193359375, -2.19482421875, -1.366455078125, -0.5380859375, 0.290283203125, 1.11865234375, 1.947021484375, 2.775390625, 3.603759765625, 4.43212890625, 5.260498046875, 6.0888671875, 6.917236328125, 7.74560546875, 8.573974609375, 9.40234375, 10.230712890625, 11.05908203125, 11.887451171875, 12.7158203125, 13.544189453125, 14.37255859375, 15.200927734375, 16.029296875, 16.857666015625, 17.68603515625, 18.514404296875, 19.3427734375, 20.171142578125, 20.99951171875, 21.827880859375, 22.65625]}, "gradients/decoder.bert.encoder.layer.20.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 5.0, 1.0, 4.0, 5.0, 6.0, 5.0, 3.0, 4.0, 14.0, 9.0, 9.0, 23.0, 21.0, 20.0, 21.0, 23.0, 30.0, 31.0, 50.0, 36.0, 45.0, 40.0, 41.0, 41.0, 37.0, 40.0, 57.0, 38.0, 40.0, 38.0, 34.0, 36.0, 26.0, 29.0, 28.0, 28.0, 18.0, 14.0, 14.0, 14.0, 5.0, 11.0, 2.0, 7.0, 3.0, 1.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.84375, -21.104736328125, -20.36572265625, -19.626708984375, -18.8876953125, -18.148681640625, -17.40966796875, -16.670654296875, -15.931640625, -15.192626953125, -14.45361328125, -13.714599609375, -12.9755859375, -12.236572265625, -11.49755859375, -10.758544921875, -10.01953125, -9.280517578125, -8.54150390625, -7.802490234375, -7.0634765625, -6.324462890625, -5.58544921875, -4.846435546875, -4.107421875, -3.368408203125, -2.62939453125, -1.890380859375, -1.1513671875, -0.412353515625, 0.32666015625, 1.065673828125, 1.8046875, 2.543701171875, 3.28271484375, 4.021728515625, 4.7607421875, 5.499755859375, 6.23876953125, 6.977783203125, 7.716796875, 8.455810546875, 9.19482421875, 9.933837890625, 10.6728515625, 11.411865234375, 12.15087890625, 12.889892578125, 13.62890625, 14.367919921875, 15.10693359375, 15.845947265625, 16.5849609375, 17.323974609375, 18.06298828125, 18.802001953125, 19.541015625, 20.280029296875, 21.01904296875, 21.758056640625, 22.4970703125, 23.236083984375, 23.97509765625, 24.714111328125, 25.453125]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 8.0, 11.0, 4.0, 13.0, 21.0, 35.0, 63.0, 106.0, 155.0, 242.0, 345.0, 555.0, 917.0, 1461.0, 2246.0, 3445.0, 5595.0, 9000.0, 14901.0, 24035.0, 39944.0, 65599.0, 107660.0, 174178.0, 273799.0, 405646.0, 544268.0, 624851.0, 584251.0, 456105.0, 317583.0, 206029.0, 128482.0, 78632.0, 48175.0, 29271.0, 17682.0, 10924.0, 6647.0, 4197.0, 2647.0, 1659.0, 1048.0, 703.0, 369.0, 299.0, 174.0, 103.0, 77.0, 52.0, 34.0, 17.0, 12.0, 11.0, 5.0, 6.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-22.53125, -21.796875, -21.0625, -20.328125, -19.59375, -18.859375, -18.125, -17.390625, -16.65625, -15.921875, -15.1875, -14.453125, -13.71875, -12.984375, -12.25, -11.515625, -10.78125, -10.046875, -9.3125, -8.578125, -7.84375, -7.109375, -6.375, -5.640625, -4.90625, -4.171875, -3.4375, -2.703125, -1.96875, -1.234375, -0.5, 0.234375, 0.96875, 1.703125, 2.4375, 3.171875, 3.90625, 4.640625, 5.375, 6.109375, 6.84375, 7.578125, 8.3125, 9.046875, 9.78125, 10.515625, 11.25, 11.984375, 12.71875, 13.453125, 14.1875, 14.921875, 15.65625, 16.390625, 17.125, 17.859375, 18.59375, 19.328125, 20.0625, 20.796875, 21.53125, 22.265625, 23.0, 23.734375, 24.46875]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 10.0, 8.0, 5.0, 9.0, 19.0, 23.0, 31.0, 30.0, 37.0, 63.0, 62.0, 75.0, 78.0, 109.0, 125.0, 141.0, 160.0, 195.0, 179.0, 222.0, 208.0, 202.0, 223.0, 203.0, 226.0, 210.0, 175.0, 157.0, 129.0, 120.0, 131.0, 92.0, 83.0, 56.0, 55.0, 39.0, 43.0, 43.0, 31.0, 20.0, 9.0, 8.0, 11.0, 9.0, 4.0, 4.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.4375, -9.1298828125, -8.822265625, -8.5146484375, -8.20703125, -7.8994140625, -7.591796875, -7.2841796875, -6.9765625, -6.6689453125, -6.361328125, -6.0537109375, -5.74609375, -5.4384765625, -5.130859375, -4.8232421875, -4.515625, -4.2080078125, -3.900390625, -3.5927734375, -3.28515625, -2.9775390625, -2.669921875, -2.3623046875, -2.0546875, -1.7470703125, -1.439453125, -1.1318359375, -0.82421875, -0.5166015625, -0.208984375, 0.0986328125, 0.40625, 0.7138671875, 1.021484375, 1.3291015625, 1.63671875, 1.9443359375, 2.251953125, 2.5595703125, 2.8671875, 3.1748046875, 3.482421875, 3.7900390625, 4.09765625, 4.4052734375, 4.712890625, 5.0205078125, 5.328125, 5.6357421875, 5.943359375, 6.2509765625, 6.55859375, 6.8662109375, 7.173828125, 7.4814453125, 7.7890625, 8.0966796875, 8.404296875, 8.7119140625, 9.01953125, 9.3271484375, 9.634765625, 9.9423828125, 10.25]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 13.0, 6.0, 10.0, 7.0, 7.0, 12.0, 15.0, 25.0, 16.0, 30.0, 33.0, 48.0, 45.0, 45.0, 37.0, 57.0, 48.0, 55.0, 62.0, 51.0, 55.0, 57.0, 40.0, 37.0, 30.0, 39.0, 22.0, 26.0, 12.0, 14.0, 13.0, 10.0, 4.0, 10.0, 2.0, 0.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-30.91673469543457, -29.967512130737305, -29.018291473388672, -28.069068908691406, -27.119848251342773, -26.170625686645508, -25.221405029296875, -24.27218246459961, -23.322959899902344, -22.373737335205078, -21.424516677856445, -20.47529411315918, -19.526073455810547, -18.57685089111328, -17.627628326416016, -16.678407669067383, -15.72918701171875, -14.7799654006958, -13.830743789672852, -12.881521224975586, -11.932300567626953, -10.983078002929688, -10.033856391906738, -9.084634780883789, -8.13541316986084, -7.186191558837891, -6.236969947814941, -5.287747859954834, -4.338526248931885, -3.3893046379089355, -2.440082550048828, -1.490860939025879, -0.5416412353515625, 0.40758049488067627, 1.356802225112915, 2.3060240745544434, 3.2552456855773926, 4.204467296600342, 5.153689384460449, 6.102910995483398, 7.052132606506348, 8.001354217529297, 8.950575828552246, 9.899797439575195, 10.849020004272461, 11.798240661621094, 12.74746322631836, 13.696684837341309, 14.645906448364258, 15.595128059387207, 16.544349670410156, 17.493572235107422, 18.442792892456055, 19.39201545715332, 20.341236114501953, 21.29045867919922, 22.239681243896484, 23.18890380859375, 24.138124465942383, 25.08734703063965, 26.03656768798828, 26.985790252685547, 27.935012817382812, 28.884233474731445, 29.833454132080078]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 5.0, 4.0, 4.0, 15.0, 11.0, 6.0, 10.0, 10.0, 16.0, 19.0, 23.0, 25.0, 24.0, 23.0, 29.0, 33.0, 40.0, 46.0, 37.0, 37.0, 35.0, 31.0, 54.0, 42.0, 32.0, 38.0, 52.0, 27.0, 26.0, 29.0, 32.0, 32.0, 20.0, 21.0, 17.0, 15.0, 19.0, 12.0, 6.0, 16.0, 7.0, 5.0, 6.0, 4.0, 5.0, 5.0, 1.0, 1.0, 0.0, 2.0], "bins": [-28.55113983154297, -27.751279830932617, -26.9514217376709, -26.151561737060547, -25.351701736450195, -24.551841735839844, -23.751983642578125, -22.952123641967773, -22.152263641357422, -21.35240364074707, -20.55254554748535, -19.752685546875, -18.95282554626465, -18.152965545654297, -17.353107452392578, -16.553247451782227, -15.753389358520508, -14.953530311584473, -14.153670310974121, -13.353811264038086, -12.553951263427734, -11.7540922164917, -10.954233169555664, -10.154373168945312, -9.354514122009277, -8.554655075073242, -7.754795074462891, -6.9549360275268555, -6.155076503753662, -5.355216979980469, -4.555357933044434, -3.7554984092712402, -2.955636978149414, -2.1557774543762207, -1.3559181690216064, -0.5560588836669922, 0.24380064010620117, 1.0436601638793945, 1.8435192108154297, 2.643378734588623, 3.4432382583618164, 4.24309778213501, 5.042957305908203, 5.842816352844238, 6.642675876617432, 7.442535400390625, 8.24239444732666, 9.042253494262695, 9.842113494873047, 10.641972541809082, 11.441832542419434, 12.241691589355469, 13.04155158996582, 13.841410636901855, 14.64126968383789, 15.441129684448242, 16.240989685058594, 17.040849685668945, 17.840707778930664, 18.640567779541016, 19.440427780151367, 20.24028778076172, 21.040145874023438, 21.84000587463379, 22.639863967895508]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 3.0, 7.0, 10.0, 13.0, 9.0, 18.0, 41.0, 52.0, 71.0, 83.0, 132.0, 199.0, 297.0, 414.0, 679.0, 865.0, 1272.0, 2054.0, 3028.0, 4681.0, 7695.0, 13574.0, 24786.0, 47261.0, 97937.0, 198105.0, 273028.0, 183596.0, 89266.0, 43351.0, 22585.0, 12655.0, 7388.0, 4597.0, 2841.0, 1916.0, 1269.0, 913.0, 577.0, 371.0, 302.0, 181.0, 131.0, 91.0, 76.0, 48.0, 32.0, 28.0, 15.0, 7.0, 8.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-60.03125, -58.05908203125, -56.0869140625, -54.11474609375, -52.142578125, -50.17041015625, -48.1982421875, -46.22607421875, -44.25390625, -42.28173828125, -40.3095703125, -38.33740234375, -36.365234375, -34.39306640625, -32.4208984375, -30.44873046875, -28.4765625, -26.50439453125, -24.5322265625, -22.56005859375, -20.587890625, -18.61572265625, -16.6435546875, -14.67138671875, -12.69921875, -10.72705078125, -8.7548828125, -6.78271484375, -4.810546875, -2.83837890625, -0.8662109375, 1.10595703125, 3.078125, 5.05029296875, 7.0224609375, 8.99462890625, 10.966796875, 12.93896484375, 14.9111328125, 16.88330078125, 18.85546875, 20.82763671875, 22.7998046875, 24.77197265625, 26.744140625, 28.71630859375, 30.6884765625, 32.66064453125, 34.6328125, 36.60498046875, 38.5771484375, 40.54931640625, 42.521484375, 44.49365234375, 46.4658203125, 48.43798828125, 50.41015625, 52.38232421875, 54.3544921875, 56.32666015625, 58.298828125, 60.27099609375, 62.2431640625, 64.21533203125, 66.1875]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 4.0, 3.0, 6.0, 8.0, 9.0, 10.0, 10.0, 12.0, 12.0, 20.0, 19.0, 13.0, 24.0, 36.0, 23.0, 30.0, 39.0, 38.0, 40.0, 39.0, 38.0, 30.0, 35.0, 37.0, 39.0, 30.0, 52.0, 28.0, 21.0, 38.0, 35.0, 22.0, 30.0, 20.0, 24.0, 19.0, 14.0, 18.0, 12.0, 14.0, 10.0, 13.0, 6.0, 4.0, 6.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0], "bins": [-24.15625, -23.441162109375, -22.72607421875, -22.010986328125, -21.2958984375, -20.580810546875, -19.86572265625, -19.150634765625, -18.435546875, -17.720458984375, -17.00537109375, -16.290283203125, -15.5751953125, -14.860107421875, -14.14501953125, -13.429931640625, -12.71484375, -11.999755859375, -11.28466796875, -10.569580078125, -9.8544921875, -9.139404296875, -8.42431640625, -7.709228515625, -6.994140625, -6.279052734375, -5.56396484375, -4.848876953125, -4.1337890625, -3.418701171875, -2.70361328125, -1.988525390625, -1.2734375, -0.558349609375, 0.15673828125, 0.871826171875, 1.5869140625, 2.302001953125, 3.01708984375, 3.732177734375, 4.447265625, 5.162353515625, 5.87744140625, 6.592529296875, 7.3076171875, 8.022705078125, 8.73779296875, 9.452880859375, 10.16796875, 10.883056640625, 11.59814453125, 12.313232421875, 13.0283203125, 13.743408203125, 14.45849609375, 15.173583984375, 15.888671875, 16.603759765625, 17.31884765625, 18.033935546875, 18.7490234375, 19.464111328125, 20.17919921875, 20.894287109375, 21.609375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 9.0, 2.0, 15.0, 17.0, 14.0, 32.0, 45.0, 73.0, 97.0, 157.0, 204.0, 264.0, 413.0, 596.0, 846.0, 1253.0, 1993.0, 3015.0, 4755.0, 7595.0, 12534.0, 21581.0, 39584.0, 76861.0, 163024.0, 285937.0, 210797.0, 100196.0, 49580.0, 26749.0, 15064.0, 9198.0, 5535.0, 3489.0, 2308.0, 1541.0, 1016.0, 660.0, 446.0, 303.0, 232.0, 176.0, 109.0, 72.0, 61.0, 36.0, 25.0, 16.0, 17.0, 7.0, 3.0, 4.0, 4.0, 3.0, 3.0, 3.0], "bins": [-63.34375, -61.462890625, -59.58203125, -57.701171875, -55.8203125, -53.939453125, -52.05859375, -50.177734375, -48.296875, -46.416015625, -44.53515625, -42.654296875, -40.7734375, -38.892578125, -37.01171875, -35.130859375, -33.25, -31.369140625, -29.48828125, -27.607421875, -25.7265625, -23.845703125, -21.96484375, -20.083984375, -18.203125, -16.322265625, -14.44140625, -12.560546875, -10.6796875, -8.798828125, -6.91796875, -5.037109375, -3.15625, -1.275390625, 0.60546875, 2.486328125, 4.3671875, 6.248046875, 8.12890625, 10.009765625, 11.890625, 13.771484375, 15.65234375, 17.533203125, 19.4140625, 21.294921875, 23.17578125, 25.056640625, 26.9375, 28.818359375, 30.69921875, 32.580078125, 34.4609375, 36.341796875, 38.22265625, 40.103515625, 41.984375, 43.865234375, 45.74609375, 47.626953125, 49.5078125, 51.388671875, 53.26953125, 55.150390625, 57.03125]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 9.0, 3.0, 9.0, 7.0, 10.0, 7.0, 12.0, 15.0, 17.0, 21.0, 22.0, 32.0, 43.0, 32.0, 38.0, 45.0, 40.0, 40.0, 49.0, 43.0, 51.0, 38.0, 29.0, 40.0, 42.0, 42.0, 31.0, 39.0, 40.0, 26.0, 22.0, 22.0, 15.0, 14.0, 13.0, 11.0, 6.0, 10.0, 3.0, 4.0, 4.0, 3.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.9375, -16.3681640625, -15.798828125, -15.2294921875, -14.66015625, -14.0908203125, -13.521484375, -12.9521484375, -12.3828125, -11.8134765625, -11.244140625, -10.6748046875, -10.10546875, -9.5361328125, -8.966796875, -8.3974609375, -7.828125, -7.2587890625, -6.689453125, -6.1201171875, -5.55078125, -4.9814453125, -4.412109375, -3.8427734375, -3.2734375, -2.7041015625, -2.134765625, -1.5654296875, -0.99609375, -0.4267578125, 0.142578125, 0.7119140625, 1.28125, 1.8505859375, 2.419921875, 2.9892578125, 3.55859375, 4.1279296875, 4.697265625, 5.2666015625, 5.8359375, 6.4052734375, 6.974609375, 7.5439453125, 8.11328125, 8.6826171875, 9.251953125, 9.8212890625, 10.390625, 10.9599609375, 11.529296875, 12.0986328125, 12.66796875, 13.2373046875, 13.806640625, 14.3759765625, 14.9453125, 15.5146484375, 16.083984375, 16.6533203125, 17.22265625, 17.7919921875, 18.361328125, 18.9306640625, 19.5]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 7.0, 4.0, 11.0, 16.0, 19.0, 21.0, 26.0, 34.0, 59.0, 69.0, 125.0, 153.0, 279.0, 390.0, 616.0, 999.0, 1652.0, 3041.0, 6175.0, 15705.0, 60387.0, 432051.0, 436369.0, 60952.0, 15756.0, 6010.0, 3127.0, 1674.0, 986.0, 617.0, 394.0, 280.0, 169.0, 111.0, 88.0, 50.0, 41.0, 34.0, 23.0, 14.0, 10.0, 8.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-85.875, -83.0126953125, -80.150390625, -77.2880859375, -74.42578125, -71.5634765625, -68.701171875, -65.8388671875, -62.9765625, -60.1142578125, -57.251953125, -54.3896484375, -51.52734375, -48.6650390625, -45.802734375, -42.9404296875, -40.078125, -37.2158203125, -34.353515625, -31.4912109375, -28.62890625, -25.7666015625, -22.904296875, -20.0419921875, -17.1796875, -14.3173828125, -11.455078125, -8.5927734375, -5.73046875, -2.8681640625, -0.005859375, 2.8564453125, 5.71875, 8.5810546875, 11.443359375, 14.3056640625, 17.16796875, 20.0302734375, 22.892578125, 25.7548828125, 28.6171875, 31.4794921875, 34.341796875, 37.2041015625, 40.06640625, 42.9287109375, 45.791015625, 48.6533203125, 51.515625, 54.3779296875, 57.240234375, 60.1025390625, 62.96484375, 65.8271484375, 68.689453125, 71.5517578125, 74.4140625, 77.2763671875, 80.138671875, 83.0009765625, 85.86328125, 88.7255859375, 91.587890625, 94.4501953125, 97.3125]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 6.0, 9.0, 17.0, 20.0, 33.0, 81.0, 232.0, 302.0, 144.0, 62.0, 24.0, 13.0, 9.0, 4.0, 6.0, 5.0, 4.0, 4.0, 0.0, 4.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.0084228515625, -0.008208394050598145, -0.007993936538696289, -0.007779479026794434, -0.007565021514892578, -0.007350564002990723, -0.007136106491088867, -0.006921648979187012, -0.006707191467285156, -0.006492733955383301, -0.006278276443481445, -0.00606381893157959, -0.005849361419677734, -0.005634903907775879, -0.0054204463958740234, -0.005205988883972168, -0.0049915313720703125, -0.004777073860168457, -0.0045626163482666016, -0.004348158836364746, -0.004133701324462891, -0.003919243812561035, -0.0037047863006591797, -0.0034903287887573242, -0.0032758712768554688, -0.0030614137649536133, -0.002846956253051758, -0.0026324987411499023, -0.002418041229248047, -0.0022035837173461914, -0.001989126205444336, -0.0017746686935424805, -0.001560211181640625, -0.0013457536697387695, -0.001131296157836914, -0.0009168386459350586, -0.0007023811340332031, -0.00048792362213134766, -0.0002734661102294922, -5.900859832763672e-05, 0.00015544891357421875, 0.0003699064254760742, 0.0005843639373779297, 0.0007988214492797852, 0.0010132789611816406, 0.001227736473083496, 0.0014421939849853516, 0.001656651496887207, 0.0018711090087890625, 0.002085566520690918, 0.0023000240325927734, 0.002514481544494629, 0.0027289390563964844, 0.00294339656829834, 0.0031578540802001953, 0.0033723115921020508, 0.0035867691040039062, 0.0038012266159057617, 0.004015684127807617, 0.004230141639709473, 0.004444599151611328, 0.004659056663513184, 0.004873514175415039, 0.0050879716873168945, 0.00530242919921875]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.weight": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 3.0, 0.0, 5.0, 6.0, 8.0, 12.0, 10.0, 21.0, 33.0, 34.0, 61.0, 70.0, 104.0, 130.0, 204.0, 288.0, 410.0, 613.0, 871.0, 1224.0, 1788.0, 2785.0, 4953.0, 10121.0, 26568.0, 94503.0, 375928.0, 381259.0, 95439.0, 27164.0, 10237.0, 5052.0, 2842.0, 1755.0, 1227.0, 851.0, 572.0, 372.0, 289.0, 231.0, 137.0, 106.0, 79.0, 43.0, 43.0, 41.0, 21.0, 13.0, 15.0, 9.0, 1.0, 6.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-60.1875, -58.181640625, -56.17578125, -54.169921875, -52.1640625, -50.158203125, -48.15234375, -46.146484375, -44.140625, -42.134765625, -40.12890625, -38.123046875, -36.1171875, -34.111328125, -32.10546875, -30.099609375, -28.09375, -26.087890625, -24.08203125, -22.076171875, -20.0703125, -18.064453125, -16.05859375, -14.052734375, -12.046875, -10.041015625, -8.03515625, -6.029296875, -4.0234375, -2.017578125, -0.01171875, 1.994140625, 4.0, 6.005859375, 8.01171875, 10.017578125, 12.0234375, 14.029296875, 16.03515625, 18.041015625, 20.046875, 22.052734375, 24.05859375, 26.064453125, 28.0703125, 30.076171875, 32.08203125, 34.087890625, 36.09375, 38.099609375, 40.10546875, 42.111328125, 44.1171875, 46.123046875, 48.12890625, 50.134765625, 52.140625, 54.146484375, 56.15234375, 58.158203125, 60.1640625, 62.169921875, 64.17578125, 66.181640625, 68.1875]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 4.0, 5.0, 3.0, 11.0, 12.0, 5.0, 34.0, 26.0, 30.0, 32.0, 58.0, 61.0, 68.0, 77.0, 77.0, 70.0, 66.0, 76.0, 59.0, 49.0, 36.0, 31.0, 22.0, 21.0, 11.0, 10.0, 12.0, 9.0, 2.0, 3.0, 2.0, 4.0, 6.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.53125, -11.16064453125, -10.7900390625, -10.41943359375, -10.048828125, -9.67822265625, -9.3076171875, -8.93701171875, -8.56640625, -8.19580078125, -7.8251953125, -7.45458984375, -7.083984375, -6.71337890625, -6.3427734375, -5.97216796875, -5.6015625, -5.23095703125, -4.8603515625, -4.48974609375, -4.119140625, -3.74853515625, -3.3779296875, -3.00732421875, -2.63671875, -2.26611328125, -1.8955078125, -1.52490234375, -1.154296875, -0.78369140625, -0.4130859375, -0.04248046875, 0.328125, 0.69873046875, 1.0693359375, 1.43994140625, 1.810546875, 2.18115234375, 2.5517578125, 2.92236328125, 3.29296875, 3.66357421875, 4.0341796875, 4.40478515625, 4.775390625, 5.14599609375, 5.5166015625, 5.88720703125, 6.2578125, 6.62841796875, 6.9990234375, 7.36962890625, 7.740234375, 8.11083984375, 8.4814453125, 8.85205078125, 9.22265625, 9.59326171875, 9.9638671875, 10.33447265625, 10.705078125, 11.07568359375, 11.4462890625, 11.81689453125, 12.1875]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 6.0, 2.0, 5.0, 6.0, 7.0, 15.0, 16.0, 20.0, 20.0, 25.0, 29.0, 32.0, 29.0, 48.0, 52.0, 47.0, 77.0, 64.0, 60.0, 73.0, 57.0, 49.0, 40.0, 46.0, 35.0, 33.0, 27.0, 19.0, 13.0, 16.0, 10.0, 5.0, 3.0, 4.0, 7.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.922874450683594, -26.953081130981445, -25.98328971862793, -25.01349639892578, -24.043704986572266, -23.073911666870117, -22.10411834716797, -21.134326934814453, -20.164533615112305, -19.194740295410156, -18.22494888305664, -17.255155563354492, -16.285364151000977, -15.315570831298828, -14.345778465270996, -13.375986099243164, -12.406193733215332, -11.4364013671875, -10.466609001159668, -9.496816635131836, -8.527023315429688, -7.5572309494018555, -6.587438583374023, -5.617645740509033, -4.647853374481201, -3.67806077003479, -2.708268165588379, -1.7384757995605469, -0.7686831951141357, 0.2011094093322754, 1.1709017753601074, 2.1406946182250977, 3.1104869842529297, 4.080279350280762, 5.050072193145752, 6.019864559173584, 6.989657402038574, 7.959449768066406, 8.929242134094238, 9.89903450012207, 10.868827819824219, 11.83862018585205, 12.808412551879883, 13.778205871582031, 14.747998237609863, 15.717790603637695, 16.687583923339844, 17.65737533569336, 18.627166748046875, 19.596960067749023, 20.56675148010254, 21.536544799804688, 22.506336212158203, 23.47612953186035, 24.4459228515625, 25.415714263916016, 26.385507583618164, 27.355300903320312, 28.325092315673828, 29.294885635375977, 30.264677047729492, 31.23447036743164, 32.204261779785156, 33.17405700683594, 34.14384841918945]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 2.0, 2.0, 5.0, 7.0, 4.0, 6.0, 11.0, 7.0, 9.0, 12.0, 16.0, 10.0, 19.0, 14.0, 23.0, 41.0, 19.0, 30.0, 37.0, 39.0, 24.0, 36.0, 37.0, 33.0, 45.0, 36.0, 35.0, 33.0, 32.0, 44.0, 38.0, 37.0, 36.0, 27.0, 22.0, 29.0, 13.0, 28.0, 17.0, 11.0, 13.0, 11.0, 13.0, 12.0, 6.0, 6.0, 10.0, 4.0, 1.0, 2.0, 1.0, 2.0, 3.0], "bins": [-25.787109375, -25.07587242126465, -24.364633560180664, -23.653396606445312, -22.94215965270996, -22.230920791625977, -21.519683837890625, -20.80844497680664, -20.09720802307129, -19.385971069335938, -18.674732208251953, -17.9634952545166, -17.25225830078125, -16.541019439697266, -15.829782485961914, -15.118544578552246, -14.407307624816895, -13.696069717407227, -12.984832763671875, -12.273594856262207, -11.562356948852539, -10.851119995117188, -10.13988208770752, -9.428644180297852, -8.7174072265625, -8.006169319152832, -7.294931888580322, -6.5836944580078125, -5.8724565505981445, -5.161219120025635, -4.449981689453125, -3.738743782043457, -3.027505874633789, -2.3162682056427, -1.6050306558609009, -0.8937931060791016, -0.1825554370880127, 0.5286822319030762, 1.239919662475586, 1.951157569885254, 2.6623950004577637, 3.3736326694488525, 4.084870338439941, 4.796107769012451, 5.507345199584961, 6.218583106994629, 6.929820537567139, 7.641058444976807, 8.352295875549316, 9.063533782958984, 9.774770736694336, 10.486008644104004, 11.197246551513672, 11.908483505249023, 12.619721412658691, 13.33095932006836, 14.042196273803711, 14.753434181213379, 15.46467113494873, 16.1759090423584, 16.88714599609375, 17.598384857177734, 18.309621810913086, 19.020858764648438, 19.732097625732422]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 7.0, 10.0, 13.0, 14.0, 31.0, 43.0, 70.0, 102.0, 116.0, 210.0, 361.0, 514.0, 834.0, 1387.0, 2327.0, 3956.0, 6958.0, 11785.0, 21023.0, 37132.0, 62950.0, 99802.0, 142745.0, 169762.0, 162008.0, 124353.0, 82533.0, 49721.0, 28493.0, 16829.0, 9311.0, 5308.0, 3040.0, 1856.0, 1089.0, 641.0, 459.0, 284.0, 138.0, 101.0, 89.0, 49.0, 41.0, 18.0, 18.0, 11.0, 7.0, 5.0, 2.0, 2.0, 1.0, 3.0], "bins": [-33.0, -32.07763671875, -31.1552734375, -30.23291015625, -29.310546875, -28.38818359375, -27.4658203125, -26.54345703125, -25.62109375, -24.69873046875, -23.7763671875, -22.85400390625, -21.931640625, -21.00927734375, -20.0869140625, -19.16455078125, -18.2421875, -17.31982421875, -16.3974609375, -15.47509765625, -14.552734375, -13.63037109375, -12.7080078125, -11.78564453125, -10.86328125, -9.94091796875, -9.0185546875, -8.09619140625, -7.173828125, -6.25146484375, -5.3291015625, -4.40673828125, -3.484375, -2.56201171875, -1.6396484375, -0.71728515625, 0.205078125, 1.12744140625, 2.0498046875, 2.97216796875, 3.89453125, 4.81689453125, 5.7392578125, 6.66162109375, 7.583984375, 8.50634765625, 9.4287109375, 10.35107421875, 11.2734375, 12.19580078125, 13.1181640625, 14.04052734375, 14.962890625, 15.88525390625, 16.8076171875, 17.72998046875, 18.65234375, 19.57470703125, 20.4970703125, 21.41943359375, 22.341796875, 23.26416015625, 24.1865234375, 25.10888671875, 26.03125]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 5.0, 4.0, 3.0, 7.0, 9.0, 3.0, 10.0, 8.0, 11.0, 14.0, 14.0, 20.0, 30.0, 21.0, 28.0, 30.0, 26.0, 32.0, 30.0, 36.0, 30.0, 48.0, 35.0, 38.0, 39.0, 30.0, 53.0, 43.0, 43.0, 30.0, 31.0, 34.0, 30.0, 28.0, 31.0, 15.0, 22.0, 13.0, 11.0, 15.0, 12.0, 5.0, 12.0, 4.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-25.390625, -24.6796875, -23.96875, -23.2578125, -22.546875, -21.8359375, -21.125, -20.4140625, -19.703125, -18.9921875, -18.28125, -17.5703125, -16.859375, -16.1484375, -15.4375, -14.7265625, -14.015625, -13.3046875, -12.59375, -11.8828125, -11.171875, -10.4609375, -9.75, -9.0390625, -8.328125, -7.6171875, -6.90625, -6.1953125, -5.484375, -4.7734375, -4.0625, -3.3515625, -2.640625, -1.9296875, -1.21875, -0.5078125, 0.203125, 0.9140625, 1.625, 2.3359375, 3.046875, 3.7578125, 4.46875, 5.1796875, 5.890625, 6.6015625, 7.3125, 8.0234375, 8.734375, 9.4453125, 10.15625, 10.8671875, 11.578125, 12.2890625, 13.0, 13.7109375, 14.421875, 15.1328125, 15.84375, 16.5546875, 17.265625, 17.9765625, 18.6875, 19.3984375, 20.109375]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 7.0, 10.0, 10.0, 18.0, 40.0, 81.0, 91.0, 174.0, 220.0, 383.0, 618.0, 956.0, 1554.0, 2523.0, 4213.0, 6838.0, 11266.0, 18137.0, 29202.0, 45698.0, 69260.0, 98215.0, 127179.0, 143438.0, 137474.0, 113980.0, 83452.0, 57179.0, 36626.0, 23178.0, 14213.0, 8544.0, 5383.0, 3153.0, 1998.0, 1180.0, 781.0, 520.0, 283.0, 166.0, 137.0, 78.0, 44.0, 26.0, 15.0, 11.0, 7.0, 5.0, 1.0, 1.0, 3.0], "bins": [-25.6875, -24.988525390625, -24.28955078125, -23.590576171875, -22.8916015625, -22.192626953125, -21.49365234375, -20.794677734375, -20.095703125, -19.396728515625, -18.69775390625, -17.998779296875, -17.2998046875, -16.600830078125, -15.90185546875, -15.202880859375, -14.50390625, -13.804931640625, -13.10595703125, -12.406982421875, -11.7080078125, -11.009033203125, -10.31005859375, -9.611083984375, -8.912109375, -8.213134765625, -7.51416015625, -6.815185546875, -6.1162109375, -5.417236328125, -4.71826171875, -4.019287109375, -3.3203125, -2.621337890625, -1.92236328125, -1.223388671875, -0.5244140625, 0.174560546875, 0.87353515625, 1.572509765625, 2.271484375, 2.970458984375, 3.66943359375, 4.368408203125, 5.0673828125, 5.766357421875, 6.46533203125, 7.164306640625, 7.86328125, 8.562255859375, 9.26123046875, 9.960205078125, 10.6591796875, 11.358154296875, 12.05712890625, 12.756103515625, 13.455078125, 14.154052734375, 14.85302734375, 15.552001953125, 16.2509765625, 16.949951171875, 17.64892578125, 18.347900390625, 19.046875]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 1.0, 3.0, 4.0, 5.0, 8.0, 7.0, 7.0, 8.0, 11.0, 11.0, 26.0, 18.0, 17.0, 21.0, 24.0, 28.0, 27.0, 36.0, 46.0, 41.0, 44.0, 31.0, 37.0, 31.0, 48.0, 38.0, 34.0, 34.0, 38.0, 33.0, 25.0, 31.0, 30.0, 27.0, 18.0, 27.0, 17.0, 19.0, 9.0, 15.0, 15.0, 6.0, 8.0, 13.0, 10.0, 8.0, 7.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.84375, -12.4027099609375, -11.961669921875, -11.5206298828125, -11.07958984375, -10.6385498046875, -10.197509765625, -9.7564697265625, -9.3154296875, -8.8743896484375, -8.433349609375, -7.9923095703125, -7.55126953125, -7.1102294921875, -6.669189453125, -6.2281494140625, -5.787109375, -5.3460693359375, -4.905029296875, -4.4639892578125, -4.02294921875, -3.5819091796875, -3.140869140625, -2.6998291015625, -2.2587890625, -1.8177490234375, -1.376708984375, -0.9356689453125, -0.49462890625, -0.0535888671875, 0.387451171875, 0.8284912109375, 1.26953125, 1.7105712890625, 2.151611328125, 2.5926513671875, 3.03369140625, 3.4747314453125, 3.915771484375, 4.3568115234375, 4.7978515625, 5.2388916015625, 5.679931640625, 6.1209716796875, 6.56201171875, 7.0030517578125, 7.444091796875, 7.8851318359375, 8.326171875, 8.7672119140625, 9.208251953125, 9.6492919921875, 10.09033203125, 10.5313720703125, 10.972412109375, 11.4134521484375, 11.8544921875, 12.2955322265625, 12.736572265625, 13.1776123046875, 13.61865234375, 14.0596923828125, 14.500732421875, 14.9417724609375, 15.3828125]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 7.0, 5.0, 6.0, 15.0, 17.0, 28.0, 28.0, 44.0, 64.0, 96.0, 139.0, 152.0, 220.0, 319.0, 496.0, 637.0, 997.0, 1487.0, 2414.0, 4405.0, 9227.0, 22068.0, 66965.0, 217993.0, 410293.0, 206302.0, 62876.0, 21222.0, 8804.0, 4264.0, 2349.0, 1396.0, 971.0, 591.0, 456.0, 334.0, 265.0, 149.0, 132.0, 78.0, 79.0, 49.0, 30.0, 38.0, 19.0, 10.0, 7.0, 4.0, 5.0, 2.0, 1.0, 4.0, 1.0, 3.0], "bins": [-57.03125, -55.376953125, -53.72265625, -52.068359375, -50.4140625, -48.759765625, -47.10546875, -45.451171875, -43.796875, -42.142578125, -40.48828125, -38.833984375, -37.1796875, -35.525390625, -33.87109375, -32.216796875, -30.5625, -28.908203125, -27.25390625, -25.599609375, -23.9453125, -22.291015625, -20.63671875, -18.982421875, -17.328125, -15.673828125, -14.01953125, -12.365234375, -10.7109375, -9.056640625, -7.40234375, -5.748046875, -4.09375, -2.439453125, -0.78515625, 0.869140625, 2.5234375, 4.177734375, 5.83203125, 7.486328125, 9.140625, 10.794921875, 12.44921875, 14.103515625, 15.7578125, 17.412109375, 19.06640625, 20.720703125, 22.375, 24.029296875, 25.68359375, 27.337890625, 28.9921875, 30.646484375, 32.30078125, 33.955078125, 35.609375, 37.263671875, 38.91796875, 40.572265625, 42.2265625, 43.880859375, 45.53515625, 47.189453125, 48.84375]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 2.0, 4.0, 7.0, 7.0, 11.0, 15.0, 19.0, 34.0, 37.0, 62.0, 73.0, 84.0, 94.0, 99.0, 90.0, 83.0, 63.0, 52.0, 47.0, 33.0, 26.0, 16.0, 10.0, 10.0, 5.0, 6.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0036869049072265625, -0.003576606512069702, -0.003466308116912842, -0.0033560097217559814, -0.003245711326599121, -0.0031354129314422607, -0.0030251145362854004, -0.00291481614112854, -0.0028045177459716797, -0.0026942193508148193, -0.002583920955657959, -0.0024736225605010986, -0.0023633241653442383, -0.002253025770187378, -0.0021427273750305176, -0.0020324289798736572, -0.0019221305847167969, -0.0018118321895599365, -0.0017015337944030762, -0.0015912353992462158, -0.0014809370040893555, -0.0013706386089324951, -0.0012603402137756348, -0.0011500418186187744, -0.001039743423461914, -0.0009294450283050537, -0.0008191466331481934, -0.000708848237991333, -0.0005985498428344727, -0.0004882514476776123, -0.00037795305252075195, -0.0002676546573638916, -0.00015735626220703125, -4.70578670501709e-05, 6.324052810668945e-05, 0.0001735389232635498, 0.00028383731842041016, 0.0003941357135772705, 0.0005044341087341309, 0.0006147325038909912, 0.0007250308990478516, 0.0008353292942047119, 0.0009456276893615723, 0.0010559260845184326, 0.001166224479675293, 0.0012765228748321533, 0.0013868212699890137, 0.001497119665145874, 0.0016074180603027344, 0.0017177164554595947, 0.001828014850616455, 0.0019383132457733154, 0.0020486116409301758, 0.002158910036087036, 0.0022692084312438965, 0.002379506826400757, 0.002489805221557617, 0.0026001036167144775, 0.002710402011871338, 0.0028207004070281982, 0.0029309988021850586, 0.003041297197341919, 0.0031515955924987793, 0.0032618939876556396, 0.0033721923828125]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 4.0, 11.0, 15.0, 21.0, 23.0, 34.0, 54.0, 85.0, 131.0, 175.0, 302.0, 428.0, 661.0, 1019.0, 1646.0, 2697.0, 4359.0, 7713.0, 13910.0, 26410.0, 56292.0, 124276.0, 233723.0, 263259.0, 161237.0, 74879.0, 34596.0, 17305.0, 9327.0, 5365.0, 3236.0, 1911.0, 1204.0, 762.0, 478.0, 319.0, 237.0, 136.0, 90.0, 66.0, 42.0, 36.0, 31.0, 17.0, 7.0, 9.0, 5.0, 5.0, 4.0, 2.0, 0.0, 1.0, 2.0, 2.0], "bins": [-32.09375, -31.12646484375, -30.1591796875, -29.19189453125, -28.224609375, -27.25732421875, -26.2900390625, -25.32275390625, -24.35546875, -23.38818359375, -22.4208984375, -21.45361328125, -20.486328125, -19.51904296875, -18.5517578125, -17.58447265625, -16.6171875, -15.64990234375, -14.6826171875, -13.71533203125, -12.748046875, -11.78076171875, -10.8134765625, -9.84619140625, -8.87890625, -7.91162109375, -6.9443359375, -5.97705078125, -5.009765625, -4.04248046875, -3.0751953125, -2.10791015625, -1.140625, -0.17333984375, 0.7939453125, 1.76123046875, 2.728515625, 3.69580078125, 4.6630859375, 5.63037109375, 6.59765625, 7.56494140625, 8.5322265625, 9.49951171875, 10.466796875, 11.43408203125, 12.4013671875, 13.36865234375, 14.3359375, 15.30322265625, 16.2705078125, 17.23779296875, 18.205078125, 19.17236328125, 20.1396484375, 21.10693359375, 22.07421875, 23.04150390625, 24.0087890625, 24.97607421875, 25.943359375, 26.91064453125, 27.8779296875, 28.84521484375, 29.8125]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 1.0, 4.0, 3.0, 9.0, 6.0, 4.0, 11.0, 19.0, 20.0, 37.0, 31.0, 59.0, 66.0, 79.0, 92.0, 93.0, 108.0, 99.0, 72.0, 52.0, 44.0, 19.0, 23.0, 13.0, 14.0, 9.0, 3.0, 5.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.1953125, -12.7789306640625, -12.362548828125, -11.9461669921875, -11.52978515625, -11.1134033203125, -10.697021484375, -10.2806396484375, -9.8642578125, -9.4478759765625, -9.031494140625, -8.6151123046875, -8.19873046875, -7.7823486328125, -7.365966796875, -6.9495849609375, -6.533203125, -6.1168212890625, -5.700439453125, -5.2840576171875, -4.86767578125, -4.4512939453125, -4.034912109375, -3.6185302734375, -3.2021484375, -2.7857666015625, -2.369384765625, -1.9530029296875, -1.53662109375, -1.1202392578125, -0.703857421875, -0.2874755859375, 0.12890625, 0.5452880859375, 0.961669921875, 1.3780517578125, 1.79443359375, 2.2108154296875, 2.627197265625, 3.0435791015625, 3.4599609375, 3.8763427734375, 4.292724609375, 4.7091064453125, 5.12548828125, 5.5418701171875, 5.958251953125, 6.3746337890625, 6.791015625, 7.2073974609375, 7.623779296875, 8.0401611328125, 8.45654296875, 8.8729248046875, 9.289306640625, 9.7056884765625, 10.1220703125, 10.5384521484375, 10.954833984375, 11.3712158203125, 11.78759765625, 12.2039794921875, 12.620361328125, 13.0367431640625, 13.453125]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 7.0, 4.0, 8.0, 4.0, 15.0, 11.0, 18.0, 18.0, 17.0, 22.0, 30.0, 36.0, 43.0, 46.0, 54.0, 54.0, 60.0, 56.0, 58.0, 61.0, 55.0, 53.0, 53.0, 33.0, 34.0, 27.0, 26.0, 21.0, 16.0, 16.0, 15.0, 8.0, 5.0, 6.0, 7.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.70570182800293, -27.76563262939453, -26.825563430786133, -25.885494232177734, -24.94542694091797, -24.00535774230957, -23.065288543701172, -22.125219345092773, -21.185150146484375, -20.245080947875977, -19.305011749267578, -18.364944458007812, -17.424875259399414, -16.484806060791016, -15.544736862182617, -14.604667663574219, -13.664599418640137, -12.724530220031738, -11.784461975097656, -10.844392776489258, -9.90432357788086, -8.964254379272461, -8.024186134338379, -7.0841169357299805, -6.14404821395874, -5.2039794921875, -4.263910293579102, -3.3238415718078613, -2.383772611618042, -1.4437036514282227, -0.5036349296569824, 0.436434268951416, 1.3765029907226562, 2.3165719509124756, 3.256640911102295, 4.196709632873535, 5.136778831481934, 6.076847553253174, 7.016916275024414, 7.9569854736328125, 8.897054672241211, 9.83712387084961, 10.777192115783691, 11.71726131439209, 12.657330513000488, 13.59739875793457, 14.537467956542969, 15.477537155151367, 16.417606353759766, 17.357675552368164, 18.297744750976562, 19.237812042236328, 20.177881240844727, 21.117950439453125, 22.058019638061523, 22.998088836669922, 23.938156127929688, 24.878225326538086, 25.818294525146484, 26.75836181640625, 27.69843101501465, 28.638500213623047, 29.578569412231445, 30.518638610839844, 31.458707809448242]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 1.0, 1.0, 4.0, 8.0, 5.0, 8.0, 12.0, 10.0, 13.0, 9.0, 16.0, 17.0, 27.0, 27.0, 26.0, 32.0, 32.0, 30.0, 40.0, 41.0, 34.0, 30.0, 50.0, 37.0, 37.0, 46.0, 42.0, 31.0, 39.0, 43.0, 34.0, 26.0, 28.0, 32.0, 14.0, 21.0, 17.0, 11.0, 12.0, 11.0, 12.0, 7.0, 8.0, 6.0, 5.0, 6.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.769573211669922, -24.033735275268555, -23.297897338867188, -22.56205940246582, -21.826221466064453, -21.090381622314453, -20.354543685913086, -19.61870574951172, -18.88286781311035, -18.147029876708984, -17.411191940307617, -16.67535400390625, -15.939515113830566, -15.2036771774292, -14.467838287353516, -13.732000350952148, -12.996162414550781, -12.260324478149414, -11.524486541748047, -10.788647651672363, -10.052809715270996, -9.316971778869629, -8.581132888793945, -7.845294952392578, -7.109457015991211, -6.373619079589844, -5.637780666351318, -4.901942253112793, -4.166104316711426, -3.4302661418914795, -2.694427967071533, -1.9585895538330078, -1.2227535247802734, -0.48691534996032715, 0.24892282485961914, 0.9847609996795654, 1.7205991744995117, 2.456437349319458, 3.1922755241394043, 3.9281139373779297, 4.663951873779297, 5.399789810180664, 6.1356282234191895, 6.871466636657715, 7.607304573059082, 8.34314250946045, 9.078981399536133, 9.8148193359375, 10.550657272338867, 11.286495208740234, 12.022333145141602, 12.758172035217285, 13.494009971618652, 14.22984790802002, 14.965686798095703, 15.70152473449707, 16.437362670898438, 17.173200607299805, 17.909038543701172, 18.64487648010254, 19.380714416503906, 20.116554260253906, 20.852392196655273, 21.58823013305664, 22.324068069458008]}, "gradients/decoder.bert.encoder.layer.19.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 4.0, 6.0, 11.0, 12.0, 18.0, 28.0, 42.0, 61.0, 89.0, 114.0, 199.0, 334.0, 493.0, 808.0, 1243.0, 2136.0, 3370.0, 5829.0, 10019.0, 17687.0, 31386.0, 57786.0, 108282.0, 202119.0, 373146.0, 625151.0, 826894.0, 765347.0, 514554.0, 294201.0, 159025.0, 85112.0, 45964.0, 26140.0, 14689.0, 8604.0, 5110.0, 3079.0, 1937.0, 1106.0, 724.0, 515.0, 316.0, 218.0, 144.0, 84.0, 44.0, 43.0, 23.0, 15.0, 7.0, 11.0, 5.0, 1.0, 6.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-21.65625, -20.953125, -20.25, -19.546875, -18.84375, -18.140625, -17.4375, -16.734375, -16.03125, -15.328125, -14.625, -13.921875, -13.21875, -12.515625, -11.8125, -11.109375, -10.40625, -9.703125, -9.0, -8.296875, -7.59375, -6.890625, -6.1875, -5.484375, -4.78125, -4.078125, -3.375, -2.671875, -1.96875, -1.265625, -0.5625, 0.140625, 0.84375, 1.546875, 2.25, 2.953125, 3.65625, 4.359375, 5.0625, 5.765625, 6.46875, 7.171875, 7.875, 8.578125, 9.28125, 9.984375, 10.6875, 11.390625, 12.09375, 12.796875, 13.5, 14.203125, 14.90625, 15.609375, 16.3125, 17.015625, 17.71875, 18.421875, 19.125, 19.828125, 20.53125, 21.234375, 21.9375, 22.640625, 23.34375]}, "gradients/decoder.bert.encoder.layer.19.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 3.0, 7.0, 4.0, 9.0, 10.0, 11.0, 12.0, 16.0, 14.0, 20.0, 35.0, 26.0, 29.0, 30.0, 31.0, 41.0, 37.0, 47.0, 39.0, 48.0, 37.0, 38.0, 46.0, 36.0, 37.0, 39.0, 32.0, 37.0, 35.0, 21.0, 22.0, 27.0, 16.0, 17.0, 17.0, 16.0, 14.0, 11.0, 8.0, 4.0, 7.0, 3.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.734375, -15.25, -14.765625, -14.28125, -13.796875, -13.3125, -12.828125, -12.34375, -11.859375, -11.375, -10.890625, -10.40625, -9.921875, -9.4375, -8.953125, -8.46875, -7.984375, -7.5, -7.015625, -6.53125, -6.046875, -5.5625, -5.078125, -4.59375, -4.109375, -3.625, -3.140625, -2.65625, -2.171875, -1.6875, -1.203125, -0.71875, -0.234375, 0.25, 0.734375, 1.21875, 1.703125, 2.1875, 2.671875, 3.15625, 3.640625, 4.125, 4.609375, 5.09375, 5.578125, 6.0625, 6.546875, 7.03125, 7.515625, 8.0, 8.484375, 8.96875, 9.453125, 9.9375, 10.421875, 10.90625, 11.390625, 11.875, 12.359375, 12.84375, 13.328125, 13.8125, 14.296875, 14.78125, 15.265625]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 10.0, 12.0, 14.0, 24.0, 32.0, 61.0, 117.0, 163.0, 266.0, 423.0, 730.0, 1143.0, 1896.0, 3031.0, 5355.0, 9492.0, 16601.0, 29927.0, 55296.0, 100922.0, 183762.0, 323873.0, 522229.0, 716386.0, 752972.0, 592190.0, 382370.0, 221660.0, 122442.0, 66844.0, 36801.0, 20136.0, 11406.0, 6348.0, 3761.0, 2151.0, 1303.0, 805.0, 502.0, 307.0, 208.0, 108.0, 60.0, 55.0, 27.0, 28.0, 21.0, 5.0, 4.0, 8.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.984375, -19.32177734375, -18.6591796875, -17.99658203125, -17.333984375, -16.67138671875, -16.0087890625, -15.34619140625, -14.68359375, -14.02099609375, -13.3583984375, -12.69580078125, -12.033203125, -11.37060546875, -10.7080078125, -10.04541015625, -9.3828125, -8.72021484375, -8.0576171875, -7.39501953125, -6.732421875, -6.06982421875, -5.4072265625, -4.74462890625, -4.08203125, -3.41943359375, -2.7568359375, -2.09423828125, -1.431640625, -0.76904296875, -0.1064453125, 0.55615234375, 1.21875, 1.88134765625, 2.5439453125, 3.20654296875, 3.869140625, 4.53173828125, 5.1943359375, 5.85693359375, 6.51953125, 7.18212890625, 7.8447265625, 8.50732421875, 9.169921875, 9.83251953125, 10.4951171875, 11.15771484375, 11.8203125, 12.48291015625, 13.1455078125, 13.80810546875, 14.470703125, 15.13330078125, 15.7958984375, 16.45849609375, 17.12109375, 17.78369140625, 18.4462890625, 19.10888671875, 19.771484375, 20.43408203125, 21.0966796875, 21.75927734375, 22.421875]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 11.0, 12.0, 9.0, 12.0, 28.0, 27.0, 31.0, 46.0, 57.0, 74.0, 76.0, 87.0, 122.0, 121.0, 142.0, 173.0, 188.0, 220.0, 225.0, 239.0, 248.0, 221.0, 220.0, 201.0, 188.0, 199.0, 158.0, 123.0, 112.0, 116.0, 75.0, 67.0, 54.0, 41.0, 26.0, 24.0, 18.0, 18.0, 18.0, 15.0, 8.0, 4.0, 10.0, 4.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.58203125, -6.35174560546875, -6.1214599609375, -5.89117431640625, -5.660888671875, -5.43060302734375, -5.2003173828125, -4.97003173828125, -4.73974609375, -4.50946044921875, -4.2791748046875, -4.04888916015625, -3.818603515625, -3.58831787109375, -3.3580322265625, -3.12774658203125, -2.8974609375, -2.66717529296875, -2.4368896484375, -2.20660400390625, -1.976318359375, -1.74603271484375, -1.5157470703125, -1.28546142578125, -1.05517578125, -0.82489013671875, -0.5946044921875, -0.36431884765625, -0.134033203125, 0.09625244140625, 0.3265380859375, 0.55682373046875, 0.787109375, 1.01739501953125, 1.2476806640625, 1.47796630859375, 1.708251953125, 1.93853759765625, 2.1688232421875, 2.39910888671875, 2.62939453125, 2.85968017578125, 3.0899658203125, 3.32025146484375, 3.550537109375, 3.78082275390625, 4.0111083984375, 4.24139404296875, 4.4716796875, 4.70196533203125, 4.9322509765625, 5.16253662109375, 5.392822265625, 5.62310791015625, 5.8533935546875, 6.08367919921875, 6.31396484375, 6.54425048828125, 6.7745361328125, 7.00482177734375, 7.235107421875, 7.46539306640625, 7.6956787109375, 7.92596435546875, 8.15625]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 7.0, 4.0, 6.0, 10.0, 8.0, 12.0, 15.0, 24.0, 27.0, 28.0, 29.0, 32.0, 35.0, 43.0, 43.0, 47.0, 48.0, 45.0, 54.0, 63.0, 42.0, 54.0, 41.0, 39.0, 34.0, 43.0, 31.0, 26.0, 14.0, 25.0, 14.0, 9.0, 7.0, 10.0, 7.0, 6.0, 6.0, 7.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.09479522705078, -21.410888671875, -20.72698211669922, -20.043073654174805, -19.359167098999023, -18.675260543823242, -17.99135398864746, -17.307445526123047, -16.623538970947266, -15.939632415771484, -15.255724906921387, -14.571818351745605, -13.887910842895508, -13.204004287719727, -12.520097732543945, -11.836190223693848, -11.152283668518066, -10.468377113342285, -9.784469604492188, -9.100563049316406, -8.416655540466309, -7.732748985290527, -7.048841953277588, -6.364934921264648, -5.681027889251709, -4.9971208572387695, -4.31321382522583, -3.6293070316314697, -2.9453999996185303, -2.261492967605591, -1.5775861740112305, -0.893679141998291, -0.20977210998535156, 0.4741348624229431, 1.1580418348312378, 1.8419487476348877, 2.525855779647827, 3.2097628116607666, 3.893669605255127, 4.577576637268066, 5.261483669281006, 5.945390701293945, 6.629297733306885, 7.313204765319824, 7.9971113204956055, 8.681018829345703, 9.364925384521484, 10.048831939697266, 10.732739448547363, 11.416646003723145, 12.100553512573242, 12.784460067749023, 13.468367576599121, 14.152274131774902, 14.836181640625, 15.520088195800781, 16.203994750976562, 16.887901306152344, 17.571807861328125, 18.25571632385254, 18.93962287902832, 19.6235294342041, 20.307435989379883, 20.991344451904297, 21.675251007080078]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 5.0, 5.0, 7.0, 8.0, 6.0, 6.0, 3.0, 6.0, 6.0, 12.0, 16.0, 14.0, 16.0, 18.0, 20.0, 33.0, 26.0, 32.0, 32.0, 31.0, 44.0, 38.0, 35.0, 37.0, 34.0, 49.0, 37.0, 35.0, 37.0, 44.0, 47.0, 36.0, 32.0, 28.0, 22.0, 21.0, 18.0, 20.0, 19.0, 14.0, 13.0, 12.0, 6.0, 6.0, 5.0, 5.0, 9.0, 8.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-20.271059036254883, -19.708677291870117, -19.14629364013672, -18.583911895751953, -18.021530151367188, -17.45914649963379, -16.896764755249023, -16.334381103515625, -15.77199935913086, -15.209616661071777, -14.647233963012695, -14.08485221862793, -13.522469520568848, -12.960086822509766, -12.397705078125, -11.835322380065918, -11.272939682006836, -10.710556983947754, -10.148174285888672, -9.585792541503906, -9.023409843444824, -8.461027145385742, -7.898644924163818, -7.3362627029418945, -6.7738800048828125, -6.2114973068237305, -5.649115085601807, -5.086732864379883, -4.524350166320801, -3.961967706680298, -3.399585247039795, -2.837202787399292, -2.274822235107422, -1.712439775466919, -1.150057315826416, -0.5876748561859131, -0.025292396545410156, 0.5370900630950928, 1.0994725227355957, 1.6618549823760986, 2.2242374420166016, 2.7866199016571045, 3.3490023612976074, 3.9113848209381104, 4.473767280578613, 5.036149978637695, 5.598532199859619, 6.160914421081543, 6.723297119140625, 7.285679817199707, 7.848062038421631, 8.410444259643555, 8.972826957702637, 9.535209655761719, 10.097591400146484, 10.659974098205566, 11.222356796264648, 11.78473949432373, 12.347122192382812, 12.909503936767578, 13.47188663482666, 14.034269332885742, 14.596651077270508, 15.15903377532959, 15.721416473388672]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 9.0, 3.0, 11.0, 21.0, 22.0, 50.0, 40.0, 70.0, 119.0, 176.0, 247.0, 375.0, 526.0, 780.0, 1175.0, 1910.0, 2897.0, 4198.0, 6420.0, 10256.0, 16374.0, 27579.0, 48918.0, 90433.0, 158048.0, 215569.0, 189465.0, 117606.0, 64047.0, 35331.0, 20533.0, 12433.0, 7993.0, 4980.0, 3351.0, 2171.0, 1425.0, 1039.0, 643.0, 417.0, 281.0, 215.0, 142.0, 92.0, 60.0, 37.0, 30.0, 14.0, 18.0, 9.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-25.578125, -24.771728515625, -23.96533203125, -23.158935546875, -22.3525390625, -21.546142578125, -20.73974609375, -19.933349609375, -19.126953125, -18.320556640625, -17.51416015625, -16.707763671875, -15.9013671875, -15.094970703125, -14.28857421875, -13.482177734375, -12.67578125, -11.869384765625, -11.06298828125, -10.256591796875, -9.4501953125, -8.643798828125, -7.83740234375, -7.031005859375, -6.224609375, -5.418212890625, -4.61181640625, -3.805419921875, -2.9990234375, -2.192626953125, -1.38623046875, -0.579833984375, 0.2265625, 1.032958984375, 1.83935546875, 2.645751953125, 3.4521484375, 4.258544921875, 5.06494140625, 5.871337890625, 6.677734375, 7.484130859375, 8.29052734375, 9.096923828125, 9.9033203125, 10.709716796875, 11.51611328125, 12.322509765625, 13.12890625, 13.935302734375, 14.74169921875, 15.548095703125, 16.3544921875, 17.160888671875, 17.96728515625, 18.773681640625, 19.580078125, 20.386474609375, 21.19287109375, 21.999267578125, 22.8056640625, 23.612060546875, 24.41845703125, 25.224853515625, 26.03125]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 5.0, 7.0, 1.0, 8.0, 8.0, 15.0, 6.0, 11.0, 19.0, 14.0, 17.0, 21.0, 24.0, 31.0, 33.0, 34.0, 35.0, 44.0, 29.0, 34.0, 29.0, 43.0, 47.0, 41.0, 30.0, 57.0, 46.0, 44.0, 27.0, 28.0, 25.0, 26.0, 27.0, 23.0, 27.0, 17.0, 18.0, 14.0, 4.0, 11.0, 7.0, 8.0, 6.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-21.6875, -21.095458984375, -20.50341796875, -19.911376953125, -19.3193359375, -18.727294921875, -18.13525390625, -17.543212890625, -16.951171875, -16.359130859375, -15.76708984375, -15.175048828125, -14.5830078125, -13.990966796875, -13.39892578125, -12.806884765625, -12.21484375, -11.622802734375, -11.03076171875, -10.438720703125, -9.8466796875, -9.254638671875, -8.66259765625, -8.070556640625, -7.478515625, -6.886474609375, -6.29443359375, -5.702392578125, -5.1103515625, -4.518310546875, -3.92626953125, -3.334228515625, -2.7421875, -2.150146484375, -1.55810546875, -0.966064453125, -0.3740234375, 0.218017578125, 0.81005859375, 1.402099609375, 1.994140625, 2.586181640625, 3.17822265625, 3.770263671875, 4.3623046875, 4.954345703125, 5.54638671875, 6.138427734375, 6.73046875, 7.322509765625, 7.91455078125, 8.506591796875, 9.0986328125, 9.690673828125, 10.28271484375, 10.874755859375, 11.466796875, 12.058837890625, 12.65087890625, 13.242919921875, 13.8349609375, 14.427001953125, 15.01904296875, 15.611083984375, 16.203125]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 7.0, 4.0, 8.0, 8.0, 18.0, 16.0, 26.0, 45.0, 53.0, 65.0, 98.0, 190.0, 216.0, 337.0, 478.0, 730.0, 1154.0, 1826.0, 2965.0, 4973.0, 8891.0, 16845.0, 35536.0, 89553.0, 257811.0, 369230.0, 150090.0, 54517.0, 24012.0, 11909.0, 6525.0, 3832.0, 2287.0, 1485.0, 969.0, 581.0, 419.0, 245.0, 172.0, 136.0, 76.0, 67.0, 50.0, 33.0, 18.0, 21.0, 11.0, 10.0, 4.0, 3.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0], "bins": [-49.65625, -48.16259765625, -46.6689453125, -45.17529296875, -43.681640625, -42.18798828125, -40.6943359375, -39.20068359375, -37.70703125, -36.21337890625, -34.7197265625, -33.22607421875, -31.732421875, -30.23876953125, -28.7451171875, -27.25146484375, -25.7578125, -24.26416015625, -22.7705078125, -21.27685546875, -19.783203125, -18.28955078125, -16.7958984375, -15.30224609375, -13.80859375, -12.31494140625, -10.8212890625, -9.32763671875, -7.833984375, -6.34033203125, -4.8466796875, -3.35302734375, -1.859375, -0.36572265625, 1.1279296875, 2.62158203125, 4.115234375, 5.60888671875, 7.1025390625, 8.59619140625, 10.08984375, 11.58349609375, 13.0771484375, 14.57080078125, 16.064453125, 17.55810546875, 19.0517578125, 20.54541015625, 22.0390625, 23.53271484375, 25.0263671875, 26.52001953125, 28.013671875, 29.50732421875, 31.0009765625, 32.49462890625, 33.98828125, 35.48193359375, 36.9755859375, 38.46923828125, 39.962890625, 41.45654296875, 42.9501953125, 44.44384765625, 45.9375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 6.0, 8.0, 13.0, 4.0, 5.0, 10.0, 8.0, 16.0, 12.0, 26.0, 23.0, 17.0, 33.0, 33.0, 27.0, 38.0, 42.0, 38.0, 43.0, 32.0, 40.0, 45.0, 46.0, 55.0, 31.0, 36.0, 46.0, 36.0, 41.0, 32.0, 30.0, 22.0, 17.0, 20.0, 26.0, 7.0, 10.0, 5.0, 7.0, 8.0, 4.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-12.21875, -11.81591796875, -11.4130859375, -11.01025390625, -10.607421875, -10.20458984375, -9.8017578125, -9.39892578125, -8.99609375, -8.59326171875, -8.1904296875, -7.78759765625, -7.384765625, -6.98193359375, -6.5791015625, -6.17626953125, -5.7734375, -5.37060546875, -4.9677734375, -4.56494140625, -4.162109375, -3.75927734375, -3.3564453125, -2.95361328125, -2.55078125, -2.14794921875, -1.7451171875, -1.34228515625, -0.939453125, -0.53662109375, -0.1337890625, 0.26904296875, 0.671875, 1.07470703125, 1.4775390625, 1.88037109375, 2.283203125, 2.68603515625, 3.0888671875, 3.49169921875, 3.89453125, 4.29736328125, 4.7001953125, 5.10302734375, 5.505859375, 5.90869140625, 6.3115234375, 6.71435546875, 7.1171875, 7.52001953125, 7.9228515625, 8.32568359375, 8.728515625, 9.13134765625, 9.5341796875, 9.93701171875, 10.33984375, 10.74267578125, 11.1455078125, 11.54833984375, 11.951171875, 12.35400390625, 12.7568359375, 13.15966796875, 13.5625]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 3.0, 5.0, 7.0, 7.0, 10.0, 26.0, 29.0, 44.0, 78.0, 94.0, 129.0, 216.0, 325.0, 548.0, 874.0, 1424.0, 2581.0, 4848.0, 10508.0, 26031.0, 74542.0, 230190.0, 406172.0, 188300.0, 60611.0, 21694.0, 8999.0, 4364.0, 2317.0, 1352.0, 814.0, 487.0, 306.0, 219.0, 130.0, 86.0, 56.0, 42.0, 32.0, 20.0, 12.0, 10.0, 7.0, 0.0, 5.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.328125, -21.56884765625, -20.8095703125, -20.05029296875, -19.291015625, -18.53173828125, -17.7724609375, -17.01318359375, -16.25390625, -15.49462890625, -14.7353515625, -13.97607421875, -13.216796875, -12.45751953125, -11.6982421875, -10.93896484375, -10.1796875, -9.42041015625, -8.6611328125, -7.90185546875, -7.142578125, -6.38330078125, -5.6240234375, -4.86474609375, -4.10546875, -3.34619140625, -2.5869140625, -1.82763671875, -1.068359375, -0.30908203125, 0.4501953125, 1.20947265625, 1.96875, 2.72802734375, 3.4873046875, 4.24658203125, 5.005859375, 5.76513671875, 6.5244140625, 7.28369140625, 8.04296875, 8.80224609375, 9.5615234375, 10.32080078125, 11.080078125, 11.83935546875, 12.5986328125, 13.35791015625, 14.1171875, 14.87646484375, 15.6357421875, 16.39501953125, 17.154296875, 17.91357421875, 18.6728515625, 19.43212890625, 20.19140625, 20.95068359375, 21.7099609375, 22.46923828125, 23.228515625, 23.98779296875, 24.7470703125, 25.50634765625, 26.265625]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 4.0, 8.0, 10.0, 9.0, 18.0, 10.0, 35.0, 60.0, 95.0, 152.0, 197.0, 151.0, 94.0, 55.0, 35.0, 26.0, 13.0, 5.0, 9.0, 6.0, 2.0, 1.0, 1.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.0019502639770507812, -0.0019032955169677734, -0.0018563270568847656, -0.0018093585968017578, -0.00176239013671875, -0.0017154216766357422, -0.0016684532165527344, -0.0016214847564697266, -0.0015745162963867188, -0.001527547836303711, -0.0014805793762207031, -0.0014336109161376953, -0.0013866424560546875, -0.0013396739959716797, -0.0012927055358886719, -0.001245737075805664, -0.0011987686157226562, -0.0011518001556396484, -0.0011048316955566406, -0.0010578632354736328, -0.001010894775390625, -0.0009639263153076172, -0.0009169578552246094, -0.0008699893951416016, -0.0008230209350585938, -0.0007760524749755859, -0.0007290840148925781, -0.0006821155548095703, -0.0006351470947265625, -0.0005881786346435547, -0.0005412101745605469, -0.0004942417144775391, -0.00044727325439453125, -0.00040030479431152344, -0.0003533363342285156, -0.0003063678741455078, -0.0002593994140625, -0.0002124309539794922, -0.00016546249389648438, -0.00011849403381347656, -7.152557373046875e-05, -2.4557113647460938e-05, 2.2411346435546875e-05, 6.937980651855469e-05, 0.0001163482666015625, 0.0001633167266845703, 0.00021028518676757812, 0.00025725364685058594, 0.00030422210693359375, 0.00035119056701660156, 0.0003981590270996094, 0.0004451274871826172, 0.000492095947265625, 0.0005390644073486328, 0.0005860328674316406, 0.0006330013275146484, 0.0006799697875976562, 0.0007269382476806641, 0.0007739067077636719, 0.0008208751678466797, 0.0008678436279296875, 0.0009148120880126953, 0.0009617805480957031, 0.001008749008178711, 0.0010557174682617188]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 6.0, 5.0, 17.0, 20.0, 15.0, 24.0, 37.0, 55.0, 73.0, 105.0, 158.0, 221.0, 364.0, 545.0, 912.0, 1582.0, 2726.0, 5387.0, 11107.0, 24235.0, 57666.0, 137907.0, 272147.0, 278461.0, 144887.0, 60480.0, 25212.0, 11429.0, 5636.0, 2927.0, 1569.0, 973.0, 576.0, 337.0, 234.0, 149.0, 112.0, 69.0, 48.0, 38.0, 29.0, 18.0, 20.0, 11.0, 9.0, 9.0, 3.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-18.6875, -18.085205078125, -17.48291015625, -16.880615234375, -16.2783203125, -15.676025390625, -15.07373046875, -14.471435546875, -13.869140625, -13.266845703125, -12.66455078125, -12.062255859375, -11.4599609375, -10.857666015625, -10.25537109375, -9.653076171875, -9.05078125, -8.448486328125, -7.84619140625, -7.243896484375, -6.6416015625, -6.039306640625, -5.43701171875, -4.834716796875, -4.232421875, -3.630126953125, -3.02783203125, -2.425537109375, -1.8232421875, -1.220947265625, -0.61865234375, -0.016357421875, 0.5859375, 1.188232421875, 1.79052734375, 2.392822265625, 2.9951171875, 3.597412109375, 4.19970703125, 4.802001953125, 5.404296875, 6.006591796875, 6.60888671875, 7.211181640625, 7.8134765625, 8.415771484375, 9.01806640625, 9.620361328125, 10.22265625, 10.824951171875, 11.42724609375, 12.029541015625, 12.6318359375, 13.234130859375, 13.83642578125, 14.438720703125, 15.041015625, 15.643310546875, 16.24560546875, 16.847900390625, 17.4501953125, 18.052490234375, 18.65478515625, 19.257080078125, 19.859375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 4.0, 2.0, 5.0, 5.0, 3.0, 5.0, 7.0, 14.0, 12.0, 15.0, 26.0, 25.0, 19.0, 44.0, 39.0, 51.0, 65.0, 72.0, 66.0, 89.0, 72.0, 75.0, 54.0, 48.0, 35.0, 31.0, 27.0, 15.0, 23.0, 21.0, 6.0, 5.0, 9.0, 8.0, 3.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0], "bins": [-7.67578125, -7.48822021484375, -7.3006591796875, -7.11309814453125, -6.925537109375, -6.73797607421875, -6.5504150390625, -6.36285400390625, -6.17529296875, -5.98773193359375, -5.8001708984375, -5.61260986328125, -5.425048828125, -5.23748779296875, -5.0499267578125, -4.86236572265625, -4.6748046875, -4.48724365234375, -4.2996826171875, -4.11212158203125, -3.924560546875, -3.73699951171875, -3.5494384765625, -3.36187744140625, -3.17431640625, -2.98675537109375, -2.7991943359375, -2.61163330078125, -2.424072265625, -2.23651123046875, -2.0489501953125, -1.86138916015625, -1.673828125, -1.48626708984375, -1.2987060546875, -1.11114501953125, -0.923583984375, -0.73602294921875, -0.5484619140625, -0.36090087890625, -0.17333984375, 0.01422119140625, 0.2017822265625, 0.38934326171875, 0.576904296875, 0.76446533203125, 0.9520263671875, 1.13958740234375, 1.3271484375, 1.51470947265625, 1.7022705078125, 1.88983154296875, 2.077392578125, 2.26495361328125, 2.4525146484375, 2.64007568359375, 2.82763671875, 3.01519775390625, 3.2027587890625, 3.39031982421875, 3.577880859375, 3.76544189453125, 3.9530029296875, 4.14056396484375, 4.328125]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 6.0, 5.0, 8.0, 10.0, 7.0, 15.0, 9.0, 24.0, 27.0, 24.0, 39.0, 34.0, 45.0, 44.0, 51.0, 57.0, 50.0, 51.0, 58.0, 58.0, 52.0, 46.0, 50.0, 35.0, 45.0, 26.0, 29.0, 24.0, 16.0, 9.0, 6.0, 10.0, 8.0, 7.0, 6.0, 1.0, 6.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-23.43088722229004, -22.71494483947754, -21.999004364013672, -21.283061981201172, -20.567121505737305, -19.851179122924805, -19.135238647460938, -18.419296264648438, -17.70335578918457, -16.98741340637207, -16.271472930908203, -15.55553150177002, -14.839590072631836, -14.123648643493652, -13.407707214355469, -12.691764831542969, -11.975823402404785, -11.259881973266602, -10.543940544128418, -9.827999114990234, -9.11205768585205, -8.396116256713867, -7.680174350738525, -6.964232921600342, -6.248291492462158, -5.532350063323975, -4.816408634185791, -4.100466728210449, -3.3845255374908447, -2.668584108352661, -1.9526424407958984, -1.2367010116577148, -0.5207595825195312, 0.19518190622329712, 0.9111233949661255, 1.6270649433135986, 2.3430063724517822, 3.058947801589966, 3.7748894691467285, 4.490830898284912, 5.206772327423096, 5.922713756561279, 6.638655185699463, 7.354597091674805, 8.070538520812988, 8.786479949951172, 9.502421379089355, 10.218362808227539, 10.934304237365723, 11.650245666503906, 12.36618709564209, 13.082128524780273, 13.798069953918457, 14.51401138305664, 15.22995376586914, 15.945894241333008, 16.661836624145508, 17.377779006958008, 18.093719482421875, 18.809661865234375, 19.525602340698242, 20.241544723510742, 20.95748519897461, 21.67342758178711, 22.389368057250977]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 7.0, 3.0, 5.0, 7.0, 4.0, 12.0, 5.0, 5.0, 13.0, 15.0, 15.0, 16.0, 26.0, 24.0, 20.0, 32.0, 29.0, 25.0, 26.0, 49.0, 43.0, 30.0, 37.0, 36.0, 51.0, 44.0, 42.0, 27.0, 39.0, 37.0, 40.0, 33.0, 28.0, 28.0, 23.0, 21.0, 22.0, 21.0, 8.0, 10.0, 7.0, 10.0, 10.0, 9.0, 2.0, 5.0, 6.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-19.371305465698242, -18.817907333374023, -18.264507293701172, -17.711109161376953, -17.1577091217041, -16.604310989379883, -16.05091094970703, -15.497512817382812, -14.944112777709961, -14.390713691711426, -13.83731460571289, -13.283915519714355, -12.73051643371582, -12.177117347717285, -11.62371826171875, -11.070320129394531, -10.516921043395996, -9.963521957397461, -9.410122871398926, -8.85672378540039, -8.303324699401855, -7.74992561340332, -7.196527004241943, -6.643127918243408, -6.089728832244873, -5.536329746246338, -4.982930660247803, -4.429532051086426, -3.8761327266693115, -3.3227336406707764, -2.7693347930908203, -2.215935707092285, -1.66253662109375, -1.1091375350952148, -0.5557385683059692, -0.002339601516723633, 0.5510594844818115, 1.1044585704803467, 1.6578574180603027, 2.211256504058838, 2.764655590057373, 3.318054676055908, 3.8714537620544434, 4.42485237121582, 4.9782514572143555, 5.531650543212891, 6.085049629211426, 6.638448715209961, 7.191847801208496, 7.745246887207031, 8.298645973205566, 8.852045059204102, 9.405444145202637, 9.958843231201172, 10.51224136352539, 11.065641403198242, 11.619039535522461, 12.172438621520996, 12.725837707519531, 13.279236793518066, 13.832635879516602, 14.386034965515137, 14.939434051513672, 15.49283218383789, 16.046232223510742]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 3.0, 6.0, 5.0, 13.0, 22.0, 20.0, 24.0, 55.0, 91.0, 108.0, 163.0, 239.0, 392.0, 536.0, 871.0, 1199.0, 1992.0, 3078.0, 4764.0, 7691.0, 12430.0, 20252.0, 32555.0, 51858.0, 79459.0, 113276.0, 142226.0, 151995.0, 134326.0, 101578.0, 69374.0, 44067.0, 27537.0, 17337.0, 10589.0, 6527.0, 4101.0, 2662.0, 1728.0, 1134.0, 753.0, 517.0, 324.0, 209.0, 157.0, 102.0, 75.0, 39.0, 34.0, 21.0, 15.0, 13.0, 7.0, 4.0, 6.0, 3.0, 2.0], "bins": [-22.3125, -21.66259765625, -21.0126953125, -20.36279296875, -19.712890625, -19.06298828125, -18.4130859375, -17.76318359375, -17.11328125, -16.46337890625, -15.8134765625, -15.16357421875, -14.513671875, -13.86376953125, -13.2138671875, -12.56396484375, -11.9140625, -11.26416015625, -10.6142578125, -9.96435546875, -9.314453125, -8.66455078125, -8.0146484375, -7.36474609375, -6.71484375, -6.06494140625, -5.4150390625, -4.76513671875, -4.115234375, -3.46533203125, -2.8154296875, -2.16552734375, -1.515625, -0.86572265625, -0.2158203125, 0.43408203125, 1.083984375, 1.73388671875, 2.3837890625, 3.03369140625, 3.68359375, 4.33349609375, 4.9833984375, 5.63330078125, 6.283203125, 6.93310546875, 7.5830078125, 8.23291015625, 8.8828125, 9.53271484375, 10.1826171875, 10.83251953125, 11.482421875, 12.13232421875, 12.7822265625, 13.43212890625, 14.08203125, 14.73193359375, 15.3818359375, 16.03173828125, 16.681640625, 17.33154296875, 17.9814453125, 18.63134765625, 19.28125]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 3.0, 3.0, 4.0, 6.0, 5.0, 10.0, 7.0, 11.0, 6.0, 22.0, 15.0, 20.0, 22.0, 30.0, 28.0, 35.0, 29.0, 37.0, 36.0, 32.0, 42.0, 43.0, 44.0, 50.0, 44.0, 38.0, 34.0, 36.0, 40.0, 34.0, 28.0, 37.0, 35.0, 25.0, 21.0, 18.0, 14.0, 10.0, 9.0, 7.0, 12.0, 6.0, 5.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-19.296875, -18.72998046875, -18.1630859375, -17.59619140625, -17.029296875, -16.46240234375, -15.8955078125, -15.32861328125, -14.76171875, -14.19482421875, -13.6279296875, -13.06103515625, -12.494140625, -11.92724609375, -11.3603515625, -10.79345703125, -10.2265625, -9.65966796875, -9.0927734375, -8.52587890625, -7.958984375, -7.39208984375, -6.8251953125, -6.25830078125, -5.69140625, -5.12451171875, -4.5576171875, -3.99072265625, -3.423828125, -2.85693359375, -2.2900390625, -1.72314453125, -1.15625, -0.58935546875, -0.0224609375, 0.54443359375, 1.111328125, 1.67822265625, 2.2451171875, 2.81201171875, 3.37890625, 3.94580078125, 4.5126953125, 5.07958984375, 5.646484375, 6.21337890625, 6.7802734375, 7.34716796875, 7.9140625, 8.48095703125, 9.0478515625, 9.61474609375, 10.181640625, 10.74853515625, 11.3154296875, 11.88232421875, 12.44921875, 13.01611328125, 13.5830078125, 14.14990234375, 14.716796875, 15.28369140625, 15.8505859375, 16.41748046875, 16.984375]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 5.0, 18.0, 20.0, 37.0, 44.0, 89.0, 125.0, 188.0, 297.0, 464.0, 708.0, 1071.0, 1794.0, 2775.0, 4323.0, 7121.0, 11504.0, 18740.0, 29842.0, 46802.0, 70966.0, 100054.0, 129089.0, 143513.0, 137036.0, 111554.0, 81073.0, 54941.0, 35472.0, 22271.0, 13847.0, 8551.0, 5238.0, 3340.0, 1993.0, 1341.0, 796.0, 564.0, 331.0, 225.0, 143.0, 98.0, 65.0, 38.0, 21.0, 16.0, 8.0, 5.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-18.421875, -17.875, -17.328125, -16.78125, -16.234375, -15.6875, -15.140625, -14.59375, -14.046875, -13.5, -12.953125, -12.40625, -11.859375, -11.3125, -10.765625, -10.21875, -9.671875, -9.125, -8.578125, -8.03125, -7.484375, -6.9375, -6.390625, -5.84375, -5.296875, -4.75, -4.203125, -3.65625, -3.109375, -2.5625, -2.015625, -1.46875, -0.921875, -0.375, 0.171875, 0.71875, 1.265625, 1.8125, 2.359375, 2.90625, 3.453125, 4.0, 4.546875, 5.09375, 5.640625, 6.1875, 6.734375, 7.28125, 7.828125, 8.375, 8.921875, 9.46875, 10.015625, 10.5625, 11.109375, 11.65625, 12.203125, 12.75, 13.296875, 13.84375, 14.390625, 14.9375, 15.484375, 16.03125, 16.578125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 7.0, 6.0, 3.0, 2.0, 2.0, 7.0, 5.0, 16.0, 15.0, 22.0, 18.0, 20.0, 25.0, 18.0, 30.0, 32.0, 41.0, 33.0, 35.0, 42.0, 50.0, 47.0, 43.0, 53.0, 41.0, 48.0, 49.0, 34.0, 32.0, 34.0, 36.0, 26.0, 28.0, 15.0, 14.0, 16.0, 9.0, 8.0, 10.0, 10.0, 3.0, 4.0, 6.0, 6.0, 5.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-14.0390625, -13.6446533203125, -13.250244140625, -12.8558349609375, -12.46142578125, -12.0670166015625, -11.672607421875, -11.2781982421875, -10.8837890625, -10.4893798828125, -10.094970703125, -9.7005615234375, -9.30615234375, -8.9117431640625, -8.517333984375, -8.1229248046875, -7.728515625, -7.3341064453125, -6.939697265625, -6.5452880859375, -6.15087890625, -5.7564697265625, -5.362060546875, -4.9676513671875, -4.5732421875, -4.1788330078125, -3.784423828125, -3.3900146484375, -2.99560546875, -2.6011962890625, -2.206787109375, -1.8123779296875, -1.41796875, -1.0235595703125, -0.629150390625, -0.2347412109375, 0.15966796875, 0.5540771484375, 0.948486328125, 1.3428955078125, 1.7373046875, 2.1317138671875, 2.526123046875, 2.9205322265625, 3.31494140625, 3.7093505859375, 4.103759765625, 4.4981689453125, 4.892578125, 5.2869873046875, 5.681396484375, 6.0758056640625, 6.47021484375, 6.8646240234375, 7.259033203125, 7.6534423828125, 8.0478515625, 8.4422607421875, 8.836669921875, 9.2310791015625, 9.62548828125, 10.0198974609375, 10.414306640625, 10.8087158203125, 11.203125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 5.0, 16.0, 13.0, 27.0, 22.0, 44.0, 55.0, 66.0, 114.0, 161.0, 179.0, 263.0, 393.0, 539.0, 779.0, 1260.0, 2041.0, 3560.0, 7057.0, 15165.0, 39236.0, 118556.0, 330497.0, 335087.0, 121123.0, 39893.0, 15702.0, 7091.0, 3540.0, 2053.0, 1238.0, 797.0, 574.0, 406.0, 296.0, 222.0, 153.0, 102.0, 72.0, 51.0, 35.0, 21.0, 14.0, 15.0, 11.0, 3.0, 3.0, 4.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-50.5, -49.01513671875, -47.5302734375, -46.04541015625, -44.560546875, -43.07568359375, -41.5908203125, -40.10595703125, -38.62109375, -37.13623046875, -35.6513671875, -34.16650390625, -32.681640625, -31.19677734375, -29.7119140625, -28.22705078125, -26.7421875, -25.25732421875, -23.7724609375, -22.28759765625, -20.802734375, -19.31787109375, -17.8330078125, -16.34814453125, -14.86328125, -13.37841796875, -11.8935546875, -10.40869140625, -8.923828125, -7.43896484375, -5.9541015625, -4.46923828125, -2.984375, -1.49951171875, -0.0146484375, 1.47021484375, 2.955078125, 4.43994140625, 5.9248046875, 7.40966796875, 8.89453125, 10.37939453125, 11.8642578125, 13.34912109375, 14.833984375, 16.31884765625, 17.8037109375, 19.28857421875, 20.7734375, 22.25830078125, 23.7431640625, 25.22802734375, 26.712890625, 28.19775390625, 29.6826171875, 31.16748046875, 32.65234375, 34.13720703125, 35.6220703125, 37.10693359375, 38.591796875, 40.07666015625, 41.5615234375, 43.04638671875, 44.53125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 4.0, 3.0, 1.0, 3.0, 8.0, 8.0, 13.0, 14.0, 15.0, 26.0, 37.0, 37.0, 50.0, 55.0, 71.0, 75.0, 93.0, 82.0, 96.0, 73.0, 59.0, 43.0, 35.0, 24.0, 20.0, 16.0, 15.0, 8.0, 7.0, 4.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0031261444091796875, -0.0030343830585479736, -0.0029426217079162598, -0.002850860357284546, -0.002759099006652832, -0.002667337656021118, -0.0025755763053894043, -0.0024838149547576904, -0.0023920536041259766, -0.0023002922534942627, -0.002208530902862549, -0.002116769552230835, -0.002025008201599121, -0.0019332468509674072, -0.0018414855003356934, -0.0017497241497039795, -0.0016579627990722656, -0.0015662014484405518, -0.0014744400978088379, -0.001382678747177124, -0.0012909173965454102, -0.0011991560459136963, -0.0011073946952819824, -0.0010156333446502686, -0.0009238719940185547, -0.0008321106433868408, -0.000740349292755127, -0.0006485879421234131, -0.0005568265914916992, -0.00046506524085998535, -0.0003733038902282715, -0.0002815425395965576, -0.00018978118896484375, -9.801983833312988e-05, -6.258487701416016e-06, 8.550286293029785e-05, 0.00017726421356201172, 0.0002690255641937256, 0.00036078691482543945, 0.0004525482654571533, 0.0005443096160888672, 0.0006360709667205811, 0.0007278323173522949, 0.0008195936679840088, 0.0009113550186157227, 0.0010031163692474365, 0.0010948777198791504, 0.0011866390705108643, 0.0012784004211425781, 0.001370161771774292, 0.0014619231224060059, 0.0015536844730377197, 0.0016454458236694336, 0.0017372071743011475, 0.0018289685249328613, 0.0019207298755645752, 0.002012491226196289, 0.002104252576828003, 0.002196013927459717, 0.0022877752780914307, 0.0023795366287231445, 0.0024712979793548584, 0.0025630593299865723, 0.002654820680618286, 0.00274658203125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 5.0, 6.0, 8.0, 12.0, 10.0, 14.0, 44.0, 45.0, 82.0, 105.0, 131.0, 208.0, 266.0, 434.0, 707.0, 1204.0, 2135.0, 3877.0, 7380.0, 15263.0, 35221.0, 87300.0, 217066.0, 325483.0, 205184.0, 82583.0, 32943.0, 14702.0, 7202.0, 3678.0, 1992.0, 1181.0, 715.0, 469.0, 305.0, 191.0, 128.0, 87.0, 61.0, 41.0, 28.0, 21.0, 21.0, 7.0, 7.0, 5.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-39.15625, -38.05224609375, -36.9482421875, -35.84423828125, -34.740234375, -33.63623046875, -32.5322265625, -31.42822265625, -30.32421875, -29.22021484375, -28.1162109375, -27.01220703125, -25.908203125, -24.80419921875, -23.7001953125, -22.59619140625, -21.4921875, -20.38818359375, -19.2841796875, -18.18017578125, -17.076171875, -15.97216796875, -14.8681640625, -13.76416015625, -12.66015625, -11.55615234375, -10.4521484375, -9.34814453125, -8.244140625, -7.14013671875, -6.0361328125, -4.93212890625, -3.828125, -2.72412109375, -1.6201171875, -0.51611328125, 0.587890625, 1.69189453125, 2.7958984375, 3.89990234375, 5.00390625, 6.10791015625, 7.2119140625, 8.31591796875, 9.419921875, 10.52392578125, 11.6279296875, 12.73193359375, 13.8359375, 14.93994140625, 16.0439453125, 17.14794921875, 18.251953125, 19.35595703125, 20.4599609375, 21.56396484375, 22.66796875, 23.77197265625, 24.8759765625, 25.97998046875, 27.083984375, 28.18798828125, 29.2919921875, 30.39599609375, 31.5]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 0.0, 5.0, 4.0, 12.0, 7.0, 11.0, 18.0, 17.0, 24.0, 33.0, 54.0, 47.0, 62.0, 90.0, 96.0, 92.0, 97.0, 79.0, 65.0, 35.0, 37.0, 24.0, 11.0, 14.0, 19.0, 9.0, 10.0, 5.0, 7.0, 4.0, 3.0, 2.0, 6.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.234375, -8.8935546875, -8.552734375, -8.2119140625, -7.87109375, -7.5302734375, -7.189453125, -6.8486328125, -6.5078125, -6.1669921875, -5.826171875, -5.4853515625, -5.14453125, -4.8037109375, -4.462890625, -4.1220703125, -3.78125, -3.4404296875, -3.099609375, -2.7587890625, -2.41796875, -2.0771484375, -1.736328125, -1.3955078125, -1.0546875, -0.7138671875, -0.373046875, -0.0322265625, 0.30859375, 0.6494140625, 0.990234375, 1.3310546875, 1.671875, 2.0126953125, 2.353515625, 2.6943359375, 3.03515625, 3.3759765625, 3.716796875, 4.0576171875, 4.3984375, 4.7392578125, 5.080078125, 5.4208984375, 5.76171875, 6.1025390625, 6.443359375, 6.7841796875, 7.125, 7.4658203125, 7.806640625, 8.1474609375, 8.48828125, 8.8291015625, 9.169921875, 9.5107421875, 9.8515625, 10.1923828125, 10.533203125, 10.8740234375, 11.21484375, 11.5556640625, 11.896484375, 12.2373046875, 12.578125]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 5.0, 4.0, 2.0, 6.0, 6.0, 7.0, 9.0, 14.0, 17.0, 21.0, 38.0, 30.0, 31.0, 40.0, 43.0, 59.0, 53.0, 60.0, 54.0, 65.0, 67.0, 50.0, 52.0, 48.0, 36.0, 41.0, 25.0, 23.0, 23.0, 13.0, 12.0, 7.0, 9.0, 12.0, 3.0, 4.0, 5.0, 5.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-28.140806198120117, -27.35431671142578, -26.567829132080078, -25.781339645385742, -24.994850158691406, -24.208362579345703, -23.421873092651367, -22.63538360595703, -21.848896026611328, -21.062406539916992, -20.27591896057129, -19.489429473876953, -18.702939987182617, -17.91645050048828, -17.129962921142578, -16.343473434448242, -15.556983947753906, -14.770495414733887, -13.98400592803955, -13.197517395019531, -12.411027908325195, -11.624539375305176, -10.838050842285156, -10.05156135559082, -9.2650728225708, -8.478584289550781, -7.692094802856445, -6.905606269836426, -6.119117259979248, -5.33262825012207, -4.546139717102051, -3.759650707244873, -2.9731616973876953, -2.1866726875305176, -1.400183916091919, -0.6136951446533203, 0.17279386520385742, 0.9592828750610352, 1.7457714080810547, 2.5322604179382324, 3.31874942779541, 4.105238437652588, 4.891727447509766, 5.678215980529785, 6.464704990386963, 7.251194000244141, 8.03768253326416, 8.82417106628418, 9.610660552978516, 10.397149085998535, 11.183638572692871, 11.97012710571289, 12.756616592407227, 13.543105125427246, 14.329593658447266, 15.116083145141602, 15.902571678161621, 16.68906021118164, 17.475549697875977, 18.262039184570312, 19.048526763916016, 19.83501625061035, 20.621505737304688, 21.40799331665039, 22.194482803344727]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 4.0, 1.0, 3.0, 2.0, 2.0, 7.0, 7.0, 11.0, 12.0, 9.0, 9.0, 7.0, 9.0, 14.0, 16.0, 27.0, 28.0, 19.0, 23.0, 25.0, 37.0, 36.0, 33.0, 38.0, 33.0, 43.0, 25.0, 36.0, 44.0, 34.0, 32.0, 35.0, 43.0, 38.0, 33.0, 39.0, 26.0, 30.0, 16.0, 14.0, 13.0, 11.0, 17.0, 13.0, 14.0, 8.0, 9.0, 7.0, 2.0, 4.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 3.0], "bins": [-17.88873863220215, -17.347524642944336, -16.806310653686523, -16.26509666442871, -15.723883628845215, -15.182669639587402, -14.641456604003906, -14.100242614746094, -13.559028625488281, -13.017814636230469, -12.476600646972656, -11.93538761138916, -11.394173622131348, -10.852959632873535, -10.311746597290039, -9.770532608032227, -9.229318618774414, -8.688104629516602, -8.146890640258789, -7.605677604675293, -7.0644636154174805, -6.523249626159668, -5.982036113739014, -5.440822601318359, -4.899608612060547, -4.358394622802734, -3.81718111038208, -3.2759673595428467, -2.7347536087036133, -2.19353985786438, -1.6523261070251465, -1.111112356185913, -0.5698986053466797, -0.02868485450744629, 0.5125288963317871, 1.0537426471710205, 1.594956398010254, 2.1361701488494873, 2.6773838996887207, 3.218597650527954, 3.7598114013671875, 4.301025390625, 4.842238903045654, 5.383452415466309, 5.924666404724121, 6.465880393981934, 7.007093906402588, 7.548307418823242, 8.089521408081055, 8.630735397338867, 9.17194938659668, 9.713162422180176, 10.254376411437988, 10.7955904006958, 11.336803436279297, 11.87801742553711, 12.419231414794922, 12.960445404052734, 13.501659393310547, 14.042872428894043, 14.584086418151855, 15.125300407409668, 15.666513442993164, 16.207727432250977, 16.74894142150879]}, "gradients/decoder.bert.encoder.layer.18.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 4.0, 5.0, 11.0, 12.0, 13.0, 28.0, 30.0, 49.0, 88.0, 134.0, 207.0, 337.0, 481.0, 781.0, 1307.0, 2041.0, 3338.0, 5745.0, 9923.0, 17774.0, 32259.0, 61150.0, 120446.0, 237248.0, 461688.0, 778696.0, 922268.0, 708580.0, 400891.0, 205318.0, 103009.0, 53792.0, 28901.0, 15898.0, 8939.0, 5043.0, 3017.0, 1828.0, 1067.0, 670.0, 425.0, 278.0, 202.0, 147.0, 66.0, 52.0, 37.0, 24.0, 15.0, 13.0, 1.0, 6.0, 4.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-18.03125, -17.417724609375, -16.80419921875, -16.190673828125, -15.5771484375, -14.963623046875, -14.35009765625, -13.736572265625, -13.123046875, -12.509521484375, -11.89599609375, -11.282470703125, -10.6689453125, -10.055419921875, -9.44189453125, -8.828369140625, -8.21484375, -7.601318359375, -6.98779296875, -6.374267578125, -5.7607421875, -5.147216796875, -4.53369140625, -3.920166015625, -3.306640625, -2.693115234375, -2.07958984375, -1.466064453125, -0.8525390625, -0.239013671875, 0.37451171875, 0.988037109375, 1.6015625, 2.215087890625, 2.82861328125, 3.442138671875, 4.0556640625, 4.669189453125, 5.28271484375, 5.896240234375, 6.509765625, 7.123291015625, 7.73681640625, 8.350341796875, 8.9638671875, 9.577392578125, 10.19091796875, 10.804443359375, 11.41796875, 12.031494140625, 12.64501953125, 13.258544921875, 13.8720703125, 14.485595703125, 15.09912109375, 15.712646484375, 16.326171875, 16.939697265625, 17.55322265625, 18.166748046875, 18.7802734375, 19.393798828125, 20.00732421875, 20.620849609375, 21.234375]}, "gradients/decoder.bert.encoder.layer.18.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 3.0, 8.0, 9.0, 9.0, 13.0, 6.0, 14.0, 13.0, 9.0, 16.0, 13.0, 19.0, 25.0, 21.0, 26.0, 32.0, 32.0, 47.0, 33.0, 30.0, 40.0, 41.0, 27.0, 46.0, 40.0, 34.0, 33.0, 35.0, 36.0, 44.0, 30.0, 14.0, 27.0, 30.0, 20.0, 25.0, 17.0, 6.0, 14.0, 14.0, 10.0, 7.0, 10.0, 8.0, 3.0, 4.0, 0.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-11.75, -11.391357421875, -11.03271484375, -10.674072265625, -10.3154296875, -9.956787109375, -9.59814453125, -9.239501953125, -8.880859375, -8.522216796875, -8.16357421875, -7.804931640625, -7.4462890625, -7.087646484375, -6.72900390625, -6.370361328125, -6.01171875, -5.653076171875, -5.29443359375, -4.935791015625, -4.5771484375, -4.218505859375, -3.85986328125, -3.501220703125, -3.142578125, -2.783935546875, -2.42529296875, -2.066650390625, -1.7080078125, -1.349365234375, -0.99072265625, -0.632080078125, -0.2734375, 0.085205078125, 0.44384765625, 0.802490234375, 1.1611328125, 1.519775390625, 1.87841796875, 2.237060546875, 2.595703125, 2.954345703125, 3.31298828125, 3.671630859375, 4.0302734375, 4.388916015625, 4.74755859375, 5.106201171875, 5.46484375, 5.823486328125, 6.18212890625, 6.540771484375, 6.8994140625, 7.258056640625, 7.61669921875, 7.975341796875, 8.333984375, 8.692626953125, 9.05126953125, 9.409912109375, 9.7685546875, 10.127197265625, 10.48583984375, 10.844482421875, 11.203125]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 3.0, 7.0, 11.0, 20.0, 25.0, 37.0, 63.0, 135.0, 166.0, 265.0, 463.0, 722.0, 1179.0, 1877.0, 3234.0, 5589.0, 9641.0, 17025.0, 30606.0, 56424.0, 106153.0, 197099.0, 354976.0, 585417.0, 790944.0, 768473.0, 545968.0, 326754.0, 178547.0, 95832.0, 51556.0, 27821.0, 15569.0, 8686.0, 5110.0, 3050.0, 1849.0, 1081.0, 674.0, 422.0, 290.0, 198.0, 113.0, 69.0, 50.0, 40.0, 17.0, 18.0, 7.0, 11.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-17.484375, -16.9189453125, -16.353515625, -15.7880859375, -15.22265625, -14.6572265625, -14.091796875, -13.5263671875, -12.9609375, -12.3955078125, -11.830078125, -11.2646484375, -10.69921875, -10.1337890625, -9.568359375, -9.0029296875, -8.4375, -7.8720703125, -7.306640625, -6.7412109375, -6.17578125, -5.6103515625, -5.044921875, -4.4794921875, -3.9140625, -3.3486328125, -2.783203125, -2.2177734375, -1.65234375, -1.0869140625, -0.521484375, 0.0439453125, 0.609375, 1.1748046875, 1.740234375, 2.3056640625, 2.87109375, 3.4365234375, 4.001953125, 4.5673828125, 5.1328125, 5.6982421875, 6.263671875, 6.8291015625, 7.39453125, 7.9599609375, 8.525390625, 9.0908203125, 9.65625, 10.2216796875, 10.787109375, 11.3525390625, 11.91796875, 12.4833984375, 13.048828125, 13.6142578125, 14.1796875, 14.7451171875, 15.310546875, 15.8759765625, 16.44140625, 17.0068359375, 17.572265625, 18.1376953125, 18.703125]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.bias": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 6.0, 6.0, 8.0, 8.0, 8.0, 18.0, 28.0, 24.0, 35.0, 45.0, 47.0, 59.0, 71.0, 100.0, 85.0, 117.0, 125.0, 134.0, 157.0, 167.0, 168.0, 196.0, 223.0, 203.0, 212.0, 207.0, 177.0, 162.0, 153.0, 144.0, 140.0, 120.0, 123.0, 110.0, 79.0, 66.0, 61.0, 50.0, 40.0, 41.0, 26.0, 22.0, 26.0, 16.0, 13.0, 11.0, 12.0, 5.0, 3.0, 5.0, 2.0, 3.0, 1.0, 7.0, 0.0, 3.0], "bins": [-5.1875, -5.02508544921875, -4.8626708984375, -4.70025634765625, -4.537841796875, -4.37542724609375, -4.2130126953125, -4.05059814453125, -3.88818359375, -3.72576904296875, -3.5633544921875, -3.40093994140625, -3.238525390625, -3.07611083984375, -2.9136962890625, -2.75128173828125, -2.5888671875, -2.42645263671875, -2.2640380859375, -2.10162353515625, -1.939208984375, -1.77679443359375, -1.6143798828125, -1.45196533203125, -1.28955078125, -1.12713623046875, -0.9647216796875, -0.80230712890625, -0.639892578125, -0.47747802734375, -0.3150634765625, -0.15264892578125, 0.009765625, 0.17218017578125, 0.3345947265625, 0.49700927734375, 0.659423828125, 0.82183837890625, 0.9842529296875, 1.14666748046875, 1.30908203125, 1.47149658203125, 1.6339111328125, 1.79632568359375, 1.958740234375, 2.12115478515625, 2.2835693359375, 2.44598388671875, 2.6083984375, 2.77081298828125, 2.9332275390625, 3.09564208984375, 3.258056640625, 3.42047119140625, 3.5828857421875, 3.74530029296875, 3.90771484375, 4.07012939453125, 4.2325439453125, 4.39495849609375, 4.557373046875, 4.71978759765625, 4.8822021484375, 5.04461669921875, 5.20703125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 0.0, 6.0, 7.0, 4.0, 6.0, 7.0, 4.0, 17.0, 9.0, 18.0, 22.0, 26.0, 30.0, 36.0, 42.0, 46.0, 47.0, 41.0, 56.0, 59.0, 44.0, 49.0, 58.0, 55.0, 50.0, 44.0, 37.0, 33.0, 27.0, 25.0, 26.0, 18.0, 4.0, 10.0, 10.0, 4.0, 4.0, 7.0, 5.0, 4.0, 3.0, 6.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.74671173095703, -21.143985748291016, -20.541259765625, -19.93853187561035, -19.335805892944336, -18.73307991027832, -18.130353927612305, -17.527626037597656, -16.92490005493164, -16.322174072265625, -15.719447135925293, -15.116721153259277, -14.513994216918945, -13.91126823425293, -13.308542251586914, -12.705815315246582, -12.103089332580566, -11.50036334991455, -10.897636413574219, -10.294910430908203, -9.692183494567871, -9.089457511901855, -8.486730575561523, -7.884004592895508, -7.281278133392334, -6.67855167388916, -6.075825214385986, -5.4730987548828125, -4.870372772216797, -4.267645835876465, -3.664919853210449, -3.0621933937072754, -2.4594669342041016, -1.8567404747009277, -1.2540141344070435, -0.6512877941131592, -0.04856133460998535, 0.5541651248931885, 1.1568913459777832, 1.759617805480957, 2.362344264984131, 2.9650707244873047, 3.5677971839904785, 4.170523643493652, 4.773249626159668, 5.3759765625, 5.978702545166016, 6.5814290046691895, 7.184155464172363, 7.786881923675537, 8.389608383178711, 8.992334365844727, 9.595061302185059, 10.197787284851074, 10.800514221191406, 11.403240203857422, 12.005966186523438, 12.608692169189453, 13.211419105529785, 13.8141450881958, 14.416872024536133, 15.019598007202148, 15.622323989868164, 16.225051879882812, 16.827777862548828]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 4.0, 3.0, 3.0, 5.0, 10.0, 12.0, 18.0, 18.0, 12.0, 17.0, 16.0, 30.0, 22.0, 25.0, 32.0, 31.0, 39.0, 46.0, 48.0, 36.0, 47.0, 42.0, 51.0, 42.0, 25.0, 28.0, 49.0, 34.0, 35.0, 29.0, 21.0, 26.0, 25.0, 25.0, 20.0, 13.0, 11.0, 13.0, 9.0, 5.0, 6.0, 4.0, 4.0, 4.0, 2.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-15.483270645141602, -15.011285781860352, -14.539301872253418, -14.067317008972168, -13.595333099365234, -13.123348236083984, -12.651363372802734, -12.179378509521484, -11.70739459991455, -11.2354097366333, -10.763425827026367, -10.291440963745117, -9.819456100463867, -9.347472190856934, -8.875487327575684, -8.40350341796875, -7.9315185546875, -7.459534168243408, -6.987549781799316, -6.515564918518066, -6.043580532073975, -5.571596145629883, -5.099611282348633, -4.627626895904541, -4.155642509460449, -3.6836581230163574, -3.2116734981536865, -2.7396888732910156, -2.267704486846924, -1.795720100402832, -1.3237354755401611, -0.8517508506774902, -0.37976551055908203, 0.09221899509429932, 0.5642035007476807, 1.036188006401062, 1.5081725120544434, 1.9801568984985352, 2.452141523361206, 2.924126148223877, 3.3961105346679688, 3.8680949211120605, 4.340079307556152, 4.812064170837402, 5.284048557281494, 5.756032943725586, 6.228017807006836, 6.700002193450928, 7.1719865798950195, 7.643970966339111, 8.115955352783203, 8.587940216064453, 9.059925079345703, 9.531908988952637, 10.003893852233887, 10.47587776184082, 10.94786262512207, 11.41984748840332, 11.891831398010254, 12.363816261291504, 12.835800170898438, 13.307785034179688, 13.779769897460938, 14.251754760742188, 14.723738670349121]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 8.0, 9.0, 7.0, 6.0, 10.0, 14.0, 26.0, 45.0, 87.0, 141.0, 179.0, 270.0, 405.0, 642.0, 911.0, 1405.0, 2258.0, 3584.0, 5897.0, 10464.0, 19741.0, 40563.0, 89179.0, 188625.0, 276045.0, 208964.0, 102323.0, 45847.0, 22147.0, 11554.0, 6412.0, 3930.0, 2472.0, 1579.0, 953.0, 634.0, 416.0, 287.0, 159.0, 136.0, 90.0, 45.0, 36.0, 25.0, 16.0, 10.0, 5.0, 6.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.90625, -19.1845703125, -18.462890625, -17.7412109375, -17.01953125, -16.2978515625, -15.576171875, -14.8544921875, -14.1328125, -13.4111328125, -12.689453125, -11.9677734375, -11.24609375, -10.5244140625, -9.802734375, -9.0810546875, -8.359375, -7.6376953125, -6.916015625, -6.1943359375, -5.47265625, -4.7509765625, -4.029296875, -3.3076171875, -2.5859375, -1.8642578125, -1.142578125, -0.4208984375, 0.30078125, 1.0224609375, 1.744140625, 2.4658203125, 3.1875, 3.9091796875, 4.630859375, 5.3525390625, 6.07421875, 6.7958984375, 7.517578125, 8.2392578125, 8.9609375, 9.6826171875, 10.404296875, 11.1259765625, 11.84765625, 12.5693359375, 13.291015625, 14.0126953125, 14.734375, 15.4560546875, 16.177734375, 16.8994140625, 17.62109375, 18.3427734375, 19.064453125, 19.7861328125, 20.5078125, 21.2294921875, 21.951171875, 22.6728515625, 23.39453125, 24.1162109375, 24.837890625, 25.5595703125, 26.28125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 5.0, 2.0, 1.0, 8.0, 11.0, 19.0, 8.0, 9.0, 14.0, 22.0, 13.0, 32.0, 34.0, 38.0, 39.0, 36.0, 43.0, 43.0, 52.0, 53.0, 55.0, 46.0, 37.0, 51.0, 36.0, 40.0, 35.0, 34.0, 29.0, 29.0, 18.0, 24.0, 20.0, 13.0, 13.0, 13.0, 12.0, 6.0, 2.0, 8.0, 7.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.4375, -16.88525390625, -16.3330078125, -15.78076171875, -15.228515625, -14.67626953125, -14.1240234375, -13.57177734375, -13.01953125, -12.46728515625, -11.9150390625, -11.36279296875, -10.810546875, -10.25830078125, -9.7060546875, -9.15380859375, -8.6015625, -8.04931640625, -7.4970703125, -6.94482421875, -6.392578125, -5.84033203125, -5.2880859375, -4.73583984375, -4.18359375, -3.63134765625, -3.0791015625, -2.52685546875, -1.974609375, -1.42236328125, -0.8701171875, -0.31787109375, 0.234375, 0.78662109375, 1.3388671875, 1.89111328125, 2.443359375, 2.99560546875, 3.5478515625, 4.10009765625, 4.65234375, 5.20458984375, 5.7568359375, 6.30908203125, 6.861328125, 7.41357421875, 7.9658203125, 8.51806640625, 9.0703125, 9.62255859375, 10.1748046875, 10.72705078125, 11.279296875, 11.83154296875, 12.3837890625, 12.93603515625, 13.48828125, 14.04052734375, 14.5927734375, 15.14501953125, 15.697265625, 16.24951171875, 16.8017578125, 17.35400390625, 17.90625]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 8.0, 11.0, 15.0, 19.0, 30.0, 23.0, 44.0, 76.0, 102.0, 133.0, 190.0, 277.0, 411.0, 635.0, 867.0, 1458.0, 2159.0, 3526.0, 5921.0, 10199.0, 19315.0, 39693.0, 87700.0, 198412.0, 308574.0, 197214.0, 87147.0, 39225.0, 19358.0, 10122.0, 5778.0, 3529.0, 2142.0, 1372.0, 924.0, 589.0, 395.0, 273.0, 200.0, 149.0, 104.0, 73.0, 45.0, 37.0, 24.0, 23.0, 9.0, 14.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-24.8125, -24.024658203125, -23.23681640625, -22.448974609375, -21.6611328125, -20.873291015625, -20.08544921875, -19.297607421875, -18.509765625, -17.721923828125, -16.93408203125, -16.146240234375, -15.3583984375, -14.570556640625, -13.78271484375, -12.994873046875, -12.20703125, -11.419189453125, -10.63134765625, -9.843505859375, -9.0556640625, -8.267822265625, -7.47998046875, -6.692138671875, -5.904296875, -5.116455078125, -4.32861328125, -3.540771484375, -2.7529296875, -1.965087890625, -1.17724609375, -0.389404296875, 0.3984375, 1.186279296875, 1.97412109375, 2.761962890625, 3.5498046875, 4.337646484375, 5.12548828125, 5.913330078125, 6.701171875, 7.489013671875, 8.27685546875, 9.064697265625, 9.8525390625, 10.640380859375, 11.42822265625, 12.216064453125, 13.00390625, 13.791748046875, 14.57958984375, 15.367431640625, 16.1552734375, 16.943115234375, 17.73095703125, 18.518798828125, 19.306640625, 20.094482421875, 20.88232421875, 21.670166015625, 22.4580078125, 23.245849609375, 24.03369140625, 24.821533203125, 25.609375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 4.0, 0.0, 2.0, 5.0, 4.0, 0.0, 3.0, 6.0, 11.0, 10.0, 9.0, 8.0, 15.0, 20.0, 15.0, 13.0, 16.0, 18.0, 24.0, 29.0, 36.0, 28.0, 25.0, 36.0, 33.0, 32.0, 44.0, 31.0, 37.0, 36.0, 43.0, 29.0, 35.0, 29.0, 31.0, 38.0, 37.0, 30.0, 15.0, 29.0, 14.0, 21.0, 20.0, 11.0, 15.0, 10.0, 17.0, 7.0, 5.0, 12.0, 5.0, 7.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.4375, -8.157470703125, -7.87744140625, -7.597412109375, -7.3173828125, -7.037353515625, -6.75732421875, -6.477294921875, -6.197265625, -5.917236328125, -5.63720703125, -5.357177734375, -5.0771484375, -4.797119140625, -4.51708984375, -4.237060546875, -3.95703125, -3.677001953125, -3.39697265625, -3.116943359375, -2.8369140625, -2.556884765625, -2.27685546875, -1.996826171875, -1.716796875, -1.436767578125, -1.15673828125, -0.876708984375, -0.5966796875, -0.316650390625, -0.03662109375, 0.243408203125, 0.5234375, 0.803466796875, 1.08349609375, 1.363525390625, 1.6435546875, 1.923583984375, 2.20361328125, 2.483642578125, 2.763671875, 3.043701171875, 3.32373046875, 3.603759765625, 3.8837890625, 4.163818359375, 4.44384765625, 4.723876953125, 5.00390625, 5.283935546875, 5.56396484375, 5.843994140625, 6.1240234375, 6.404052734375, 6.68408203125, 6.964111328125, 7.244140625, 7.524169921875, 7.80419921875, 8.084228515625, 8.3642578125, 8.644287109375, 8.92431640625, 9.204345703125, 9.484375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 1.0, 4.0, 9.0, 8.0, 15.0, 8.0, 27.0, 29.0, 49.0, 54.0, 96.0, 123.0, 206.0, 304.0, 450.0, 728.0, 1228.0, 2261.0, 4206.0, 8865.0, 20967.0, 57683.0, 180515.0, 407400.0, 238142.0, 76158.0, 26690.0, 10799.0, 5110.0, 2584.0, 1464.0, 808.0, 539.0, 334.0, 220.0, 141.0, 88.0, 68.0, 42.0, 39.0, 27.0, 26.0, 12.0, 11.0, 4.0, 4.0, 4.0, 6.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.375, -15.822265625, -15.26953125, -14.716796875, -14.1640625, -13.611328125, -13.05859375, -12.505859375, -11.953125, -11.400390625, -10.84765625, -10.294921875, -9.7421875, -9.189453125, -8.63671875, -8.083984375, -7.53125, -6.978515625, -6.42578125, -5.873046875, -5.3203125, -4.767578125, -4.21484375, -3.662109375, -3.109375, -2.556640625, -2.00390625, -1.451171875, -0.8984375, -0.345703125, 0.20703125, 0.759765625, 1.3125, 1.865234375, 2.41796875, 2.970703125, 3.5234375, 4.076171875, 4.62890625, 5.181640625, 5.734375, 6.287109375, 6.83984375, 7.392578125, 7.9453125, 8.498046875, 9.05078125, 9.603515625, 10.15625, 10.708984375, 11.26171875, 11.814453125, 12.3671875, 12.919921875, 13.47265625, 14.025390625, 14.578125, 15.130859375, 15.68359375, 16.236328125, 16.7890625, 17.341796875, 17.89453125, 18.447265625, 19.0]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 7.0, 5.0, 6.0, 3.0, 5.0, 7.0, 7.0, 13.0, 19.0, 23.0, 46.0, 96.0, 147.0, 181.0, 143.0, 96.0, 58.0, 46.0, 24.0, 18.0, 7.0, 3.0, 13.0, 4.0, 7.0, 3.0, 2.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00098419189453125, -0.000951036810874939, -0.0009178817272186279, -0.0008847266435623169, -0.0008515715599060059, -0.0008184164762496948, -0.0007852613925933838, -0.0007521063089370728, -0.0007189512252807617, -0.0006857961416244507, -0.0006526410579681396, -0.0006194859743118286, -0.0005863308906555176, -0.0005531758069992065, -0.0005200207233428955, -0.00048686563968658447, -0.00045371055603027344, -0.0004205554723739624, -0.00038740038871765137, -0.00035424530506134033, -0.0003210902214050293, -0.00028793513774871826, -0.0002547800540924072, -0.0002216249704360962, -0.00018846988677978516, -0.00015531480312347412, -0.00012215971946716309, -8.900463581085205e-05, -5.5849552154541016e-05, -2.269446849822998e-05, 1.0460615158081055e-05, 4.361569881439209e-05, 7.677078247070312e-05, 0.00010992586612701416, 0.0001430809497833252, 0.00017623603343963623, 0.00020939111709594727, 0.0002425462007522583, 0.00027570128440856934, 0.00030885636806488037, 0.0003420114517211914, 0.00037516653537750244, 0.0004083216190338135, 0.0004414767026901245, 0.00047463178634643555, 0.0005077868700027466, 0.0005409419536590576, 0.0005740970373153687, 0.0006072521209716797, 0.0006404072046279907, 0.0006735622882843018, 0.0007067173719406128, 0.0007398724555969238, 0.0007730275392532349, 0.0008061826229095459, 0.0008393377065658569, 0.000872492790222168, 0.000905647873878479, 0.00093880295753479, 0.0009719580411911011, 0.0010051131248474121, 0.0010382682085037231, 0.0010714232921600342, 0.0011045783758163452, 0.0011377334594726562]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 12.0, 5.0, 11.0, 20.0, 24.0, 50.0, 57.0, 54.0, 135.0, 161.0, 220.0, 321.0, 440.0, 631.0, 871.0, 1285.0, 1866.0, 2792.0, 4194.0, 6763.0, 11631.0, 21097.0, 41126.0, 82429.0, 157736.0, 233072.0, 213199.0, 127636.0, 64826.0, 32432.0, 16852.0, 9426.0, 5759.0, 3607.0, 2393.0, 1672.0, 1132.0, 736.0, 548.0, 411.0, 276.0, 182.0, 128.0, 78.0, 86.0, 61.0, 40.0, 19.0, 25.0, 8.0, 6.0, 8.0, 3.0, 6.0, 3.0, 0.0, 2.0], "bins": [-10.8984375, -10.56640625, -10.234375, -9.90234375, -9.5703125, -9.23828125, -8.90625, -8.57421875, -8.2421875, -7.91015625, -7.578125, -7.24609375, -6.9140625, -6.58203125, -6.25, -5.91796875, -5.5859375, -5.25390625, -4.921875, -4.58984375, -4.2578125, -3.92578125, -3.59375, -3.26171875, -2.9296875, -2.59765625, -2.265625, -1.93359375, -1.6015625, -1.26953125, -0.9375, -0.60546875, -0.2734375, 0.05859375, 0.390625, 0.72265625, 1.0546875, 1.38671875, 1.71875, 2.05078125, 2.3828125, 2.71484375, 3.046875, 3.37890625, 3.7109375, 4.04296875, 4.375, 4.70703125, 5.0390625, 5.37109375, 5.703125, 6.03515625, 6.3671875, 6.69921875, 7.03125, 7.36328125, 7.6953125, 8.02734375, 8.359375, 8.69140625, 9.0234375, 9.35546875, 9.6875, 10.01953125, 10.3515625]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 1.0, 3.0, 5.0, 3.0, 3.0, 4.0, 4.0, 11.0, 8.0, 9.0, 18.0, 12.0, 30.0, 30.0, 34.0, 42.0, 51.0, 53.0, 74.0, 60.0, 70.0, 75.0, 63.0, 62.0, 53.0, 44.0, 33.0, 25.0, 29.0, 19.0, 19.0, 7.0, 10.0, 2.0, 6.0, 11.0, 4.0, 4.0, 5.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.89453125, -3.787872314453125, -3.68121337890625, -3.574554443359375, -3.4678955078125, -3.361236572265625, -3.25457763671875, -3.147918701171875, -3.041259765625, -2.934600830078125, -2.82794189453125, -2.721282958984375, -2.6146240234375, -2.507965087890625, -2.40130615234375, -2.294647216796875, -2.18798828125, -2.081329345703125, -1.97467041015625, -1.868011474609375, -1.7613525390625, -1.654693603515625, -1.54803466796875, -1.441375732421875, -1.334716796875, -1.228057861328125, -1.12139892578125, -1.014739990234375, -0.9080810546875, -0.801422119140625, -0.69476318359375, -0.588104248046875, -0.4814453125, -0.374786376953125, -0.26812744140625, -0.161468505859375, -0.0548095703125, 0.051849365234375, 0.15850830078125, 0.265167236328125, 0.371826171875, 0.478485107421875, 0.58514404296875, 0.691802978515625, 0.7984619140625, 0.905120849609375, 1.01177978515625, 1.118438720703125, 1.22509765625, 1.331756591796875, 1.43841552734375, 1.545074462890625, 1.6517333984375, 1.758392333984375, 1.86505126953125, 1.971710205078125, 2.078369140625, 2.185028076171875, 2.29168701171875, 2.398345947265625, 2.5050048828125, 2.611663818359375, 2.71832275390625, 2.824981689453125, 2.931640625]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 4.0, 5.0, 5.0, 2.0, 9.0, 4.0, 13.0, 9.0, 7.0, 16.0, 23.0, 24.0, 20.0, 30.0, 39.0, 45.0, 48.0, 54.0, 46.0, 39.0, 54.0, 64.0, 47.0, 48.0, 41.0, 47.0, 50.0, 39.0, 37.0, 22.0, 23.0, 15.0, 11.0, 10.0, 9.0, 10.0, 6.0, 5.0, 6.0, 9.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-20.627744674682617, -20.064741134643555, -19.50173568725586, -18.938732147216797, -18.375728607177734, -17.81272315979004, -17.249719619750977, -16.686716079711914, -16.12371063232422, -15.56070613861084, -14.997702598571777, -14.434698104858398, -13.87169361114502, -13.30868911743164, -12.745685577392578, -12.1826810836792, -11.619677543640137, -11.056673049926758, -10.493669509887695, -9.930665016174316, -9.367660522460938, -8.804656982421875, -8.241652488708496, -7.678647994995117, -7.1156439781188965, -6.552639961242676, -5.989635467529297, -5.426631450653076, -4.8636274337768555, -4.300622940063477, -3.737618923187256, -3.174614667892456, -2.6116104125976562, -2.0486061573028564, -1.4856020212173462, -0.9225978851318359, -0.35959362983703613, 0.20341062545776367, 0.7664146423339844, 1.3294188976287842, 1.892423152923584, 2.455427408218384, 3.0184316635131836, 3.5814356803894043, 4.144439697265625, 4.707444190979004, 5.270448207855225, 5.833452224731445, 6.396456718444824, 6.959460735321045, 7.522465229034424, 8.085469245910645, 8.648473739624023, 9.211477279663086, 9.774481773376465, 10.337486267089844, 10.900489807128906, 11.463494300842285, 12.026497840881348, 12.589502334594727, 13.152506828308105, 13.715511322021484, 14.278514862060547, 14.841519355773926, 15.404523849487305]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 3.0, 5.0, 1.0, 9.0, 9.0, 14.0, 12.0, 13.0, 19.0, 16.0, 24.0, 26.0, 23.0, 29.0, 27.0, 42.0, 51.0, 40.0, 47.0, 48.0, 43.0, 41.0, 46.0, 37.0, 36.0, 35.0, 43.0, 37.0, 24.0, 25.0, 27.0, 26.0, 20.0, 24.0, 18.0, 10.0, 16.0, 5.0, 8.0, 5.0, 1.0, 2.0, 5.0, 2.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-15.564419746398926, -15.093890190124512, -14.623359680175781, -14.152830123901367, -13.682299613952637, -13.211770057678223, -12.741239547729492, -12.270709991455078, -11.800180435180664, -11.32965087890625, -10.85912036895752, -10.388590812683105, -9.918060302734375, -9.447530746459961, -8.977001190185547, -8.506470680236816, -8.035940170288086, -7.565410137176514, -7.094880104064941, -6.624350547790527, -6.153820037841797, -5.683290481567383, -5.2127604484558105, -4.742230415344238, -4.271700382232666, -3.8011703491210938, -3.3306403160095215, -2.8601105213165283, -2.389580488204956, -1.9190504550933838, -1.4485206604003906, -0.9779906272888184, -0.5074615478515625, -0.03693157434463501, 0.4335983991622925, 0.9041283130645752, 1.3746583461761475, 1.8451883792877197, 2.315718173980713, 2.786248207092285, 3.2567782402038574, 3.7273082733154297, 4.197838306427002, 4.668368339538574, 5.138897895812988, 5.609428405761719, 6.079957962036133, 6.550487995147705, 7.021018028259277, 7.49154806137085, 7.962078094482422, 8.432607650756836, 8.903138160705566, 9.37366771697998, 9.844198226928711, 10.314727783203125, 10.785257339477539, 11.255786895751953, 11.726317405700684, 12.196846961975098, 12.667377471923828, 13.137907028198242, 13.608436584472656, 14.078967094421387, 14.549497604370117]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 6.0, 10.0, 13.0, 18.0, 19.0, 41.0, 53.0, 87.0, 121.0, 169.0, 270.0, 410.0, 652.0, 1038.0, 1527.0, 2320.0, 3902.0, 6258.0, 10705.0, 18108.0, 30479.0, 51608.0, 83490.0, 124748.0, 160415.0, 166719.0, 138349.0, 96134.0, 60701.0, 36313.0, 21403.0, 12600.0, 7640.0, 4532.0, 2750.0, 1765.0, 1080.0, 758.0, 475.0, 289.0, 182.0, 147.0, 95.0, 48.0, 36.0, 18.0, 22.0, 10.0, 11.0, 9.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-20.046875, -19.423583984375, -18.80029296875, -18.177001953125, -17.5537109375, -16.930419921875, -16.30712890625, -15.683837890625, -15.060546875, -14.437255859375, -13.81396484375, -13.190673828125, -12.5673828125, -11.944091796875, -11.32080078125, -10.697509765625, -10.07421875, -9.450927734375, -8.82763671875, -8.204345703125, -7.5810546875, -6.957763671875, -6.33447265625, -5.711181640625, -5.087890625, -4.464599609375, -3.84130859375, -3.218017578125, -2.5947265625, -1.971435546875, -1.34814453125, -0.724853515625, -0.1015625, 0.521728515625, 1.14501953125, 1.768310546875, 2.3916015625, 3.014892578125, 3.63818359375, 4.261474609375, 4.884765625, 5.508056640625, 6.13134765625, 6.754638671875, 7.3779296875, 8.001220703125, 8.62451171875, 9.247802734375, 9.87109375, 10.494384765625, 11.11767578125, 11.740966796875, 12.3642578125, 12.987548828125, 13.61083984375, 14.234130859375, 14.857421875, 15.480712890625, 16.10400390625, 16.727294921875, 17.3505859375, 17.973876953125, 18.59716796875, 19.220458984375, 19.84375]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 6.0, 3.0, 3.0, 3.0, 5.0, 7.0, 14.0, 14.0, 8.0, 15.0, 18.0, 12.0, 25.0, 19.0, 25.0, 35.0, 32.0, 40.0, 41.0, 36.0, 41.0, 35.0, 52.0, 36.0, 41.0, 50.0, 40.0, 30.0, 31.0, 31.0, 39.0, 36.0, 24.0, 23.0, 24.0, 9.0, 21.0, 20.0, 10.0, 12.0, 8.0, 7.0, 4.0, 1.0, 7.0, 3.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-14.65625, -14.1898193359375, -13.723388671875, -13.2569580078125, -12.79052734375, -12.3240966796875, -11.857666015625, -11.3912353515625, -10.9248046875, -10.4583740234375, -9.991943359375, -9.5255126953125, -9.05908203125, -8.5926513671875, -8.126220703125, -7.6597900390625, -7.193359375, -6.7269287109375, -6.260498046875, -5.7940673828125, -5.32763671875, -4.8612060546875, -4.394775390625, -3.9283447265625, -3.4619140625, -2.9954833984375, -2.529052734375, -2.0626220703125, -1.59619140625, -1.1297607421875, -0.663330078125, -0.1968994140625, 0.26953125, 0.7359619140625, 1.202392578125, 1.6688232421875, 2.13525390625, 2.6016845703125, 3.068115234375, 3.5345458984375, 4.0009765625, 4.4674072265625, 4.933837890625, 5.4002685546875, 5.86669921875, 6.3331298828125, 6.799560546875, 7.2659912109375, 7.732421875, 8.1988525390625, 8.665283203125, 9.1317138671875, 9.59814453125, 10.0645751953125, 10.531005859375, 10.9974365234375, 11.4638671875, 11.9302978515625, 12.396728515625, 12.8631591796875, 13.32958984375, 13.7960205078125, 14.262451171875, 14.7288818359375, 15.1953125]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 12.0, 18.0, 21.0, 33.0, 35.0, 71.0, 114.0, 152.0, 220.0, 344.0, 534.0, 797.0, 1265.0, 1908.0, 2945.0, 4229.0, 6668.0, 10139.0, 15593.0, 24098.0, 35781.0, 52977.0, 75995.0, 102886.0, 126526.0, 135060.0, 124374.0, 99918.0, 73755.0, 51182.0, 34774.0, 22774.0, 15053.0, 9765.0, 6323.0, 4157.0, 2715.0, 1782.0, 1189.0, 807.0, 527.0, 367.0, 238.0, 126.0, 114.0, 65.0, 49.0, 43.0, 15.0, 8.0, 8.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0], "bins": [-14.8671875, -14.4090576171875, -13.950927734375, -13.4927978515625, -13.03466796875, -12.5765380859375, -12.118408203125, -11.6602783203125, -11.2021484375, -10.7440185546875, -10.285888671875, -9.8277587890625, -9.36962890625, -8.9114990234375, -8.453369140625, -7.9952392578125, -7.537109375, -7.0789794921875, -6.620849609375, -6.1627197265625, -5.70458984375, -5.2464599609375, -4.788330078125, -4.3302001953125, -3.8720703125, -3.4139404296875, -2.955810546875, -2.4976806640625, -2.03955078125, -1.5814208984375, -1.123291015625, -0.6651611328125, -0.20703125, 0.2510986328125, 0.709228515625, 1.1673583984375, 1.62548828125, 2.0836181640625, 2.541748046875, 2.9998779296875, 3.4580078125, 3.9161376953125, 4.374267578125, 4.8323974609375, 5.29052734375, 5.7486572265625, 6.206787109375, 6.6649169921875, 7.123046875, 7.5811767578125, 8.039306640625, 8.4974365234375, 8.95556640625, 9.4136962890625, 9.871826171875, 10.3299560546875, 10.7880859375, 11.2462158203125, 11.704345703125, 12.1624755859375, 12.62060546875, 13.0787353515625, 13.536865234375, 13.9949951171875, 14.453125]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 10.0, 2.0, 5.0, 6.0, 7.0, 10.0, 11.0, 11.0, 8.0, 18.0, 25.0, 23.0, 33.0, 35.0, 35.0, 24.0, 37.0, 40.0, 27.0, 49.0, 47.0, 47.0, 53.0, 48.0, 40.0, 44.0, 36.0, 30.0, 32.0, 23.0, 29.0, 23.0, 23.0, 20.0, 24.0, 8.0, 15.0, 11.0, 9.0, 4.0, 10.0, 0.0, 3.0, 2.0, 6.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.3125, -9.975341796875, -9.63818359375, -9.301025390625, -8.9638671875, -8.626708984375, -8.28955078125, -7.952392578125, -7.615234375, -7.278076171875, -6.94091796875, -6.603759765625, -6.2666015625, -5.929443359375, -5.59228515625, -5.255126953125, -4.91796875, -4.580810546875, -4.24365234375, -3.906494140625, -3.5693359375, -3.232177734375, -2.89501953125, -2.557861328125, -2.220703125, -1.883544921875, -1.54638671875, -1.209228515625, -0.8720703125, -0.534912109375, -0.19775390625, 0.139404296875, 0.4765625, 0.813720703125, 1.15087890625, 1.488037109375, 1.8251953125, 2.162353515625, 2.49951171875, 2.836669921875, 3.173828125, 3.510986328125, 3.84814453125, 4.185302734375, 4.5224609375, 4.859619140625, 5.19677734375, 5.533935546875, 5.87109375, 6.208251953125, 6.54541015625, 6.882568359375, 7.2197265625, 7.556884765625, 7.89404296875, 8.231201171875, 8.568359375, 8.905517578125, 9.24267578125, 9.579833984375, 9.9169921875, 10.254150390625, 10.59130859375, 10.928466796875, 11.265625]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 4.0, 11.0, 22.0, 14.0, 23.0, 30.0, 49.0, 82.0, 93.0, 131.0, 169.0, 232.0, 345.0, 482.0, 731.0, 1043.0, 1628.0, 2518.0, 3990.0, 6803.0, 12131.0, 23533.0, 51212.0, 124132.0, 282612.0, 293318.0, 132122.0, 54278.0, 25097.0, 12760.0, 6921.0, 4224.0, 2560.0, 1691.0, 1081.0, 719.0, 512.0, 376.0, 237.0, 183.0, 128.0, 82.0, 71.0, 49.0, 44.0, 26.0, 19.0, 8.0, 7.0, 12.0, 3.0, 6.0, 5.0, 4.0], "bins": [-34.625, -33.63671875, -32.6484375, -31.66015625, -30.671875, -29.68359375, -28.6953125, -27.70703125, -26.71875, -25.73046875, -24.7421875, -23.75390625, -22.765625, -21.77734375, -20.7890625, -19.80078125, -18.8125, -17.82421875, -16.8359375, -15.84765625, -14.859375, -13.87109375, -12.8828125, -11.89453125, -10.90625, -9.91796875, -8.9296875, -7.94140625, -6.953125, -5.96484375, -4.9765625, -3.98828125, -3.0, -2.01171875, -1.0234375, -0.03515625, 0.953125, 1.94140625, 2.9296875, 3.91796875, 4.90625, 5.89453125, 6.8828125, 7.87109375, 8.859375, 9.84765625, 10.8359375, 11.82421875, 12.8125, 13.80078125, 14.7890625, 15.77734375, 16.765625, 17.75390625, 18.7421875, 19.73046875, 20.71875, 21.70703125, 22.6953125, 23.68359375, 24.671875, 25.66015625, 26.6484375, 27.63671875, 28.625]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 8.0, 6.0, 15.0, 14.0, 49.0, 97.0, 148.0, 208.0, 168.0, 133.0, 58.0, 34.0, 20.0, 10.0, 9.0, 6.0, 5.0, 6.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.004913330078125, -0.0047228336334228516, -0.004532337188720703, -0.004341840744018555, -0.004151344299316406, -0.003960847854614258, -0.0037703514099121094, -0.003579854965209961, -0.0033893585205078125, -0.003198862075805664, -0.0030083656311035156, -0.002817869186401367, -0.0026273727416992188, -0.0024368762969970703, -0.002246379852294922, -0.0020558834075927734, -0.001865386962890625, -0.0016748905181884766, -0.0014843940734863281, -0.0012938976287841797, -0.0011034011840820312, -0.0009129047393798828, -0.0007224082946777344, -0.0005319118499755859, -0.0003414154052734375, -0.00015091896057128906, 3.9577484130859375e-05, 0.0002300739288330078, 0.00042057037353515625, 0.0006110668182373047, 0.0008015632629394531, 0.0009920597076416016, 0.00118255615234375, 0.0013730525970458984, 0.0015635490417480469, 0.0017540454864501953, 0.0019445419311523438, 0.002135038375854492, 0.0023255348205566406, 0.002516031265258789, 0.0027065277099609375, 0.002897024154663086, 0.0030875205993652344, 0.003278017044067383, 0.0034685134887695312, 0.0036590099334716797, 0.003849506378173828, 0.0040400028228759766, 0.004230499267578125, 0.0044209957122802734, 0.004611492156982422, 0.00480198860168457, 0.004992485046386719, 0.005182981491088867, 0.005373477935791016, 0.005563974380493164, 0.0057544708251953125, 0.005944967269897461, 0.006135463714599609, 0.006325960159301758, 0.006516456604003906, 0.006706953048706055, 0.006897449493408203, 0.0070879459381103516, 0.0072784423828125]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 4.0, 9.0, 10.0, 8.0, 19.0, 31.0, 29.0, 55.0, 64.0, 101.0, 175.0, 233.0, 336.0, 476.0, 671.0, 950.0, 1511.0, 2304.0, 3496.0, 5698.0, 9435.0, 16682.0, 30938.0, 61029.0, 121337.0, 208202.0, 237558.0, 163660.0, 85826.0, 42691.0, 22321.0, 12367.0, 7436.0, 4463.0, 2749.0, 1821.0, 1251.0, 842.0, 555.0, 373.0, 251.0, 158.0, 119.0, 90.0, 61.0, 50.0, 30.0, 25.0, 22.0, 18.0, 13.0, 11.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-18.578125, -17.94287109375, -17.3076171875, -16.67236328125, -16.037109375, -15.40185546875, -14.7666015625, -14.13134765625, -13.49609375, -12.86083984375, -12.2255859375, -11.59033203125, -10.955078125, -10.31982421875, -9.6845703125, -9.04931640625, -8.4140625, -7.77880859375, -7.1435546875, -6.50830078125, -5.873046875, -5.23779296875, -4.6025390625, -3.96728515625, -3.33203125, -2.69677734375, -2.0615234375, -1.42626953125, -0.791015625, -0.15576171875, 0.4794921875, 1.11474609375, 1.75, 2.38525390625, 3.0205078125, 3.65576171875, 4.291015625, 4.92626953125, 5.5615234375, 6.19677734375, 6.83203125, 7.46728515625, 8.1025390625, 8.73779296875, 9.373046875, 10.00830078125, 10.6435546875, 11.27880859375, 11.9140625, 12.54931640625, 13.1845703125, 13.81982421875, 14.455078125, 15.09033203125, 15.7255859375, 16.36083984375, 16.99609375, 17.63134765625, 18.2666015625, 18.90185546875, 19.537109375, 20.17236328125, 20.8076171875, 21.44287109375, 22.078125]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 3.0, 3.0, 5.0, 2.0, 6.0, 10.0, 15.0, 11.0, 15.0, 23.0, 30.0, 41.0, 62.0, 51.0, 69.0, 86.0, 96.0, 65.0, 74.0, 76.0, 56.0, 48.0, 28.0, 27.0, 23.0, 18.0, 18.0, 10.0, 9.0, 9.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.08203125, -6.8665771484375, -6.651123046875, -6.4356689453125, -6.22021484375, -6.0047607421875, -5.789306640625, -5.5738525390625, -5.3583984375, -5.1429443359375, -4.927490234375, -4.7120361328125, -4.49658203125, -4.2811279296875, -4.065673828125, -3.8502197265625, -3.634765625, -3.4193115234375, -3.203857421875, -2.9884033203125, -2.77294921875, -2.5574951171875, -2.342041015625, -2.1265869140625, -1.9111328125, -1.6956787109375, -1.480224609375, -1.2647705078125, -1.04931640625, -0.8338623046875, -0.618408203125, -0.4029541015625, -0.1875, 0.0279541015625, 0.243408203125, 0.4588623046875, 0.67431640625, 0.8897705078125, 1.105224609375, 1.3206787109375, 1.5361328125, 1.7515869140625, 1.967041015625, 2.1824951171875, 2.39794921875, 2.6134033203125, 2.828857421875, 3.0443115234375, 3.259765625, 3.4752197265625, 3.690673828125, 3.9061279296875, 4.12158203125, 4.3370361328125, 4.552490234375, 4.7679443359375, 4.9833984375, 5.1988525390625, 5.414306640625, 5.6297607421875, 5.84521484375, 6.0606689453125, 6.276123046875, 6.4915771484375, 6.70703125]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 1.0, 2.0, 4.0, 3.0, 5.0, 8.0, 10.0, 9.0, 9.0, 13.0, 19.0, 16.0, 16.0, 11.0, 21.0, 29.0, 35.0, 38.0, 34.0, 49.0, 48.0, 59.0, 48.0, 47.0, 48.0, 54.0, 50.0, 50.0, 30.0, 36.0, 33.0, 26.0, 17.0, 22.0, 16.0, 16.0, 11.0, 11.0, 8.0, 5.0, 6.0, 9.0, 5.0, 4.0, 5.0, 1.0, 3.0, 2.0, 0.0, 2.0], "bins": [-20.95793342590332, -20.393394470214844, -19.828857421875, -19.264320373535156, -18.69978141784668, -18.135242462158203, -17.57070541381836, -17.006168365478516, -16.44162940979004, -15.877091407775879, -15.312553405761719, -14.748015403747559, -14.183477401733398, -13.618939399719238, -13.054401397705078, -12.489863395690918, -11.925325393676758, -11.360787391662598, -10.796249389648438, -10.231711387634277, -9.667173385620117, -9.102635383605957, -8.538097381591797, -7.973559379577637, -7.409021377563477, -6.844483375549316, -6.279945373535156, -5.715407371520996, -5.150869369506836, -4.586331367492676, -4.021793365478516, -3.4572553634643555, -2.892716407775879, -2.3281784057617188, -1.7636404037475586, -1.1991024017333984, -0.6345643997192383, -0.07002639770507812, 0.49451160430908203, 1.0590496063232422, 1.6235876083374023, 2.1881256103515625, 2.7526636123657227, 3.317201614379883, 3.881739616394043, 4.446277618408203, 5.010815620422363, 5.575353622436523, 6.139891624450684, 6.704429626464844, 7.268967628479004, 7.833505630493164, 8.398043632507324, 8.962581634521484, 9.527119636535645, 10.091657638549805, 10.656195640563965, 11.220733642578125, 11.785271644592285, 12.349809646606445, 12.914347648620605, 13.478885650634766, 14.043423652648926, 14.607961654663086, 15.172499656677246]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 3.0, 2.0, 5.0, 6.0, 7.0, 6.0, 17.0, 13.0, 14.0, 16.0, 19.0, 25.0, 31.0, 28.0, 36.0, 38.0, 48.0, 51.0, 52.0, 46.0, 41.0, 43.0, 51.0, 35.0, 32.0, 39.0, 40.0, 37.0, 38.0, 27.0, 33.0, 23.0, 17.0, 19.0, 16.0, 7.0, 15.0, 8.0, 2.0, 4.0, 5.0, 1.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-18.153623580932617, -17.63864517211914, -17.12366485595703, -16.608686447143555, -16.093708038330078, -15.578729629516602, -15.063750267028809, -14.548770904541016, -14.033792495727539, -13.518814086914062, -13.00383472442627, -12.488855361938477, -11.973876953125, -11.458898544311523, -10.94391918182373, -10.428939819335938, -9.913961410522461, -9.398983001708984, -8.884003639221191, -8.369024276733398, -7.854045867919922, -7.339066982269287, -6.824088096618652, -6.309109210968018, -5.794130325317383, -5.279151439666748, -4.764172554016113, -4.2491936683654785, -3.7342147827148438, -3.219235897064209, -2.704257011413574, -2.1892781257629395, -1.674300193786621, -1.1593213081359863, -0.6443424224853516, -0.1293635368347168, 0.38561534881591797, 0.9005942344665527, 1.4155731201171875, 1.9305520057678223, 2.445530891418457, 2.960509777069092, 3.4754886627197266, 3.9904675483703613, 4.505446434020996, 5.020425319671631, 5.535404205322266, 6.0503830909729, 6.565361976623535, 7.08034086227417, 7.595319747924805, 8.110298156738281, 8.625277519226074, 9.140256881713867, 9.655235290527344, 10.17021369934082, 10.685193061828613, 11.200172424316406, 11.715150833129883, 12.23012924194336, 12.745108604431152, 13.260087966918945, 13.775066375732422, 14.290044784545898, 14.805024147033691]}, "gradients/decoder.bert.encoder.layer.17.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 6.0, 1.0, 3.0, 4.0, 5.0, 9.0, 16.0, 30.0, 32.0, 77.0, 105.0, 155.0, 216.0, 381.0, 633.0, 1057.0, 1725.0, 2982.0, 5084.0, 8673.0, 15755.0, 28810.0, 55045.0, 109642.0, 226026.0, 468803.0, 839161.0, 992550.0, 703599.0, 367540.0, 177853.0, 88204.0, 44607.0, 24009.0, 13004.0, 7510.0, 4409.0, 2553.0, 1566.0, 899.0, 591.0, 318.0, 230.0, 148.0, 87.0, 72.0, 44.0, 23.0, 10.0, 13.0, 9.0, 7.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-18.609375, -18.03369140625, -17.4580078125, -16.88232421875, -16.306640625, -15.73095703125, -15.1552734375, -14.57958984375, -14.00390625, -13.42822265625, -12.8525390625, -12.27685546875, -11.701171875, -11.12548828125, -10.5498046875, -9.97412109375, -9.3984375, -8.82275390625, -8.2470703125, -7.67138671875, -7.095703125, -6.52001953125, -5.9443359375, -5.36865234375, -4.79296875, -4.21728515625, -3.6416015625, -3.06591796875, -2.490234375, -1.91455078125, -1.3388671875, -0.76318359375, -0.1875, 0.38818359375, 0.9638671875, 1.53955078125, 2.115234375, 2.69091796875, 3.2666015625, 3.84228515625, 4.41796875, 4.99365234375, 5.5693359375, 6.14501953125, 6.720703125, 7.29638671875, 7.8720703125, 8.44775390625, 9.0234375, 9.59912109375, 10.1748046875, 10.75048828125, 11.326171875, 11.90185546875, 12.4775390625, 13.05322265625, 13.62890625, 14.20458984375, 14.7802734375, 15.35595703125, 15.931640625, 16.50732421875, 17.0830078125, 17.65869140625, 18.234375]}, "gradients/decoder.bert.encoder.layer.17.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 6.0, 7.0, 10.0, 9.0, 11.0, 12.0, 20.0, 9.0, 20.0, 25.0, 37.0, 36.0, 36.0, 39.0, 39.0, 41.0, 44.0, 51.0, 44.0, 49.0, 44.0, 43.0, 51.0, 35.0, 39.0, 33.0, 34.0, 28.0, 22.0, 22.0, 22.0, 15.0, 11.0, 8.0, 12.0, 9.0, 7.0, 6.0, 5.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.75, -10.4105224609375, -10.071044921875, -9.7315673828125, -9.39208984375, -9.0526123046875, -8.713134765625, -8.3736572265625, -8.0341796875, -7.6947021484375, -7.355224609375, -7.0157470703125, -6.67626953125, -6.3367919921875, -5.997314453125, -5.6578369140625, -5.318359375, -4.9788818359375, -4.639404296875, -4.2999267578125, -3.96044921875, -3.6209716796875, -3.281494140625, -2.9420166015625, -2.6025390625, -2.2630615234375, -1.923583984375, -1.5841064453125, -1.24462890625, -0.9051513671875, -0.565673828125, -0.2261962890625, 0.11328125, 0.4527587890625, 0.792236328125, 1.1317138671875, 1.47119140625, 1.8106689453125, 2.150146484375, 2.4896240234375, 2.8291015625, 3.1685791015625, 3.508056640625, 3.8475341796875, 4.18701171875, 4.5264892578125, 4.865966796875, 5.2054443359375, 5.544921875, 5.8843994140625, 6.223876953125, 6.5633544921875, 6.90283203125, 7.2423095703125, 7.581787109375, 7.9212646484375, 8.2607421875, 8.6002197265625, 8.939697265625, 9.2791748046875, 9.61865234375, 9.9581298828125, 10.297607421875, 10.6370849609375, 10.9765625]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 6.0, 9.0, 9.0, 10.0, 22.0, 24.0, 64.0, 67.0, 118.0, 186.0, 361.0, 549.0, 889.0, 1507.0, 2561.0, 4470.0, 7792.0, 13911.0, 25269.0, 47214.0, 88637.0, 166818.0, 310738.0, 540447.0, 798707.0, 832889.0, 593780.0, 348064.0, 190579.0, 100463.0, 53162.0, 28601.0, 15428.0, 8916.0, 4889.0, 2784.0, 1667.0, 1052.0, 584.0, 372.0, 250.0, 145.0, 98.0, 65.0, 33.0, 24.0, 17.0, 13.0, 9.0, 3.0, 5.0, 4.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-16.171875, -15.65185546875, -15.1318359375, -14.61181640625, -14.091796875, -13.57177734375, -13.0517578125, -12.53173828125, -12.01171875, -11.49169921875, -10.9716796875, -10.45166015625, -9.931640625, -9.41162109375, -8.8916015625, -8.37158203125, -7.8515625, -7.33154296875, -6.8115234375, -6.29150390625, -5.771484375, -5.25146484375, -4.7314453125, -4.21142578125, -3.69140625, -3.17138671875, -2.6513671875, -2.13134765625, -1.611328125, -1.09130859375, -0.5712890625, -0.05126953125, 0.46875, 0.98876953125, 1.5087890625, 2.02880859375, 2.548828125, 3.06884765625, 3.5888671875, 4.10888671875, 4.62890625, 5.14892578125, 5.6689453125, 6.18896484375, 6.708984375, 7.22900390625, 7.7490234375, 8.26904296875, 8.7890625, 9.30908203125, 9.8291015625, 10.34912109375, 10.869140625, 11.38916015625, 11.9091796875, 12.42919921875, 12.94921875, 13.46923828125, 13.9892578125, 14.50927734375, 15.029296875, 15.54931640625, 16.0693359375, 16.58935546875, 17.109375]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 5.0, 11.0, 6.0, 12.0, 14.0, 22.0, 27.0, 35.0, 47.0, 65.0, 80.0, 78.0, 96.0, 112.0, 133.0, 160.0, 203.0, 206.0, 253.0, 266.0, 253.0, 252.0, 267.0, 205.0, 191.0, 182.0, 170.0, 126.0, 144.0, 93.0, 71.0, 69.0, 40.0, 45.0, 29.0, 33.0, 25.0, 11.0, 11.0, 4.0, 7.0, 4.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.87109375, -5.7020263671875, -5.532958984375, -5.3638916015625, -5.19482421875, -5.0257568359375, -4.856689453125, -4.6876220703125, -4.5185546875, -4.3494873046875, -4.180419921875, -4.0113525390625, -3.84228515625, -3.6732177734375, -3.504150390625, -3.3350830078125, -3.166015625, -2.9969482421875, -2.827880859375, -2.6588134765625, -2.48974609375, -2.3206787109375, -2.151611328125, -1.9825439453125, -1.8134765625, -1.6444091796875, -1.475341796875, -1.3062744140625, -1.13720703125, -0.9681396484375, -0.799072265625, -0.6300048828125, -0.4609375, -0.2918701171875, -0.122802734375, 0.0462646484375, 0.21533203125, 0.3843994140625, 0.553466796875, 0.7225341796875, 0.8916015625, 1.0606689453125, 1.229736328125, 1.3988037109375, 1.56787109375, 1.7369384765625, 1.906005859375, 2.0750732421875, 2.244140625, 2.4132080078125, 2.582275390625, 2.7513427734375, 2.92041015625, 3.0894775390625, 3.258544921875, 3.4276123046875, 3.5966796875, 3.7657470703125, 3.934814453125, 4.1038818359375, 4.27294921875, 4.4420166015625, 4.611083984375, 4.7801513671875, 4.94921875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 5.0, 9.0, 8.0, 9.0, 10.0, 14.0, 12.0, 19.0, 19.0, 37.0, 41.0, 49.0, 49.0, 49.0, 66.0, 52.0, 62.0, 78.0, 69.0, 54.0, 53.0, 35.0, 41.0, 30.0, 31.0, 22.0, 11.0, 14.0, 14.0, 11.0, 10.0, 8.0, 5.0, 1.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-24.769283294677734, -24.143207550048828, -23.517131805419922, -22.891056060791016, -22.26498031616211, -21.638904571533203, -21.012828826904297, -20.38675308227539, -19.760677337646484, -19.134601593017578, -18.508525848388672, -17.882450103759766, -17.25637435913086, -16.630298614501953, -16.004222869873047, -15.37814712524414, -14.752070426940918, -14.125994682312012, -13.499918937683105, -12.8738431930542, -12.247767448425293, -11.621691703796387, -10.995615005493164, -10.369539260864258, -9.743463516235352, -9.117387771606445, -8.491312026977539, -7.865236282348633, -7.239160537719727, -6.61308479309082, -5.987008571624756, -5.36093282699585, -4.734857559204102, -4.108781814575195, -3.482706069946289, -2.8566300868988037, -2.2305543422698975, -1.6044785976409912, -0.9784026145935059, -0.3523268699645996, 0.27374887466430664, 0.8998246788978577, 1.5259004831314087, 2.1519763469696045, 2.7780520915985107, 3.404127836227417, 4.030203819274902, 4.656279563903809, 5.282355308532715, 5.908431053161621, 6.534506797790527, 7.160582542419434, 7.78665828704834, 8.412734031677246, 9.038810729980469, 9.664886474609375, 10.290962219238281, 10.917037963867188, 11.543113708496094, 12.169189453125, 12.795265197753906, 13.421340942382812, 14.047416687011719, 14.673492431640625, 15.299568176269531]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 1.0, 5.0, 3.0, 0.0, 5.0, 5.0, 8.0, 8.0, 7.0, 16.0, 21.0, 22.0, 31.0, 25.0, 34.0, 27.0, 33.0, 33.0, 47.0, 37.0, 36.0, 33.0, 36.0, 51.0, 33.0, 43.0, 37.0, 36.0, 31.0, 39.0, 36.0, 33.0, 31.0, 21.0, 25.0, 23.0, 18.0, 13.0, 12.0, 10.0, 7.0, 9.0, 8.0, 4.0, 3.0, 2.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.344612121582031, -10.96313190460205, -10.58165168762207, -10.20017147064209, -9.81869125366211, -9.437211036682129, -9.055730819702148, -8.674251556396484, -8.292770385742188, -7.911290168762207, -7.529809951782227, -7.148329734802246, -6.766849517822266, -6.385369300842285, -6.003889560699463, -5.622409343719482, -5.24092960357666, -4.85944938659668, -4.477969169616699, -4.096488952636719, -3.7150089740753174, -3.333528757095337, -2.9520487785339355, -2.570568561553955, -2.1890883445739746, -1.8076081275939941, -1.4261280298233032, -1.0446479320526123, -0.6631677150726318, -0.28168749809265137, 0.09979248046875, 0.48127269744873047, 0.8627519607543945, 1.244232177734375, 1.625712275505066, 2.007192373275757, 2.3886725902557373, 2.7701528072357178, 3.151632785797119, 3.5331130027770996, 3.91459321975708, 4.2960734367370605, 4.677553653717041, 5.059033393859863, 5.440513610839844, 5.821993827819824, 6.203474044799805, 6.584954261779785, 6.966434478759766, 7.347914695739746, 7.729394912719727, 8.110875129699707, 8.492355346679688, 8.873835563659668, 9.255315780639648, 9.636795043945312, 10.01827621459961, 10.39975643157959, 10.78123664855957, 11.16271686553955, 11.544197082519531, 11.925677299499512, 12.307157516479492, 12.688636779785156, 13.070116996765137]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 11.0, 9.0, 22.0, 38.0, 35.0, 52.0, 87.0, 124.0, 202.0, 314.0, 589.0, 846.0, 1385.0, 2233.0, 3628.0, 6186.0, 10611.0, 18861.0, 33573.0, 61854.0, 109640.0, 172123.0, 204811.0, 171536.0, 109473.0, 61501.0, 33683.0, 18644.0, 10633.0, 6219.0, 3572.0, 2253.0, 1402.0, 858.0, 564.0, 340.0, 235.0, 136.0, 91.0, 63.0, 49.0, 26.0, 17.0, 13.0, 8.0, 6.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.7421875, -11.357177734375, -10.97216796875, -10.587158203125, -10.2021484375, -9.817138671875, -9.43212890625, -9.047119140625, -8.662109375, -8.277099609375, -7.89208984375, -7.507080078125, -7.1220703125, -6.737060546875, -6.35205078125, -5.967041015625, -5.58203125, -5.197021484375, -4.81201171875, -4.427001953125, -4.0419921875, -3.656982421875, -3.27197265625, -2.886962890625, -2.501953125, -2.116943359375, -1.73193359375, -1.346923828125, -0.9619140625, -0.576904296875, -0.19189453125, 0.193115234375, 0.578125, 0.963134765625, 1.34814453125, 1.733154296875, 2.1181640625, 2.503173828125, 2.88818359375, 3.273193359375, 3.658203125, 4.043212890625, 4.42822265625, 4.813232421875, 5.1982421875, 5.583251953125, 5.96826171875, 6.353271484375, 6.73828125, 7.123291015625, 7.50830078125, 7.893310546875, 8.2783203125, 8.663330078125, 9.04833984375, 9.433349609375, 9.818359375, 10.203369140625, 10.58837890625, 10.973388671875, 11.3583984375, 11.743408203125, 12.12841796875, 12.513427734375, 12.8984375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 2.0, 8.0, 8.0, 11.0, 6.0, 4.0, 11.0, 13.0, 17.0, 31.0, 26.0, 34.0, 24.0, 38.0, 41.0, 29.0, 33.0, 44.0, 43.0, 32.0, 43.0, 41.0, 49.0, 45.0, 34.0, 39.0, 30.0, 32.0, 27.0, 26.0, 25.0, 21.0, 19.0, 26.0, 11.0, 22.0, 14.0, 12.0, 7.0, 8.0, 1.0, 6.0, 4.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-13.0234375, -12.619140625, -12.21484375, -11.810546875, -11.40625, -11.001953125, -10.59765625, -10.193359375, -9.7890625, -9.384765625, -8.98046875, -8.576171875, -8.171875, -7.767578125, -7.36328125, -6.958984375, -6.5546875, -6.150390625, -5.74609375, -5.341796875, -4.9375, -4.533203125, -4.12890625, -3.724609375, -3.3203125, -2.916015625, -2.51171875, -2.107421875, -1.703125, -1.298828125, -0.89453125, -0.490234375, -0.0859375, 0.318359375, 0.72265625, 1.126953125, 1.53125, 1.935546875, 2.33984375, 2.744140625, 3.1484375, 3.552734375, 3.95703125, 4.361328125, 4.765625, 5.169921875, 5.57421875, 5.978515625, 6.3828125, 6.787109375, 7.19140625, 7.595703125, 8.0, 8.404296875, 8.80859375, 9.212890625, 9.6171875, 10.021484375, 10.42578125, 10.830078125, 11.234375, 11.638671875, 12.04296875, 12.447265625, 12.8515625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 5.0, 3.0, 5.0, 4.0, 9.0, 11.0, 16.0, 21.0, 22.0, 62.0, 87.0, 122.0, 162.0, 250.0, 338.0, 552.0, 892.0, 1459.0, 2433.0, 4075.0, 7561.0, 14917.0, 31759.0, 75576.0, 187228.0, 336158.0, 219924.0, 90374.0, 37556.0, 16795.0, 8500.0, 4578.0, 2672.0, 1568.0, 990.0, 654.0, 405.0, 288.0, 160.0, 117.0, 91.0, 67.0, 33.0, 24.0, 13.0, 17.0, 6.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.296875, -19.611083984375, -18.92529296875, -18.239501953125, -17.5537109375, -16.867919921875, -16.18212890625, -15.496337890625, -14.810546875, -14.124755859375, -13.43896484375, -12.753173828125, -12.0673828125, -11.381591796875, -10.69580078125, -10.010009765625, -9.32421875, -8.638427734375, -7.95263671875, -7.266845703125, -6.5810546875, -5.895263671875, -5.20947265625, -4.523681640625, -3.837890625, -3.152099609375, -2.46630859375, -1.780517578125, -1.0947265625, -0.408935546875, 0.27685546875, 0.962646484375, 1.6484375, 2.334228515625, 3.02001953125, 3.705810546875, 4.3916015625, 5.077392578125, 5.76318359375, 6.448974609375, 7.134765625, 7.820556640625, 8.50634765625, 9.192138671875, 9.8779296875, 10.563720703125, 11.24951171875, 11.935302734375, 12.62109375, 13.306884765625, 13.99267578125, 14.678466796875, 15.3642578125, 16.050048828125, 16.73583984375, 17.421630859375, 18.107421875, 18.793212890625, 19.47900390625, 20.164794921875, 20.8505859375, 21.536376953125, 22.22216796875, 22.907958984375, 23.59375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 5.0, 3.0, 6.0, 7.0, 7.0, 20.0, 15.0, 12.0, 20.0, 24.0, 35.0, 34.0, 25.0, 37.0, 45.0, 52.0, 42.0, 46.0, 37.0, 42.0, 41.0, 45.0, 32.0, 36.0, 43.0, 41.0, 37.0, 22.0, 31.0, 29.0, 30.0, 15.0, 18.0, 13.0, 11.0, 8.0, 14.0, 4.0, 6.0, 4.0, 4.0, 2.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.1015625, -8.815185546875, -8.52880859375, -8.242431640625, -7.9560546875, -7.669677734375, -7.38330078125, -7.096923828125, -6.810546875, -6.524169921875, -6.23779296875, -5.951416015625, -5.6650390625, -5.378662109375, -5.09228515625, -4.805908203125, -4.51953125, -4.233154296875, -3.94677734375, -3.660400390625, -3.3740234375, -3.087646484375, -2.80126953125, -2.514892578125, -2.228515625, -1.942138671875, -1.65576171875, -1.369384765625, -1.0830078125, -0.796630859375, -0.51025390625, -0.223876953125, 0.0625, 0.348876953125, 0.63525390625, 0.921630859375, 1.2080078125, 1.494384765625, 1.78076171875, 2.067138671875, 2.353515625, 2.639892578125, 2.92626953125, 3.212646484375, 3.4990234375, 3.785400390625, 4.07177734375, 4.358154296875, 4.64453125, 4.930908203125, 5.21728515625, 5.503662109375, 5.7900390625, 6.076416015625, 6.36279296875, 6.649169921875, 6.935546875, 7.221923828125, 7.50830078125, 7.794677734375, 8.0810546875, 8.367431640625, 8.65380859375, 8.940185546875, 9.2265625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.weight": {"_type": "histogram", "values": [3.0, 4.0, 2.0, 0.0, 2.0, 6.0, 5.0, 9.0, 8.0, 10.0, 12.0, 23.0, 38.0, 50.0, 33.0, 75.0, 101.0, 158.0, 226.0, 348.0, 570.0, 915.0, 1551.0, 2508.0, 4418.0, 8088.0, 15294.0, 30491.0, 64493.0, 142014.0, 279238.0, 258313.0, 124574.0, 56251.0, 27098.0, 13848.0, 7380.0, 4085.0, 2318.0, 1391.0, 909.0, 530.0, 371.0, 260.0, 163.0, 115.0, 66.0, 57.0, 38.0, 24.0, 26.0, 17.0, 12.0, 12.0, 2.0, 5.0, 4.0, 7.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-9.4765625, -9.1700439453125, -8.863525390625, -8.5570068359375, -8.25048828125, -7.9439697265625, -7.637451171875, -7.3309326171875, -7.0244140625, -6.7178955078125, -6.411376953125, -6.1048583984375, -5.79833984375, -5.4918212890625, -5.185302734375, -4.8787841796875, -4.572265625, -4.2657470703125, -3.959228515625, -3.6527099609375, -3.34619140625, -3.0396728515625, -2.733154296875, -2.4266357421875, -2.1201171875, -1.8135986328125, -1.507080078125, -1.2005615234375, -0.89404296875, -0.5875244140625, -0.281005859375, 0.0255126953125, 0.33203125, 0.6385498046875, 0.945068359375, 1.2515869140625, 1.55810546875, 1.8646240234375, 2.171142578125, 2.4776611328125, 2.7841796875, 3.0906982421875, 3.397216796875, 3.7037353515625, 4.01025390625, 4.3167724609375, 4.623291015625, 4.9298095703125, 5.236328125, 5.5428466796875, 5.849365234375, 6.1558837890625, 6.46240234375, 6.7689208984375, 7.075439453125, 7.3819580078125, 7.6884765625, 7.9949951171875, 8.301513671875, 8.6080322265625, 8.91455078125, 9.2210693359375, 9.527587890625, 9.8341064453125, 10.140625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 5.0, 9.0, 13.0, 17.0, 9.0, 29.0, 43.0, 31.0, 67.0, 77.0, 105.0, 130.0, 103.0, 107.0, 75.0, 55.0, 38.0, 27.0, 14.0, 13.0, 9.0, 5.0, 6.0, 3.0, 4.0, 3.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0007715225219726562, -0.0007519684731960297, -0.0007324144244194031, -0.0007128603756427765, -0.0006933063268661499, -0.0006737522780895233, -0.0006541982293128967, -0.0006346441805362701, -0.0006150901317596436, -0.000595536082983017, -0.0005759820342063904, -0.0005564279854297638, -0.0005368739366531372, -0.0005173198878765106, -0.000497765839099884, -0.00047821179032325745, -0.00045865774154663086, -0.00043910369277000427, -0.0004195496439933777, -0.0003999955952167511, -0.0003804415464401245, -0.0003608874976634979, -0.00034133344888687134, -0.00032177940011024475, -0.00030222535133361816, -0.0002826713025569916, -0.000263117253780365, -0.0002435632050037384, -0.00022400915622711182, -0.00020445510745048523, -0.00018490105867385864, -0.00016534700989723206, -0.00014579296112060547, -0.00012623891234397888, -0.0001066848635673523, -8.713081479072571e-05, -6.757676601409912e-05, -4.8022717237472534e-05, -2.8468668460845947e-05, -8.91461968421936e-06, 1.0639429092407227e-05, 3.0193477869033813e-05, 4.97475266456604e-05, 6.930157542228699e-05, 8.885562419891357e-05, 0.00010840967297554016, 0.00012796372175216675, 0.00014751777052879333, 0.00016707181930541992, 0.0001866258680820465, 0.0002061799168586731, 0.00022573396563529968, 0.00024528801441192627, 0.00026484206318855286, 0.00028439611196517944, 0.00030395016074180603, 0.0003235042095184326, 0.0003430582582950592, 0.0003626123070716858, 0.0003821663558483124, 0.00040172040462493896, 0.00042127445340156555, 0.00044082850217819214, 0.0004603825509548187, 0.0004799365997314453]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 4.0, 7.0, 5.0, 4.0, 11.0, 12.0, 17.0, 34.0, 36.0, 50.0, 72.0, 89.0, 130.0, 199.0, 306.0, 441.0, 669.0, 1035.0, 1649.0, 2606.0, 4592.0, 8405.0, 16649.0, 35079.0, 75842.0, 159909.0, 259551.0, 234870.0, 128471.0, 59824.0, 27592.0, 13470.0, 6922.0, 3692.0, 2129.0, 1456.0, 924.0, 563.0, 407.0, 267.0, 168.0, 107.0, 95.0, 55.0, 58.0, 30.0, 16.0, 15.0, 13.0, 7.0, 1.0, 3.0, 8.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.546875, -8.269775390625, -7.99267578125, -7.715576171875, -7.4384765625, -7.161376953125, -6.88427734375, -6.607177734375, -6.330078125, -6.052978515625, -5.77587890625, -5.498779296875, -5.2216796875, -4.944580078125, -4.66748046875, -4.390380859375, -4.11328125, -3.836181640625, -3.55908203125, -3.281982421875, -3.0048828125, -2.727783203125, -2.45068359375, -2.173583984375, -1.896484375, -1.619384765625, -1.34228515625, -1.065185546875, -0.7880859375, -0.510986328125, -0.23388671875, 0.043212890625, 0.3203125, 0.597412109375, 0.87451171875, 1.151611328125, 1.4287109375, 1.705810546875, 1.98291015625, 2.260009765625, 2.537109375, 2.814208984375, 3.09130859375, 3.368408203125, 3.6455078125, 3.922607421875, 4.19970703125, 4.476806640625, 4.75390625, 5.031005859375, 5.30810546875, 5.585205078125, 5.8623046875, 6.139404296875, 6.41650390625, 6.693603515625, 6.970703125, 7.247802734375, 7.52490234375, 7.802001953125, 8.0791015625, 8.356201171875, 8.63330078125, 8.910400390625, 9.1875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 1.0, 1.0, 4.0, 2.0, 4.0, 5.0, 7.0, 14.0, 15.0, 29.0, 29.0, 43.0, 59.0, 81.0, 75.0, 89.0, 90.0, 81.0, 72.0, 71.0, 54.0, 45.0, 32.0, 25.0, 26.0, 17.0, 15.0, 8.0, 4.0, 0.0, 6.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.76953125, -2.668060302734375, -2.56658935546875, -2.465118408203125, -2.3636474609375, -2.262176513671875, -2.16070556640625, -2.059234619140625, -1.957763671875, -1.856292724609375, -1.75482177734375, -1.653350830078125, -1.5518798828125, -1.450408935546875, -1.34893798828125, -1.247467041015625, -1.14599609375, -1.044525146484375, -0.94305419921875, -0.841583251953125, -0.7401123046875, -0.638641357421875, -0.53717041015625, -0.435699462890625, -0.334228515625, -0.232757568359375, -0.13128662109375, -0.029815673828125, 0.0716552734375, 0.173126220703125, 0.27459716796875, 0.376068115234375, 0.4775390625, 0.579010009765625, 0.68048095703125, 0.781951904296875, 0.8834228515625, 0.984893798828125, 1.08636474609375, 1.187835693359375, 1.289306640625, 1.390777587890625, 1.49224853515625, 1.593719482421875, 1.6951904296875, 1.796661376953125, 1.89813232421875, 1.999603271484375, 2.10107421875, 2.202545166015625, 2.30401611328125, 2.405487060546875, 2.5069580078125, 2.608428955078125, 2.70989990234375, 2.811370849609375, 2.912841796875, 3.014312744140625, 3.11578369140625, 3.217254638671875, 3.3187255859375, 3.420196533203125, 3.52166748046875, 3.623138427734375, 3.724609375]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 4.0, 4.0, 7.0, 7.0, 9.0, 5.0, 16.0, 11.0, 21.0, 22.0, 23.0, 37.0, 43.0, 48.0, 59.0, 48.0, 58.0, 57.0, 81.0, 55.0, 60.0, 61.0, 55.0, 37.0, 38.0, 25.0, 28.0, 13.0, 17.0, 13.0, 20.0, 8.0, 7.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-24.11474609375, -23.49626922607422, -22.87779426574707, -22.25931739807129, -21.640840530395508, -21.02236557006836, -20.403888702392578, -19.785411834716797, -19.16693687438965, -18.548460006713867, -17.92998504638672, -17.311508178710938, -16.693031311035156, -16.074556350708008, -15.456079483032227, -14.837603569030762, -14.21912670135498, -13.600650787353516, -12.982173919677734, -12.36369800567627, -11.745222091674805, -11.126745223999023, -10.508269309997559, -9.889793395996094, -9.271316528320312, -8.652840614318848, -8.034363746643066, -7.415887832641602, -6.797411918640137, -6.178935527801514, -5.560459136962891, -4.941983222961426, -4.323508262634277, -3.7050321102142334, -3.0865559577941895, -2.4680795669555664, -1.8496034145355225, -1.2311272621154785, -0.6126508712768555, 0.005825042724609375, 0.6243014335632324, 1.2427775859832764, 1.8612538576126099, 2.4797301292419434, 3.0982062816619873, 3.7166824340820312, 4.335158824920654, 4.953634738922119, 5.572111129760742, 6.190587520599365, 6.80906343460083, 7.427539825439453, 8.046015739440918, 8.664491653442383, 9.282968521118164, 9.901444435119629, 10.519920349121094, 11.138396263122559, 11.75687313079834, 12.375349044799805, 12.99382495880127, 13.612300872802734, 14.230777740478516, 14.84925365447998, 15.467730522155762]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 2.0, 7.0, 0.0, 3.0, 10.0, 6.0, 13.0, 11.0, 18.0, 23.0, 25.0, 32.0, 32.0, 27.0, 38.0, 36.0, 26.0, 34.0, 41.0, 40.0, 39.0, 33.0, 45.0, 48.0, 32.0, 37.0, 31.0, 38.0, 37.0, 26.0, 36.0, 28.0, 19.0, 27.0, 19.0, 18.0, 9.0, 17.0, 5.0, 8.0, 6.0, 5.0, 3.0, 1.0, 4.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.791863441467285, -10.419767379760742, -10.047672271728516, -9.675577163696289, -9.303481101989746, -8.931385040283203, -8.559289932250977, -8.18719482421875, -7.815098762512207, -7.443003177642822, -7.0709075927734375, -6.698812007904053, -6.326716423034668, -5.954620838165283, -5.582525253295898, -5.210429668426514, -4.838334083557129, -4.466238498687744, -4.094142913818359, -3.7220473289489746, -3.34995174407959, -2.977856159210205, -2.6057605743408203, -2.2336649894714355, -1.8615694046020508, -1.489473819732666, -1.1173782348632812, -0.7452826499938965, -0.3731870651245117, -0.0010914802551269531, 0.3710041046142578, 0.7430996894836426, 1.115194320678711, 1.4872899055480957, 1.8593854904174805, 2.2314810752868652, 2.60357666015625, 2.9756722450256348, 3.3477678298950195, 3.7198634147644043, 4.091958999633789, 4.464054584503174, 4.836150169372559, 5.208245754241943, 5.580341339111328, 5.952436923980713, 6.324532508850098, 6.696628093719482, 7.068723678588867, 7.440819263458252, 7.812914848327637, 8.18501091003418, 8.557106018066406, 8.929201126098633, 9.301297187805176, 9.673393249511719, 10.045488357543945, 10.417583465576172, 10.789679527282715, 11.161775588989258, 11.533870697021484, 11.905965805053711, 12.278061866760254, 12.650157928466797, 13.022253036499023]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 17.0, 17.0, 14.0, 20.0, 34.0, 32.0, 74.0, 83.0, 131.0, 158.0, 241.0, 364.0, 492.0, 845.0, 1277.0, 1945.0, 3365.0, 5405.0, 9059.0, 15664.0, 26858.0, 46832.0, 78525.0, 120822.0, 160256.0, 172340.0, 146315.0, 102593.0, 63763.0, 37352.0, 21752.0, 12490.0, 7365.0, 4467.0, 2788.0, 1691.0, 1037.0, 658.0, 436.0, 309.0, 212.0, 133.0, 109.0, 51.0, 54.0, 41.0, 22.0, 14.0, 11.0, 6.0, 3.0, 5.0, 3.0, 2.0, 0.0, 5.0, 4.0, 3.0], "bins": [-14.78125, -14.3089599609375, -13.836669921875, -13.3643798828125, -12.89208984375, -12.4197998046875, -11.947509765625, -11.4752197265625, -11.0029296875, -10.5306396484375, -10.058349609375, -9.5860595703125, -9.11376953125, -8.6414794921875, -8.169189453125, -7.6968994140625, -7.224609375, -6.7523193359375, -6.280029296875, -5.8077392578125, -5.33544921875, -4.8631591796875, -4.390869140625, -3.9185791015625, -3.4462890625, -2.9739990234375, -2.501708984375, -2.0294189453125, -1.55712890625, -1.0848388671875, -0.612548828125, -0.1402587890625, 0.33203125, 0.8043212890625, 1.276611328125, 1.7489013671875, 2.22119140625, 2.6934814453125, 3.165771484375, 3.6380615234375, 4.1103515625, 4.5826416015625, 5.054931640625, 5.5272216796875, 5.99951171875, 6.4718017578125, 6.944091796875, 7.4163818359375, 7.888671875, 8.3609619140625, 8.833251953125, 9.3055419921875, 9.77783203125, 10.2501220703125, 10.722412109375, 11.1947021484375, 11.6669921875, 12.1392822265625, 12.611572265625, 13.0838623046875, 13.55615234375, 14.0284423828125, 14.500732421875, 14.9730224609375, 15.4453125]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 5.0, 8.0, 7.0, 4.0, 11.0, 6.0, 8.0, 10.0, 16.0, 20.0, 24.0, 33.0, 29.0, 38.0, 31.0, 38.0, 38.0, 30.0, 51.0, 35.0, 49.0, 45.0, 47.0, 47.0, 36.0, 51.0, 35.0, 33.0, 28.0, 37.0, 7.0, 25.0, 23.0, 23.0, 10.0, 12.0, 11.0, 11.0, 3.0, 12.0, 3.0, 3.0, 5.0, 4.0, 4.0, 2.0, 2.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.59375, -11.1868896484375, -10.780029296875, -10.3731689453125, -9.96630859375, -9.5594482421875, -9.152587890625, -8.7457275390625, -8.3388671875, -7.9320068359375, -7.525146484375, -7.1182861328125, -6.71142578125, -6.3045654296875, -5.897705078125, -5.4908447265625, -5.083984375, -4.6771240234375, -4.270263671875, -3.8634033203125, -3.45654296875, -3.0496826171875, -2.642822265625, -2.2359619140625, -1.8291015625, -1.4222412109375, -1.015380859375, -0.6085205078125, -0.20166015625, 0.2052001953125, 0.612060546875, 1.0189208984375, 1.42578125, 1.8326416015625, 2.239501953125, 2.6463623046875, 3.05322265625, 3.4600830078125, 3.866943359375, 4.2738037109375, 4.6806640625, 5.0875244140625, 5.494384765625, 5.9012451171875, 6.30810546875, 6.7149658203125, 7.121826171875, 7.5286865234375, 7.935546875, 8.3424072265625, 8.749267578125, 9.1561279296875, 9.56298828125, 9.9698486328125, 10.376708984375, 10.7835693359375, 11.1904296875, 11.5972900390625, 12.004150390625, 12.4110107421875, 12.81787109375, 13.2247314453125, 13.631591796875, 14.0384521484375, 14.4453125]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 7.0, 8.0, 22.0, 26.0, 37.0, 61.0, 90.0, 179.0, 294.0, 436.0, 737.0, 1196.0, 2171.0, 3479.0, 6182.0, 10628.0, 18879.0, 32884.0, 55760.0, 90079.0, 133126.0, 164952.0, 166142.0, 134175.0, 91300.0, 57124.0, 33458.0, 19075.0, 10823.0, 6231.0, 3674.0, 2133.0, 1243.0, 729.0, 459.0, 276.0, 188.0, 111.0, 59.0, 47.0, 29.0, 22.0, 13.0, 6.0, 9.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-15.7265625, -15.2899169921875, -14.853271484375, -14.4166259765625, -13.97998046875, -13.5433349609375, -13.106689453125, -12.6700439453125, -12.2333984375, -11.7967529296875, -11.360107421875, -10.9234619140625, -10.48681640625, -10.0501708984375, -9.613525390625, -9.1768798828125, -8.740234375, -8.3035888671875, -7.866943359375, -7.4302978515625, -6.99365234375, -6.5570068359375, -6.120361328125, -5.6837158203125, -5.2470703125, -4.8104248046875, -4.373779296875, -3.9371337890625, -3.50048828125, -3.0638427734375, -2.627197265625, -2.1905517578125, -1.75390625, -1.3172607421875, -0.880615234375, -0.4439697265625, -0.00732421875, 0.4293212890625, 0.865966796875, 1.3026123046875, 1.7392578125, 2.1759033203125, 2.612548828125, 3.0491943359375, 3.48583984375, 3.9224853515625, 4.359130859375, 4.7957763671875, 5.232421875, 5.6690673828125, 6.105712890625, 6.5423583984375, 6.97900390625, 7.4156494140625, 7.852294921875, 8.2889404296875, 8.7255859375, 9.1622314453125, 9.598876953125, 10.0355224609375, 10.47216796875, 10.9088134765625, 11.345458984375, 11.7821044921875, 12.21875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 5.0, 3.0, 8.0, 12.0, 10.0, 16.0, 18.0, 22.0, 21.0, 36.0, 30.0, 26.0, 38.0, 38.0, 41.0, 37.0, 45.0, 56.0, 40.0, 36.0, 36.0, 49.0, 41.0, 39.0, 41.0, 39.0, 32.0, 37.0, 23.0, 26.0, 19.0, 16.0, 15.0, 13.0, 9.0, 12.0, 5.0, 7.0, 5.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.5546875, -7.2857666015625, -7.016845703125, -6.7479248046875, -6.47900390625, -6.2100830078125, -5.941162109375, -5.6722412109375, -5.4033203125, -5.1343994140625, -4.865478515625, -4.5965576171875, -4.32763671875, -4.0587158203125, -3.789794921875, -3.5208740234375, -3.251953125, -2.9830322265625, -2.714111328125, -2.4451904296875, -2.17626953125, -1.9073486328125, -1.638427734375, -1.3695068359375, -1.1005859375, -0.8316650390625, -0.562744140625, -0.2938232421875, -0.02490234375, 0.2440185546875, 0.512939453125, 0.7818603515625, 1.05078125, 1.3197021484375, 1.588623046875, 1.8575439453125, 2.12646484375, 2.3953857421875, 2.664306640625, 2.9332275390625, 3.2021484375, 3.4710693359375, 3.739990234375, 4.0089111328125, 4.27783203125, 4.5467529296875, 4.815673828125, 5.0845947265625, 5.353515625, 5.6224365234375, 5.891357421875, 6.1602783203125, 6.42919921875, 6.6981201171875, 6.967041015625, 7.2359619140625, 7.5048828125, 7.7738037109375, 8.042724609375, 8.3116455078125, 8.58056640625, 8.8494873046875, 9.118408203125, 9.3873291015625, 9.65625]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 4.0, 4.0, 8.0, 13.0, 14.0, 14.0, 28.0, 46.0, 70.0, 82.0, 157.0, 277.0, 463.0, 691.0, 1276.0, 2203.0, 4233.0, 9801.0, 31144.0, 148005.0, 543429.0, 236306.0, 45891.0, 13104.0, 5182.0, 2470.0, 1446.0, 852.0, 505.0, 312.0, 183.0, 114.0, 67.0, 51.0, 27.0, 24.0, 20.0, 13.0, 6.0, 4.0, 9.0, 5.0, 5.0, 0.0, 4.0, 0.0, 1.0], "bins": [-61.875, -60.23095703125, -58.5869140625, -56.94287109375, -55.298828125, -53.65478515625, -52.0107421875, -50.36669921875, -48.72265625, -47.07861328125, -45.4345703125, -43.79052734375, -42.146484375, -40.50244140625, -38.8583984375, -37.21435546875, -35.5703125, -33.92626953125, -32.2822265625, -30.63818359375, -28.994140625, -27.35009765625, -25.7060546875, -24.06201171875, -22.41796875, -20.77392578125, -19.1298828125, -17.48583984375, -15.841796875, -14.19775390625, -12.5537109375, -10.90966796875, -9.265625, -7.62158203125, -5.9775390625, -4.33349609375, -2.689453125, -1.04541015625, 0.5986328125, 2.24267578125, 3.88671875, 5.53076171875, 7.1748046875, 8.81884765625, 10.462890625, 12.10693359375, 13.7509765625, 15.39501953125, 17.0390625, 18.68310546875, 20.3271484375, 21.97119140625, 23.615234375, 25.25927734375, 26.9033203125, 28.54736328125, 30.19140625, 31.83544921875, 33.4794921875, 35.12353515625, 36.767578125, 38.41162109375, 40.0556640625, 41.69970703125, 43.34375]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 2.0, 9.0, 9.0, 7.0, 11.0, 26.0, 32.0, 34.0, 52.0, 77.0, 107.0, 99.0, 118.0, 112.0, 87.0, 77.0, 40.0, 39.0, 22.0, 14.0, 7.0, 8.0, 6.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0033111572265625, -0.003214418888092041, -0.003117680549621582, -0.003020942211151123, -0.002924203872680664, -0.002827465534210205, -0.002730727195739746, -0.002633988857269287, -0.002537250518798828, -0.002440512180328369, -0.00234377384185791, -0.002247035503387451, -0.002150297164916992, -0.002053558826446533, -0.0019568204879760742, -0.0018600821495056152, -0.0017633438110351562, -0.0016666054725646973, -0.0015698671340942383, -0.0014731287956237793, -0.0013763904571533203, -0.0012796521186828613, -0.0011829137802124023, -0.0010861754417419434, -0.0009894371032714844, -0.0008926987648010254, -0.0007959604263305664, -0.0006992220878601074, -0.0006024837493896484, -0.0005057454109191895, -0.00040900707244873047, -0.0003122687339782715, -0.0002155303955078125, -0.00011879205703735352, -2.205371856689453e-05, 7.468461990356445e-05, 0.00017142295837402344, 0.0002681612968444824, 0.0003648996353149414, 0.0004616379737854004, 0.0005583763122558594, 0.0006551146507263184, 0.0007518529891967773, 0.0008485913276672363, 0.0009453296661376953, 0.0010420680046081543, 0.0011388063430786133, 0.0012355446815490723, 0.0013322830200195312, 0.0014290213584899902, 0.0015257596969604492, 0.0016224980354309082, 0.0017192363739013672, 0.0018159747123718262, 0.0019127130508422852, 0.002009451389312744, 0.002106189727783203, 0.002202928066253662, 0.002299666404724121, 0.00239640474319458, 0.002493143081665039, 0.002589881420135498, 0.002686619758605957, 0.002783358097076416, 0.002880096435546875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 5.0, 8.0, 10.0, 18.0, 18.0, 20.0, 38.0, 54.0, 62.0, 102.0, 155.0, 148.0, 295.0, 369.0, 525.0, 741.0, 1141.0, 1652.0, 2746.0, 4904.0, 9703.0, 21186.0, 50158.0, 127760.0, 274829.0, 295715.0, 147992.0, 58812.0, 24193.0, 10905.0, 5437.0, 3044.0, 1870.0, 1157.0, 813.0, 576.0, 362.0, 272.0, 223.0, 172.0, 107.0, 83.0, 55.0, 41.0, 27.0, 16.0, 10.0, 9.0, 8.0, 3.0, 4.0, 3.0, 6.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.171875, -23.41845703125, -22.6650390625, -21.91162109375, -21.158203125, -20.40478515625, -19.6513671875, -18.89794921875, -18.14453125, -17.39111328125, -16.6376953125, -15.88427734375, -15.130859375, -14.37744140625, -13.6240234375, -12.87060546875, -12.1171875, -11.36376953125, -10.6103515625, -9.85693359375, -9.103515625, -8.35009765625, -7.5966796875, -6.84326171875, -6.08984375, -5.33642578125, -4.5830078125, -3.82958984375, -3.076171875, -2.32275390625, -1.5693359375, -0.81591796875, -0.0625, 0.69091796875, 1.4443359375, 2.19775390625, 2.951171875, 3.70458984375, 4.4580078125, 5.21142578125, 5.96484375, 6.71826171875, 7.4716796875, 8.22509765625, 8.978515625, 9.73193359375, 10.4853515625, 11.23876953125, 11.9921875, 12.74560546875, 13.4990234375, 14.25244140625, 15.005859375, 15.75927734375, 16.5126953125, 17.26611328125, 18.01953125, 18.77294921875, 19.5263671875, 20.27978515625, 21.033203125, 21.78662109375, 22.5400390625, 23.29345703125, 24.046875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 5.0, 8.0, 8.0, 6.0, 14.0, 13.0, 16.0, 21.0, 34.0, 43.0, 36.0, 68.0, 54.0, 75.0, 75.0, 69.0, 62.0, 66.0, 63.0, 54.0, 40.0, 33.0, 31.0, 22.0, 16.0, 14.0, 14.0, 8.0, 5.0, 12.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-4.87890625, -4.7333984375, -4.587890625, -4.4423828125, -4.296875, -4.1513671875, -4.005859375, -3.8603515625, -3.71484375, -3.5693359375, -3.423828125, -3.2783203125, -3.1328125, -2.9873046875, -2.841796875, -2.6962890625, -2.55078125, -2.4052734375, -2.259765625, -2.1142578125, -1.96875, -1.8232421875, -1.677734375, -1.5322265625, -1.38671875, -1.2412109375, -1.095703125, -0.9501953125, -0.8046875, -0.6591796875, -0.513671875, -0.3681640625, -0.22265625, -0.0771484375, 0.068359375, 0.2138671875, 0.359375, 0.5048828125, 0.650390625, 0.7958984375, 0.94140625, 1.0869140625, 1.232421875, 1.3779296875, 1.5234375, 1.6689453125, 1.814453125, 1.9599609375, 2.10546875, 2.2509765625, 2.396484375, 2.5419921875, 2.6875, 2.8330078125, 2.978515625, 3.1240234375, 3.26953125, 3.4150390625, 3.560546875, 3.7060546875, 3.8515625, 3.9970703125, 4.142578125, 4.2880859375, 4.43359375]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 3.0, 4.0, 5.0, 4.0, 13.0, 13.0, 17.0, 18.0, 22.0, 35.0, 47.0, 52.0, 58.0, 59.0, 53.0, 69.0, 69.0, 68.0, 62.0, 61.0, 49.0, 43.0, 33.0, 32.0, 28.0, 27.0, 13.0, 12.0, 12.0, 8.0, 4.0, 4.0, 4.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-26.580930709838867, -25.90925407409668, -25.23757553100586, -24.565898895263672, -23.894222259521484, -23.222543716430664, -22.550867080688477, -21.879188537597656, -21.20751190185547, -20.53583526611328, -19.86415672302246, -19.192480087280273, -18.520803451538086, -17.849124908447266, -17.177448272705078, -16.50577163696289, -15.834094047546387, -15.162416458129883, -14.490739822387695, -13.819062232971191, -13.147384643554688, -12.4757080078125, -11.804030418395996, -11.132352828979492, -10.460676193237305, -9.7889986038208, -9.117321968078613, -8.44564437866211, -7.7739667892456055, -7.10228967666626, -6.430612564086914, -5.75893497467041, -5.087257385253906, -4.4155802726745605, -3.7439026832580566, -3.072225570678711, -2.400548219680786, -1.7288708686828613, -1.0571937561035156, -0.3855161666870117, 0.286160945892334, 0.957838237285614, 1.629515528678894, 2.3011927604675293, 2.972870111465454, 3.644547462463379, 4.316224575042725, 4.9879021644592285, 5.659579277038574, 6.33125638961792, 7.002933979034424, 7.6746110916137695, 8.346288681030273, 9.017965316772461, 9.689642906188965, 10.361320495605469, 11.032997131347656, 11.70467472076416, 12.376351356506348, 13.048028945922852, 13.719706535339355, 14.39138412475586, 15.063060760498047, 15.73473834991455, 16.406415939331055]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 5.0, 6.0, 9.0, 5.0, 13.0, 14.0, 21.0, 13.0, 20.0, 16.0, 29.0, 26.0, 29.0, 40.0, 40.0, 34.0, 42.0, 45.0, 50.0, 40.0, 39.0, 48.0, 45.0, 44.0, 39.0, 39.0, 30.0, 37.0, 25.0, 36.0, 25.0, 20.0, 18.0, 13.0, 10.0, 8.0, 5.0, 5.0, 4.0, 6.0, 5.0, 2.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.532588958740234, -13.110087394714355, -12.687585830688477, -12.265084266662598, -11.842582702636719, -11.42008113861084, -10.997579574584961, -10.575077056884766, -10.152576446533203, -9.730074882507324, -9.307573318481445, -8.885071754455566, -8.462570190429688, -8.040068626403809, -7.6175665855407715, -7.195065021514893, -6.7725629806518555, -6.350061416625977, -5.927559852600098, -5.505058288574219, -5.08255672454834, -4.660055160522461, -4.237553119659424, -3.815051555633545, -3.392549991607666, -2.970048427581787, -2.547546863555908, -2.12504506111145, -1.7025434970855713, -1.2800419330596924, -0.8575401306152344, -0.43503856658935547, -0.012537002563476562, 0.4099646210670471, 0.8324662446975708, 1.2549679279327393, 1.6774694919586182, 2.099971055984497, 2.522472858428955, 2.944974422454834, 3.367475986480713, 3.789977550506592, 4.212479114532471, 4.634981155395508, 5.057482719421387, 5.479984283447266, 5.9024858474731445, 6.324987411499023, 6.747488975524902, 7.169990539550781, 7.59249210357666, 8.014993667602539, 8.437495231628418, 8.859996795654297, 9.282499313354492, 9.704999923706055, 10.12750244140625, 10.550004005432129, 10.972505569458008, 11.395007133483887, 11.817508697509766, 12.240010261535645, 12.662511825561523, 13.085014343261719, 13.507514953613281]}, "gradients/decoder.bert.encoder.layer.16.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 7.0, 9.0, 14.0, 29.0, 46.0, 63.0, 123.0, 187.0, 292.0, 410.0, 696.0, 1084.0, 1758.0, 2727.0, 4621.0, 7132.0, 11802.0, 19891.0, 33948.0, 58779.0, 104255.0, 188087.0, 336221.0, 565490.0, 779676.0, 774881.0, 551526.0, 327434.0, 182494.0, 100965.0, 56859.0, 32530.0, 19201.0, 11459.0, 7204.0, 4249.0, 2752.0, 1785.0, 1181.0, 801.0, 521.0, 349.0, 263.0, 143.0, 117.0, 70.0, 55.0, 34.0, 33.0, 13.0, 12.0, 8.0, 1.0, 5.0, 1.0, 1.0], "bins": [-13.7734375, -13.355712890625, -12.93798828125, -12.520263671875, -12.1025390625, -11.684814453125, -11.26708984375, -10.849365234375, -10.431640625, -10.013916015625, -9.59619140625, -9.178466796875, -8.7607421875, -8.343017578125, -7.92529296875, -7.507568359375, -7.08984375, -6.672119140625, -6.25439453125, -5.836669921875, -5.4189453125, -5.001220703125, -4.58349609375, -4.165771484375, -3.748046875, -3.330322265625, -2.91259765625, -2.494873046875, -2.0771484375, -1.659423828125, -1.24169921875, -0.823974609375, -0.40625, 0.011474609375, 0.42919921875, 0.846923828125, 1.2646484375, 1.682373046875, 2.10009765625, 2.517822265625, 2.935546875, 3.353271484375, 3.77099609375, 4.188720703125, 4.6064453125, 5.024169921875, 5.44189453125, 5.859619140625, 6.27734375, 6.695068359375, 7.11279296875, 7.530517578125, 7.9482421875, 8.365966796875, 8.78369140625, 9.201416015625, 9.619140625, 10.036865234375, 10.45458984375, 10.872314453125, 11.2900390625, 11.707763671875, 12.12548828125, 12.543212890625, 12.9609375]}, "gradients/decoder.bert.encoder.layer.16.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 6.0, 7.0, 4.0, 6.0, 5.0, 6.0, 12.0, 18.0, 18.0, 16.0, 24.0, 37.0, 29.0, 27.0, 36.0, 29.0, 39.0, 41.0, 45.0, 35.0, 51.0, 41.0, 40.0, 47.0, 37.0, 49.0, 26.0, 35.0, 36.0, 32.0, 22.0, 22.0, 27.0, 14.0, 16.0, 11.0, 6.0, 8.0, 8.0, 7.0, 11.0, 6.0, 4.0, 3.0, 1.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.1328125, -7.8726806640625, -7.612548828125, -7.3524169921875, -7.09228515625, -6.8321533203125, -6.572021484375, -6.3118896484375, -6.0517578125, -5.7916259765625, -5.531494140625, -5.2713623046875, -5.01123046875, -4.7510986328125, -4.490966796875, -4.2308349609375, -3.970703125, -3.7105712890625, -3.450439453125, -3.1903076171875, -2.93017578125, -2.6700439453125, -2.409912109375, -2.1497802734375, -1.8896484375, -1.6295166015625, -1.369384765625, -1.1092529296875, -0.84912109375, -0.5889892578125, -0.328857421875, -0.0687255859375, 0.19140625, 0.4515380859375, 0.711669921875, 0.9718017578125, 1.23193359375, 1.4920654296875, 1.752197265625, 2.0123291015625, 2.2724609375, 2.5325927734375, 2.792724609375, 3.0528564453125, 3.31298828125, 3.5731201171875, 3.833251953125, 4.0933837890625, 4.353515625, 4.6136474609375, 4.873779296875, 5.1339111328125, 5.39404296875, 5.6541748046875, 5.914306640625, 6.1744384765625, 6.4345703125, 6.6947021484375, 6.954833984375, 7.2149658203125, 7.47509765625, 7.7352294921875, 7.995361328125, 8.2554931640625, 8.515625]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 4.0, 12.0, 7.0, 9.0, 18.0, 30.0, 41.0, 73.0, 117.0, 185.0, 283.0, 454.0, 670.0, 1150.0, 2024.0, 3259.0, 5351.0, 9048.0, 15466.0, 26080.0, 45509.0, 78499.0, 135277.0, 229078.0, 371628.0, 556404.0, 701107.0, 678302.0, 511547.0, 333794.0, 203990.0, 118989.0, 69157.0, 39645.0, 23079.0, 13743.0, 8091.0, 4768.0, 2856.0, 1708.0, 1018.0, 636.0, 425.0, 292.0, 170.0, 103.0, 62.0, 44.0, 34.0, 15.0, 12.0, 14.0, 6.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-12.1015625, -11.709716796875, -11.31787109375, -10.926025390625, -10.5341796875, -10.142333984375, -9.75048828125, -9.358642578125, -8.966796875, -8.574951171875, -8.18310546875, -7.791259765625, -7.3994140625, -7.007568359375, -6.61572265625, -6.223876953125, -5.83203125, -5.440185546875, -5.04833984375, -4.656494140625, -4.2646484375, -3.872802734375, -3.48095703125, -3.089111328125, -2.697265625, -2.305419921875, -1.91357421875, -1.521728515625, -1.1298828125, -0.738037109375, -0.34619140625, 0.045654296875, 0.4375, 0.829345703125, 1.22119140625, 1.613037109375, 2.0048828125, 2.396728515625, 2.78857421875, 3.180419921875, 3.572265625, 3.964111328125, 4.35595703125, 4.747802734375, 5.1396484375, 5.531494140625, 5.92333984375, 6.315185546875, 6.70703125, 7.098876953125, 7.49072265625, 7.882568359375, 8.2744140625, 8.666259765625, 9.05810546875, 9.449951171875, 9.841796875, 10.233642578125, 10.62548828125, 11.017333984375, 11.4091796875, 11.801025390625, 12.19287109375, 12.584716796875, 12.9765625]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 6.0, 5.0, 4.0, 4.0, 6.0, 17.0, 17.0, 17.0, 37.0, 38.0, 42.0, 54.0, 50.0, 88.0, 80.0, 103.0, 142.0, 156.0, 172.0, 187.0, 219.0, 227.0, 231.0, 226.0, 210.0, 226.0, 243.0, 188.0, 168.0, 143.0, 148.0, 129.0, 111.0, 81.0, 65.0, 49.0, 45.0, 36.0, 24.0, 25.0, 21.0, 12.0, 5.0, 2.0, 6.0, 4.0, 4.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.51953125, -4.37786865234375, -4.2362060546875, -4.09454345703125, -3.952880859375, -3.81121826171875, -3.6695556640625, -3.52789306640625, -3.38623046875, -3.24456787109375, -3.1029052734375, -2.96124267578125, -2.819580078125, -2.67791748046875, -2.5362548828125, -2.39459228515625, -2.2529296875, -2.11126708984375, -1.9696044921875, -1.82794189453125, -1.686279296875, -1.54461669921875, -1.4029541015625, -1.26129150390625, -1.11962890625, -0.97796630859375, -0.8363037109375, -0.69464111328125, -0.552978515625, -0.41131591796875, -0.2696533203125, -0.12799072265625, 0.013671875, 0.15533447265625, 0.2969970703125, 0.43865966796875, 0.580322265625, 0.72198486328125, 0.8636474609375, 1.00531005859375, 1.14697265625, 1.28863525390625, 1.4302978515625, 1.57196044921875, 1.713623046875, 1.85528564453125, 1.9969482421875, 2.13861083984375, 2.2802734375, 2.42193603515625, 2.5635986328125, 2.70526123046875, 2.846923828125, 2.98858642578125, 3.1302490234375, 3.27191162109375, 3.41357421875, 3.55523681640625, 3.6968994140625, 3.83856201171875, 3.980224609375, 4.12188720703125, 4.2635498046875, 4.40521240234375, 4.546875]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 5.0, 10.0, 10.0, 15.0, 11.0, 16.0, 21.0, 34.0, 45.0, 54.0, 46.0, 59.0, 52.0, 89.0, 77.0, 79.0, 69.0, 57.0, 60.0, 38.0, 39.0, 26.0, 18.0, 17.0, 12.0, 10.0, 12.0, 8.0, 4.0, 7.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-23.62752914428711, -23.010971069335938, -22.394411087036133, -21.77785301208496, -21.161293029785156, -20.544734954833984, -19.92817497253418, -19.311616897583008, -18.695056915283203, -18.07849884033203, -17.461938858032227, -16.845380783081055, -16.22882080078125, -15.612262725830078, -14.99570369720459, -14.379144668579102, -13.76258659362793, -13.146027565002441, -12.529468536376953, -11.912909507751465, -11.296350479125977, -10.679792404174805, -10.063233375549316, -9.446674346923828, -8.83011531829834, -8.213556289672852, -7.596997261047363, -6.980438709259033, -6.363879680633545, -5.747320652008057, -5.130762100219727, -4.514203071594238, -3.89764404296875, -3.2810850143432617, -2.6645262241363525, -2.0479674339294434, -1.431408405303955, -0.8148493766784668, -0.19829058647155762, 0.41826820373535156, 1.0348272323608398, 1.6513861417770386, 2.2679450511932373, 2.8845038414001465, 3.5010628700256348, 4.117621898651123, 4.734180450439453, 5.350739479064941, 5.96729850769043, 6.583857536315918, 7.200416564941406, 7.816975116729736, 8.433534622192383, 9.050092697143555, 9.666651725769043, 10.283210754394531, 10.89976978302002, 11.516328811645508, 12.132887840270996, 12.749446868896484, 13.366004943847656, 13.982564926147461, 14.599123001098633, 15.215682029724121, 15.83224105834961]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 6.0, 6.0, 9.0, 16.0, 9.0, 16.0, 25.0, 12.0, 18.0, 27.0, 25.0, 25.0, 32.0, 31.0, 32.0, 42.0, 37.0, 52.0, 35.0, 56.0, 51.0, 49.0, 39.0, 29.0, 35.0, 34.0, 29.0, 44.0, 20.0, 30.0, 17.0, 25.0, 19.0, 18.0, 11.0, 7.0, 5.0, 5.0, 5.0, 8.0, 4.0, 3.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-10.867642402648926, -10.535539627075195, -10.203436851501465, -9.871334075927734, -9.539231300354004, -9.207128524780273, -8.875025749206543, -8.542922973632812, -8.210820198059082, -7.878717422485352, -7.546614646911621, -7.214511871337891, -6.88240909576416, -6.55030632019043, -6.218203544616699, -5.886100769042969, -5.553997993469238, -5.221895217895508, -4.889792442321777, -4.557689666748047, -4.225586891174316, -3.893484115600586, -3.5613813400268555, -3.229278564453125, -2.8971757888793945, -2.565073013305664, -2.2329702377319336, -1.9008674621582031, -1.5687646865844727, -1.2366619110107422, -0.9045591354370117, -0.5724563598632812, -0.24035263061523438, 0.0917501449584961, 0.42385292053222656, 0.755955696105957, 1.0880584716796875, 1.420161247253418, 1.7522640228271484, 2.084366798400879, 2.4164695739746094, 2.74857234954834, 3.0806751251220703, 3.412777900695801, 3.7448806762695312, 4.076983451843262, 4.409086227416992, 4.741189002990723, 5.073291778564453, 5.405394554138184, 5.737497329711914, 6.0696001052856445, 6.401702880859375, 6.7338056564331055, 7.065908432006836, 7.398011207580566, 7.730113983154297, 8.062216758728027, 8.394319534301758, 8.726422309875488, 9.058525085449219, 9.39062786102295, 9.72273063659668, 10.05483341217041, 10.38693618774414]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 6.0, 7.0, 9.0, 18.0, 15.0, 28.0, 43.0, 68.0, 81.0, 160.0, 241.0, 333.0, 583.0, 851.0, 1492.0, 2450.0, 4041.0, 7162.0, 12864.0, 22724.0, 40686.0, 69070.0, 109991.0, 152990.0, 175108.0, 157685.0, 115226.0, 73807.0, 43387.0, 24937.0, 13646.0, 7741.0, 4349.0, 2547.0, 1560.0, 899.0, 581.0, 405.0, 278.0, 162.0, 116.0, 76.0, 37.0, 31.0, 25.0, 20.0, 7.0, 4.0, 6.0, 2.0, 1.0, 2.0, 2.0], "bins": [-7.64453125, -7.4295654296875, -7.214599609375, -6.9996337890625, -6.78466796875, -6.5697021484375, -6.354736328125, -6.1397705078125, -5.9248046875, -5.7098388671875, -5.494873046875, -5.2799072265625, -5.06494140625, -4.8499755859375, -4.635009765625, -4.4200439453125, -4.205078125, -3.9901123046875, -3.775146484375, -3.5601806640625, -3.34521484375, -3.1302490234375, -2.915283203125, -2.7003173828125, -2.4853515625, -2.2703857421875, -2.055419921875, -1.8404541015625, -1.62548828125, -1.4105224609375, -1.195556640625, -0.9805908203125, -0.765625, -0.5506591796875, -0.335693359375, -0.1207275390625, 0.09423828125, 0.3092041015625, 0.524169921875, 0.7391357421875, 0.9541015625, 1.1690673828125, 1.384033203125, 1.5989990234375, 1.81396484375, 2.0289306640625, 2.243896484375, 2.4588623046875, 2.673828125, 2.8887939453125, 3.103759765625, 3.3187255859375, 3.53369140625, 3.7486572265625, 3.963623046875, 4.1785888671875, 4.3935546875, 4.6085205078125, 4.823486328125, 5.0384521484375, 5.25341796875, 5.4683837890625, 5.683349609375, 5.8983154296875, 6.11328125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 4.0, 5.0, 4.0, 10.0, 10.0, 17.0, 9.0, 22.0, 24.0, 21.0, 30.0, 27.0, 41.0, 39.0, 36.0, 47.0, 38.0, 49.0, 59.0, 57.0, 51.0, 42.0, 40.0, 23.0, 44.0, 42.0, 46.0, 26.0, 30.0, 18.0, 24.0, 15.0, 8.0, 17.0, 6.0, 5.0, 4.0, 4.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.4296875, -12.0289306640625, -11.628173828125, -11.2274169921875, -10.82666015625, -10.4259033203125, -10.025146484375, -9.6243896484375, -9.2236328125, -8.8228759765625, -8.422119140625, -8.0213623046875, -7.62060546875, -7.2198486328125, -6.819091796875, -6.4183349609375, -6.017578125, -5.6168212890625, -5.216064453125, -4.8153076171875, -4.41455078125, -4.0137939453125, -3.613037109375, -3.2122802734375, -2.8115234375, -2.4107666015625, -2.010009765625, -1.6092529296875, -1.20849609375, -0.8077392578125, -0.406982421875, -0.0062255859375, 0.39453125, 0.7952880859375, 1.196044921875, 1.5968017578125, 1.99755859375, 2.3983154296875, 2.799072265625, 3.1998291015625, 3.6005859375, 4.0013427734375, 4.402099609375, 4.8028564453125, 5.20361328125, 5.6043701171875, 6.005126953125, 6.4058837890625, 6.806640625, 7.2073974609375, 7.608154296875, 8.0089111328125, 8.40966796875, 8.8104248046875, 9.211181640625, 9.6119384765625, 10.0126953125, 10.4134521484375, 10.814208984375, 11.2149658203125, 11.61572265625, 12.0164794921875, 12.417236328125, 12.8179931640625, 13.21875]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 3.0, 3.0, 4.0, 2.0, 8.0, 10.0, 16.0, 17.0, 45.0, 52.0, 49.0, 124.0, 101.0, 169.0, 250.0, 437.0, 590.0, 881.0, 1501.0, 2326.0, 3539.0, 5812.0, 9476.0, 16162.0, 27969.0, 48035.0, 83726.0, 138743.0, 193281.0, 190249.0, 133369.0, 79661.0, 46026.0, 26214.0, 15233.0, 9116.0, 5648.0, 3457.0, 2163.0, 1399.0, 870.0, 583.0, 395.0, 258.0, 186.0, 119.0, 102.0, 58.0, 31.0, 30.0, 16.0, 15.0, 11.0, 10.0, 4.0, 6.0, 4.0, 1.0, 4.0, 0.0, 1.0], "bins": [-8.28125, -8.0220947265625, -7.762939453125, -7.5037841796875, -7.24462890625, -6.9854736328125, -6.726318359375, -6.4671630859375, -6.2080078125, -5.9488525390625, -5.689697265625, -5.4305419921875, -5.17138671875, -4.9122314453125, -4.653076171875, -4.3939208984375, -4.134765625, -3.8756103515625, -3.616455078125, -3.3572998046875, -3.09814453125, -2.8389892578125, -2.579833984375, -2.3206787109375, -2.0615234375, -1.8023681640625, -1.543212890625, -1.2840576171875, -1.02490234375, -0.7657470703125, -0.506591796875, -0.2474365234375, 0.01171875, 0.2708740234375, 0.530029296875, 0.7891845703125, 1.04833984375, 1.3074951171875, 1.566650390625, 1.8258056640625, 2.0849609375, 2.3441162109375, 2.603271484375, 2.8624267578125, 3.12158203125, 3.3807373046875, 3.639892578125, 3.8990478515625, 4.158203125, 4.4173583984375, 4.676513671875, 4.9356689453125, 5.19482421875, 5.4539794921875, 5.713134765625, 5.9722900390625, 6.2314453125, 6.4906005859375, 6.749755859375, 7.0089111328125, 7.26806640625, 7.5272216796875, 7.786376953125, 8.0455322265625, 8.3046875]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 4.0, 10.0, 9.0, 12.0, 9.0, 5.0, 11.0, 9.0, 15.0, 15.0, 16.0, 17.0, 26.0, 19.0, 31.0, 31.0, 35.0, 34.0, 32.0, 31.0, 42.0, 30.0, 35.0, 33.0, 37.0, 42.0, 30.0, 28.0, 39.0, 19.0, 40.0, 36.0, 28.0, 22.0, 24.0, 13.0, 18.0, 10.0, 20.0, 18.0, 14.0, 17.0, 4.0, 8.0, 5.0, 2.0, 5.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0], "bins": [-5.6953125, -5.51251220703125, -5.3297119140625, -5.14691162109375, -4.964111328125, -4.78131103515625, -4.5985107421875, -4.41571044921875, -4.23291015625, -4.05010986328125, -3.8673095703125, -3.68450927734375, -3.501708984375, -3.31890869140625, -3.1361083984375, -2.95330810546875, -2.7705078125, -2.58770751953125, -2.4049072265625, -2.22210693359375, -2.039306640625, -1.85650634765625, -1.6737060546875, -1.49090576171875, -1.30810546875, -1.12530517578125, -0.9425048828125, -0.75970458984375, -0.576904296875, -0.39410400390625, -0.2113037109375, -0.02850341796875, 0.154296875, 0.33709716796875, 0.5198974609375, 0.70269775390625, 0.885498046875, 1.06829833984375, 1.2510986328125, 1.43389892578125, 1.61669921875, 1.79949951171875, 1.9822998046875, 2.16510009765625, 2.347900390625, 2.53070068359375, 2.7135009765625, 2.89630126953125, 3.0791015625, 3.26190185546875, 3.4447021484375, 3.62750244140625, 3.810302734375, 3.99310302734375, 4.1759033203125, 4.35870361328125, 4.54150390625, 4.72430419921875, 4.9071044921875, 5.08990478515625, 5.272705078125, 5.45550537109375, 5.6383056640625, 5.82110595703125, 6.00390625]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 3.0, 4.0, 12.0, 17.0, 15.0, 28.0, 44.0, 44.0, 89.0, 132.0, 176.0, 261.0, 395.0, 584.0, 890.0, 1277.0, 1935.0, 2840.0, 4498.0, 7209.0, 11544.0, 18489.0, 30479.0, 50630.0, 82736.0, 128332.0, 174137.0, 176719.0, 132603.0, 85638.0, 52521.0, 32080.0, 19141.0, 11888.0, 7370.0, 4690.0, 2983.0, 1999.0, 1297.0, 919.0, 611.0, 403.0, 279.0, 187.0, 124.0, 81.0, 61.0, 57.0, 33.0, 24.0, 17.0, 15.0, 9.0, 11.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.515625, -3.398590087890625, -3.28155517578125, -3.164520263671875, -3.0474853515625, -2.930450439453125, -2.81341552734375, -2.696380615234375, -2.579345703125, -2.462310791015625, -2.34527587890625, -2.228240966796875, -2.1112060546875, -1.994171142578125, -1.87713623046875, -1.760101318359375, -1.64306640625, -1.526031494140625, -1.40899658203125, -1.291961669921875, -1.1749267578125, -1.057891845703125, -0.94085693359375, -0.823822021484375, -0.706787109375, -0.589752197265625, -0.47271728515625, -0.355682373046875, -0.2386474609375, -0.121612548828125, -0.00457763671875, 0.112457275390625, 0.2294921875, 0.346527099609375, 0.46356201171875, 0.580596923828125, 0.6976318359375, 0.814666748046875, 0.93170166015625, 1.048736572265625, 1.165771484375, 1.282806396484375, 1.39984130859375, 1.516876220703125, 1.6339111328125, 1.750946044921875, 1.86798095703125, 1.985015869140625, 2.10205078125, 2.219085693359375, 2.33612060546875, 2.453155517578125, 2.5701904296875, 2.687225341796875, 2.80426025390625, 2.921295166015625, 3.038330078125, 3.155364990234375, 3.27239990234375, 3.389434814453125, 3.5064697265625, 3.623504638671875, 3.74053955078125, 3.857574462890625, 3.974609375]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 0.0, 3.0, 5.0, 6.0, 15.0, 23.0, 17.0, 20.0, 24.0, 40.0, 45.0, 60.0, 68.0, 67.0, 65.0, 60.0, 64.0, 77.0, 56.0, 53.0, 55.0, 40.0, 42.0, 27.0, 16.0, 12.0, 18.0, 8.0, 4.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.00026702880859375, -0.0002598017454147339, -0.0002525746822357178, -0.00024534761905670166, -0.00023812055587768555, -0.00023089349269866943, -0.00022366642951965332, -0.0002164393663406372, -0.0002092123031616211, -0.00020198523998260498, -0.00019475817680358887, -0.00018753111362457275, -0.00018030405044555664, -0.00017307698726654053, -0.00016584992408752441, -0.0001586228609085083, -0.0001513957977294922, -0.00014416873455047607, -0.00013694167137145996, -0.00012971460819244385, -0.00012248754501342773, -0.00011526048183441162, -0.00010803341865539551, -0.0001008063554763794, -9.357929229736328e-05, -8.635222911834717e-05, -7.912516593933105e-05, -7.189810276031494e-05, -6.467103958129883e-05, -5.7443976402282715e-05, -5.02169132232666e-05, -4.298985004425049e-05, -3.5762786865234375e-05, -2.8535723686218262e-05, -2.130866050720215e-05, -1.4081597328186035e-05, -6.854534149169922e-06, 3.725290298461914e-07, 7.599592208862305e-06, 1.4826655387878418e-05, 2.205371856689453e-05, 2.9280781745910645e-05, 3.650784492492676e-05, 4.373490810394287e-05, 5.0961971282958984e-05, 5.81890344619751e-05, 6.541609764099121e-05, 7.264316082000732e-05, 7.987022399902344e-05, 8.709728717803955e-05, 9.432435035705566e-05, 0.00010155141353607178, 0.00010877847671508789, 0.000116005539894104, 0.00012323260307312012, 0.00013045966625213623, 0.00013768672943115234, 0.00014491379261016846, 0.00015214085578918457, 0.00015936791896820068, 0.0001665949821472168, 0.0001738220453262329, 0.00018104910850524902, 0.00018827617168426514, 0.00019550323486328125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 6.0, 11.0, 13.0, 26.0, 29.0, 44.0, 69.0, 123.0, 206.0, 375.0, 562.0, 923.0, 1496.0, 2538.0, 4359.0, 7612.0, 13256.0, 22250.0, 37396.0, 60711.0, 92953.0, 129847.0, 155072.0, 154101.0, 127144.0, 91030.0, 59235.0, 35662.0, 21294.0, 12407.0, 7282.0, 4227.0, 2414.0, 1520.0, 893.0, 584.0, 312.0, 207.0, 128.0, 91.0, 48.0, 38.0, 31.0, 10.0, 12.0, 8.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.208984375, -3.1053466796875, -3.001708984375, -2.8980712890625, -2.79443359375, -2.6907958984375, -2.587158203125, -2.4835205078125, -2.3798828125, -2.2762451171875, -2.172607421875, -2.0689697265625, -1.96533203125, -1.8616943359375, -1.758056640625, -1.6544189453125, -1.55078125, -1.4471435546875, -1.343505859375, -1.2398681640625, -1.13623046875, -1.0325927734375, -0.928955078125, -0.8253173828125, -0.7216796875, -0.6180419921875, -0.514404296875, -0.4107666015625, -0.30712890625, -0.2034912109375, -0.099853515625, 0.0037841796875, 0.107421875, 0.2110595703125, 0.314697265625, 0.4183349609375, 0.52197265625, 0.6256103515625, 0.729248046875, 0.8328857421875, 0.9365234375, 1.0401611328125, 1.143798828125, 1.2474365234375, 1.35107421875, 1.4547119140625, 1.558349609375, 1.6619873046875, 1.765625, 1.8692626953125, 1.972900390625, 2.0765380859375, 2.18017578125, 2.2838134765625, 2.387451171875, 2.4910888671875, 2.5947265625, 2.6983642578125, 2.802001953125, 2.9056396484375, 3.00927734375, 3.1129150390625, 3.216552734375, 3.3201904296875, 3.423828125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 4.0, 4.0, 13.0, 10.0, 12.0, 23.0, 17.0, 23.0, 34.0, 44.0, 35.0, 51.0, 56.0, 71.0, 61.0, 72.0, 68.0, 70.0, 73.0, 55.0, 46.0, 39.0, 25.0, 20.0, 17.0, 19.0, 13.0, 9.0, 9.0, 5.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.53125, -1.4858856201171875, -1.440521240234375, -1.3951568603515625, -1.34979248046875, -1.3044281005859375, -1.259063720703125, -1.2136993408203125, -1.1683349609375, -1.1229705810546875, -1.077606201171875, -1.0322418212890625, -0.98687744140625, -0.9415130615234375, -0.896148681640625, -0.8507843017578125, -0.805419921875, -0.7600555419921875, -0.714691162109375, -0.6693267822265625, -0.62396240234375, -0.5785980224609375, -0.533233642578125, -0.4878692626953125, -0.4425048828125, -0.3971405029296875, -0.351776123046875, -0.3064117431640625, -0.26104736328125, -0.2156829833984375, -0.170318603515625, -0.1249542236328125, -0.07958984375, -0.0342254638671875, 0.011138916015625, 0.0565032958984375, 0.10186767578125, 0.1472320556640625, 0.192596435546875, 0.2379608154296875, 0.2833251953125, 0.3286895751953125, 0.374053955078125, 0.4194183349609375, 0.46478271484375, 0.5101470947265625, 0.555511474609375, 0.6008758544921875, 0.646240234375, 0.6916046142578125, 0.736968994140625, 0.7823333740234375, 0.82769775390625, 0.8730621337890625, 0.918426513671875, 0.9637908935546875, 1.0091552734375, 1.0545196533203125, 1.099884033203125, 1.1452484130859375, 1.19061279296875, 1.2359771728515625, 1.281341552734375, 1.3267059326171875, 1.3720703125]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 11.0, 11.0, 11.0, 11.0, 17.0, 20.0, 22.0, 45.0, 34.0, 46.0, 57.0, 61.0, 71.0, 80.0, 69.0, 75.0, 81.0, 49.0, 51.0, 38.0, 39.0, 19.0, 17.0, 14.0, 13.0, 8.0, 8.0, 9.0, 6.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-23.749038696289062, -23.15329360961914, -22.55754852294922, -21.961801528930664, -21.366056442260742, -20.77031135559082, -20.174564361572266, -19.578819274902344, -18.983074188232422, -18.3873291015625, -17.791584014892578, -17.195837020874023, -16.6000919342041, -16.00434684753418, -15.408600807189941, -14.812854766845703, -14.217109680175781, -13.62136459350586, -13.025618553161621, -12.429872512817383, -11.834127426147461, -11.238382339477539, -10.6426362991333, -10.046890258789062, -9.45114517211914, -8.855400085449219, -8.25965404510498, -7.6639084815979, -7.06816291809082, -6.47241735458374, -5.87667179107666, -5.28092622756958, -4.685182571411133, -4.089437007904053, -3.4936914443969727, -2.8979458808898926, -2.3022003173828125, -1.7064547538757324, -1.1107091903686523, -0.5149636268615723, 0.08078193664550781, 0.6765275001525879, 1.272273063659668, 1.868018627166748, 2.463764190673828, 3.059509754180908, 3.6552553176879883, 4.251000881195068, 4.846746444702148, 5.4424920082092285, 6.038237571716309, 6.633983135223389, 7.229728698730469, 7.825474262237549, 8.421219825744629, 9.016965866088867, 9.612710952758789, 10.208456039428711, 10.80420207977295, 11.399948120117188, 11.99569320678711, 12.591438293457031, 13.18718433380127, 13.782930374145508, 14.37867546081543]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 4.0, 4.0, 5.0, 11.0, 12.0, 11.0, 18.0, 15.0, 17.0, 17.0, 18.0, 28.0, 25.0, 24.0, 35.0, 34.0, 32.0, 48.0, 45.0, 45.0, 42.0, 46.0, 60.0, 41.0, 38.0, 32.0, 31.0, 29.0, 37.0, 32.0, 20.0, 26.0, 30.0, 16.0, 25.0, 8.0, 10.0, 7.0, 2.0, 10.0, 5.0, 5.0, 4.0, 0.0, 3.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-10.541228294372559, -10.21462345123291, -9.888019561767578, -9.56141471862793, -9.234809875488281, -8.908205032348633, -8.581600189208984, -8.254996299743652, -7.928391456604004, -7.6017866134643555, -7.275182247161865, -6.948577880859375, -6.621973037719727, -6.295368194580078, -5.968763828277588, -5.642159461975098, -5.315554618835449, -4.988949775695801, -4.6623454093933105, -4.33574104309082, -4.009136199951172, -3.6825315952301025, -3.355926990509033, -3.029322385787964, -2.7027177810668945, -2.376113176345825, -2.049508571624756, -1.7229039669036865, -1.3962993621826172, -1.0696947574615479, -0.7430901527404785, -0.4164855480194092, -0.08987998962402344, 0.2367246150970459, 0.5633292198181152, 0.8899338245391846, 1.216538429260254, 1.5431430339813232, 1.8697476387023926, 2.196352243423462, 2.5229568481445312, 2.8495614528656006, 3.17616605758667, 3.5027706623077393, 3.8293752670288086, 4.155980110168457, 4.482584476470947, 4.8091888427734375, 5.135793685913086, 5.462398529052734, 5.789002895355225, 6.115607261657715, 6.442212104797363, 6.768816947937012, 7.095421314239502, 7.422025680541992, 7.748630523681641, 8.075235366821289, 8.401840209960938, 8.72844409942627, 9.055048942565918, 9.381653785705566, 9.708257675170898, 10.034862518310547, 10.361467361450195]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 11.0, 8.0, 17.0, 17.0, 43.0, 56.0, 79.0, 112.0, 190.0, 275.0, 451.0, 635.0, 1048.0, 1629.0, 2733.0, 4484.0, 7257.0, 11935.0, 19978.0, 32758.0, 51925.0, 79124.0, 110407.0, 137180.0, 146974.0, 133478.0, 104879.0, 74756.0, 48470.0, 30352.0, 18771.0, 11134.0, 6602.0, 4025.0, 2459.0, 1610.0, 938.0, 620.0, 376.0, 246.0, 161.0, 138.0, 63.0, 48.0, 32.0, 28.0, 19.0, 5.0, 5.0, 5.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0], "bins": [-10.1796875, -9.855712890625, -9.53173828125, -9.207763671875, -8.8837890625, -8.559814453125, -8.23583984375, -7.911865234375, -7.587890625, -7.263916015625, -6.93994140625, -6.615966796875, -6.2919921875, -5.968017578125, -5.64404296875, -5.320068359375, -4.99609375, -4.672119140625, -4.34814453125, -4.024169921875, -3.7001953125, -3.376220703125, -3.05224609375, -2.728271484375, -2.404296875, -2.080322265625, -1.75634765625, -1.432373046875, -1.1083984375, -0.784423828125, -0.46044921875, -0.136474609375, 0.1875, 0.511474609375, 0.83544921875, 1.159423828125, 1.4833984375, 1.807373046875, 2.13134765625, 2.455322265625, 2.779296875, 3.103271484375, 3.42724609375, 3.751220703125, 4.0751953125, 4.399169921875, 4.72314453125, 5.047119140625, 5.37109375, 5.695068359375, 6.01904296875, 6.343017578125, 6.6669921875, 6.990966796875, 7.31494140625, 7.638916015625, 7.962890625, 8.286865234375, 8.61083984375, 8.934814453125, 9.2587890625, 9.582763671875, 9.90673828125, 10.230712890625, 10.5546875]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 11.0, 5.0, 11.0, 9.0, 13.0, 14.0, 24.0, 16.0, 18.0, 27.0, 23.0, 23.0, 32.0, 36.0, 44.0, 21.0, 38.0, 43.0, 42.0, 49.0, 47.0, 49.0, 41.0, 47.0, 39.0, 36.0, 38.0, 29.0, 29.0, 25.0, 18.0, 24.0, 14.0, 16.0, 9.0, 7.0, 8.0, 8.0, 3.0, 2.0, 4.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.8359375, -10.494384765625, -10.15283203125, -9.811279296875, -9.4697265625, -9.128173828125, -8.78662109375, -8.445068359375, -8.103515625, -7.761962890625, -7.42041015625, -7.078857421875, -6.7373046875, -6.395751953125, -6.05419921875, -5.712646484375, -5.37109375, -5.029541015625, -4.68798828125, -4.346435546875, -4.0048828125, -3.663330078125, -3.32177734375, -2.980224609375, -2.638671875, -2.297119140625, -1.95556640625, -1.614013671875, -1.2724609375, -0.930908203125, -0.58935546875, -0.247802734375, 0.09375, 0.435302734375, 0.77685546875, 1.118408203125, 1.4599609375, 1.801513671875, 2.14306640625, 2.484619140625, 2.826171875, 3.167724609375, 3.50927734375, 3.850830078125, 4.1923828125, 4.533935546875, 4.87548828125, 5.217041015625, 5.55859375, 5.900146484375, 6.24169921875, 6.583251953125, 6.9248046875, 7.266357421875, 7.60791015625, 7.949462890625, 8.291015625, 8.632568359375, 8.97412109375, 9.315673828125, 9.6572265625, 9.998779296875, 10.34033203125, 10.681884765625, 11.0234375]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 8.0, 8.0, 12.0, 35.0, 40.0, 63.0, 78.0, 160.0, 228.0, 394.0, 605.0, 1018.0, 1606.0, 2698.0, 4570.0, 7829.0, 13097.0, 22190.0, 36762.0, 58691.0, 89156.0, 123423.0, 148598.0, 150685.0, 128922.0, 94540.0, 63470.0, 39662.0, 24325.0, 14412.0, 8484.0, 5211.0, 2992.0, 1788.0, 999.0, 655.0, 409.0, 246.0, 190.0, 105.0, 69.0, 38.0, 32.0, 13.0, 19.0, 8.0, 4.0, 4.0, 2.0, 3.0, 3.0, 2.0], "bins": [-11.1484375, -10.8306884765625, -10.512939453125, -10.1951904296875, -9.87744140625, -9.5596923828125, -9.241943359375, -8.9241943359375, -8.6064453125, -8.2886962890625, -7.970947265625, -7.6531982421875, -7.33544921875, -7.0177001953125, -6.699951171875, -6.3822021484375, -6.064453125, -5.7467041015625, -5.428955078125, -5.1112060546875, -4.79345703125, -4.4757080078125, -4.157958984375, -3.8402099609375, -3.5224609375, -3.2047119140625, -2.886962890625, -2.5692138671875, -2.25146484375, -1.9337158203125, -1.615966796875, -1.2982177734375, -0.98046875, -0.6627197265625, -0.344970703125, -0.0272216796875, 0.29052734375, 0.6082763671875, 0.926025390625, 1.2437744140625, 1.5615234375, 1.8792724609375, 2.197021484375, 2.5147705078125, 2.83251953125, 3.1502685546875, 3.468017578125, 3.7857666015625, 4.103515625, 4.4212646484375, 4.739013671875, 5.0567626953125, 5.37451171875, 5.6922607421875, 6.010009765625, 6.3277587890625, 6.6455078125, 6.9632568359375, 7.281005859375, 7.5987548828125, 7.91650390625, 8.2342529296875, 8.552001953125, 8.8697509765625, 9.1875]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 4.0, 3.0, 4.0, 8.0, 8.0, 8.0, 13.0, 15.0, 6.0, 18.0, 15.0, 37.0, 24.0, 20.0, 34.0, 38.0, 30.0, 33.0, 40.0, 32.0, 38.0, 45.0, 38.0, 46.0, 43.0, 33.0, 35.0, 35.0, 34.0, 28.0, 25.0, 26.0, 23.0, 19.0, 27.0, 23.0, 18.0, 16.0, 15.0, 5.0, 7.0, 6.0, 8.0, 4.0, 1.0, 8.0, 2.0, 4.0, 2.0, 4.0, 1.0, 1.0, 2.0], "bins": [-6.671875, -6.477294921875, -6.28271484375, -6.088134765625, -5.8935546875, -5.698974609375, -5.50439453125, -5.309814453125, -5.115234375, -4.920654296875, -4.72607421875, -4.531494140625, -4.3369140625, -4.142333984375, -3.94775390625, -3.753173828125, -3.55859375, -3.364013671875, -3.16943359375, -2.974853515625, -2.7802734375, -2.585693359375, -2.39111328125, -2.196533203125, -2.001953125, -1.807373046875, -1.61279296875, -1.418212890625, -1.2236328125, -1.029052734375, -0.83447265625, -0.639892578125, -0.4453125, -0.250732421875, -0.05615234375, 0.138427734375, 0.3330078125, 0.527587890625, 0.72216796875, 0.916748046875, 1.111328125, 1.305908203125, 1.50048828125, 1.695068359375, 1.8896484375, 2.084228515625, 2.27880859375, 2.473388671875, 2.66796875, 2.862548828125, 3.05712890625, 3.251708984375, 3.4462890625, 3.640869140625, 3.83544921875, 4.030029296875, 4.224609375, 4.419189453125, 4.61376953125, 4.808349609375, 5.0029296875, 5.197509765625, 5.39208984375, 5.586669921875, 5.78125]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 3.0, 8.0, 14.0, 16.0, 19.0, 23.0, 38.0, 52.0, 66.0, 92.0, 122.0, 187.0, 282.0, 354.0, 609.0, 894.0, 1329.0, 2449.0, 4839.0, 10090.0, 26178.0, 83918.0, 285689.0, 400538.0, 156137.0, 44272.0, 15173.0, 6614.0, 3321.0, 1916.0, 1028.0, 734.0, 499.0, 320.0, 208.0, 132.0, 111.0, 93.0, 49.0, 37.0, 36.0, 18.0, 15.0, 10.0, 10.0, 6.0, 3.0, 1.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.4375, -18.772705078125, -18.10791015625, -17.443115234375, -16.7783203125, -16.113525390625, -15.44873046875, -14.783935546875, -14.119140625, -13.454345703125, -12.78955078125, -12.124755859375, -11.4599609375, -10.795166015625, -10.13037109375, -9.465576171875, -8.80078125, -8.135986328125, -7.47119140625, -6.806396484375, -6.1416015625, -5.476806640625, -4.81201171875, -4.147216796875, -3.482421875, -2.817626953125, -2.15283203125, -1.488037109375, -0.8232421875, -0.158447265625, 0.50634765625, 1.171142578125, 1.8359375, 2.500732421875, 3.16552734375, 3.830322265625, 4.4951171875, 5.159912109375, 5.82470703125, 6.489501953125, 7.154296875, 7.819091796875, 8.48388671875, 9.148681640625, 9.8134765625, 10.478271484375, 11.14306640625, 11.807861328125, 12.47265625, 13.137451171875, 13.80224609375, 14.467041015625, 15.1318359375, 15.796630859375, 16.46142578125, 17.126220703125, 17.791015625, 18.455810546875, 19.12060546875, 19.785400390625, 20.4501953125, 21.114990234375, 21.77978515625, 22.444580078125, 23.109375]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 3.0, 2.0, 7.0, 5.0, 9.0, 11.0, 18.0, 27.0, 42.0, 44.0, 69.0, 114.0, 103.0, 131.0, 103.0, 79.0, 68.0, 55.0, 29.0, 30.0, 16.0, 16.0, 11.0, 3.0, 4.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011262893676757812, -0.0010731369256973267, -0.001019984483718872, -0.0009668320417404175, -0.0009136795997619629, -0.0008605271577835083, -0.0008073747158050537, -0.0007542222738265991, -0.0007010698318481445, -0.0006479173898696899, -0.0005947649478912354, -0.0005416125059127808, -0.0004884600639343262, -0.0004353076219558716, -0.000382155179977417, -0.0003290027379989624, -0.0002758502960205078, -0.00022269785404205322, -0.00016954541206359863, -0.00011639297008514404, -6.324052810668945e-05, -1.0088086128234863e-05, 4.3064355850219727e-05, 9.621679782867432e-05, 0.0001493692398071289, 0.0002025216817855835, 0.0002556741237640381, 0.0003088265657424927, 0.00036197900772094727, 0.00041513144969940186, 0.00046828389167785645, 0.000521436333656311, 0.0005745887756347656, 0.0006277412176132202, 0.0006808936595916748, 0.0007340461015701294, 0.000787198543548584, 0.0008403509855270386, 0.0008935034275054932, 0.0009466558694839478, 0.0009998083114624023, 0.001052960753440857, 0.0011061131954193115, 0.0011592656373977661, 0.0012124180793762207, 0.0012655705213546753, 0.0013187229633331299, 0.0013718754053115845, 0.001425027847290039, 0.0014781802892684937, 0.0015313327312469482, 0.0015844851732254028, 0.0016376376152038574, 0.001690790057182312, 0.0017439424991607666, 0.0017970949411392212, 0.0018502473831176758, 0.0019033998250961304, 0.001956552267074585, 0.0020097047090530396, 0.002062857151031494, 0.0021160095930099487, 0.0021691620349884033, 0.002222314476966858, 0.0022754669189453125]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 4.0, 6.0, 1.0, 9.0, 10.0, 16.0, 30.0, 32.0, 39.0, 58.0, 61.0, 99.0, 141.0, 213.0, 331.0, 486.0, 798.0, 1241.0, 2160.0, 3916.0, 7430.0, 14888.0, 31851.0, 72176.0, 155091.0, 256964.0, 244301.0, 137756.0, 62153.0, 27797.0, 13167.0, 6689.0, 3377.0, 1976.0, 1136.0, 713.0, 436.0, 298.0, 197.0, 130.0, 104.0, 78.0, 50.0, 37.0, 31.0, 27.0, 19.0, 15.0, 8.0, 4.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-13.234375, -12.832275390625, -12.43017578125, -12.028076171875, -11.6259765625, -11.223876953125, -10.82177734375, -10.419677734375, -10.017578125, -9.615478515625, -9.21337890625, -8.811279296875, -8.4091796875, -8.007080078125, -7.60498046875, -7.202880859375, -6.80078125, -6.398681640625, -5.99658203125, -5.594482421875, -5.1923828125, -4.790283203125, -4.38818359375, -3.986083984375, -3.583984375, -3.181884765625, -2.77978515625, -2.377685546875, -1.9755859375, -1.573486328125, -1.17138671875, -0.769287109375, -0.3671875, 0.034912109375, 0.43701171875, 0.839111328125, 1.2412109375, 1.643310546875, 2.04541015625, 2.447509765625, 2.849609375, 3.251708984375, 3.65380859375, 4.055908203125, 4.4580078125, 4.860107421875, 5.26220703125, 5.664306640625, 6.06640625, 6.468505859375, 6.87060546875, 7.272705078125, 7.6748046875, 8.076904296875, 8.47900390625, 8.881103515625, 9.283203125, 9.685302734375, 10.08740234375, 10.489501953125, 10.8916015625, 11.293701171875, 11.69580078125, 12.097900390625, 12.5]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 4.0, 8.0, 3.0, 3.0, 5.0, 5.0, 6.0, 13.0, 19.0, 12.0, 29.0, 30.0, 39.0, 35.0, 67.0, 90.0, 64.0, 81.0, 77.0, 77.0, 67.0, 49.0, 54.0, 42.0, 34.0, 19.0, 17.0, 10.0, 11.0, 14.0, 10.0, 4.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.23046875, -3.132293701171875, -3.03411865234375, -2.935943603515625, -2.8377685546875, -2.739593505859375, -2.64141845703125, -2.543243408203125, -2.445068359375, -2.346893310546875, -2.24871826171875, -2.150543212890625, -2.0523681640625, -1.954193115234375, -1.85601806640625, -1.757843017578125, -1.65966796875, -1.561492919921875, -1.46331787109375, -1.365142822265625, -1.2669677734375, -1.168792724609375, -1.07061767578125, -0.972442626953125, -0.874267578125, -0.776092529296875, -0.67791748046875, -0.579742431640625, -0.4815673828125, -0.383392333984375, -0.28521728515625, -0.187042236328125, -0.0888671875, 0.009307861328125, 0.10748291015625, 0.205657958984375, 0.3038330078125, 0.402008056640625, 0.50018310546875, 0.598358154296875, 0.696533203125, 0.794708251953125, 0.89288330078125, 0.991058349609375, 1.0892333984375, 1.187408447265625, 1.28558349609375, 1.383758544921875, 1.48193359375, 1.580108642578125, 1.67828369140625, 1.776458740234375, 1.8746337890625, 1.972808837890625, 2.07098388671875, 2.169158935546875, 2.267333984375, 2.365509033203125, 2.46368408203125, 2.561859130859375, 2.6600341796875, 2.758209228515625, 2.85638427734375, 2.954559326171875, 3.052734375]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 5.0, 7.0, 6.0, 5.0, 13.0, 21.0, 29.0, 22.0, 35.0, 46.0, 34.0, 52.0, 73.0, 77.0, 82.0, 71.0, 85.0, 62.0, 60.0, 61.0, 36.0, 26.0, 28.0, 20.0, 8.0, 8.0, 12.0, 10.0, 7.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-25.303194046020508, -24.669628143310547, -24.036062240600586, -23.402494430541992, -22.76892852783203, -22.13536262512207, -21.50179672241211, -20.86823081970215, -20.234664916992188, -19.601099014282227, -18.967533111572266, -18.333965301513672, -17.70039939880371, -17.06683349609375, -16.43326759338379, -15.799701690673828, -15.166133880615234, -14.532567977905273, -13.899001121520996, -13.265435218811035, -12.631868362426758, -11.998302459716797, -11.364736557006836, -10.731170654296875, -10.097603797912598, -9.464037895202637, -8.83047103881836, -8.196905136108398, -7.563338756561279, -6.92977237701416, -6.296206474304199, -5.66264009475708, -5.029071807861328, -4.395505428314209, -3.761939287185669, -3.128373146057129, -2.4948067665100098, -1.8612403869628906, -1.2276742458343506, -0.5941081047058105, 0.039458274841308594, 0.6730245351791382, 1.3065907955169678, 1.9401570558547974, 2.573723316192627, 3.207289695739746, 3.840855836868286, 4.474421977996826, 5.107988357543945, 5.7415547370910645, 6.375121116638184, 7.0086870193481445, 7.642253398895264, 8.275819778442383, 8.909385681152344, 9.542951583862305, 10.176518440246582, 10.810084342956543, 11.44365119934082, 12.077217102050781, 12.710783004760742, 13.34434986114502, 13.97791576385498, 14.611482620239258, 15.245048522949219]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 2.0, 8.0, 4.0, 4.0, 6.0, 7.0, 13.0, 15.0, 16.0, 23.0, 24.0, 25.0, 24.0, 37.0, 22.0, 36.0, 39.0, 43.0, 29.0, 33.0, 42.0, 42.0, 46.0, 53.0, 39.0, 40.0, 42.0, 31.0, 28.0, 33.0, 25.0, 29.0, 23.0, 13.0, 22.0, 19.0, 14.0, 5.0, 11.0, 10.0, 4.0, 7.0, 4.0, 4.0, 4.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.647385597229004, -9.334603309631348, -9.021821975708008, -8.709039688110352, -8.396257400512695, -8.083475112915039, -7.770693778991699, -7.457911491394043, -7.145129680633545, -6.832347869873047, -6.519565582275391, -6.206783771514893, -5.8940019607543945, -5.581219673156738, -5.26843786239624, -4.955656051635742, -4.642873764038086, -4.330091953277588, -4.017309665679932, -3.7045278549194336, -3.3917458057403564, -3.0789637565612793, -2.7661819458007812, -2.453399896621704, -2.140617847442627, -1.8278357982635498, -1.5150538682937622, -1.2022719383239746, -0.8894898891448975, -0.5767078399658203, -0.2639259099960327, 0.04885601997375488, 0.3616371154785156, 0.674419105052948, 0.9872010946273804, 1.299983024597168, 1.6127650737762451, 1.9255471229553223, 2.2383289337158203, 2.5511109828948975, 2.8638930320739746, 3.1766750812530518, 3.489457130432129, 3.802238941192627, 4.115020751953125, 4.427803039550781, 4.740584850311279, 5.053366661071777, 5.366148948669434, 5.678930759429932, 5.991713047027588, 6.304494857788086, 6.617277145385742, 6.93005895614624, 7.242840766906738, 7.5556230545043945, 7.868404865264893, 8.18118667602539, 8.493968963623047, 8.806751251220703, 9.119532585144043, 9.4323148727417, 9.745097160339355, 10.057878494262695, 10.370660781860352]}, "gradients/decoder.bert.encoder.layer.15.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 9.0, 15.0, 35.0, 37.0, 66.0, 138.0, 208.0, 385.0, 584.0, 1074.0, 1752.0, 2942.0, 5192.0, 9169.0, 16332.0, 29384.0, 54302.0, 102617.0, 196304.0, 375475.0, 664368.0, 906119.0, 798343.0, 484609.0, 256377.0, 132526.0, 69487.0, 37339.0, 20257.0, 11520.0, 6807.0, 3850.0, 2421.0, 1479.0, 937.0, 614.0, 427.0, 239.0, 207.0, 105.0, 79.0, 48.0, 32.0, 32.0, 20.0, 13.0, 7.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0], "bins": [-12.640625, -12.2420654296875, -11.843505859375, -11.4449462890625, -11.04638671875, -10.6478271484375, -10.249267578125, -9.8507080078125, -9.4521484375, -9.0535888671875, -8.655029296875, -8.2564697265625, -7.85791015625, -7.4593505859375, -7.060791015625, -6.6622314453125, -6.263671875, -5.8651123046875, -5.466552734375, -5.0679931640625, -4.66943359375, -4.2708740234375, -3.872314453125, -3.4737548828125, -3.0751953125, -2.6766357421875, -2.278076171875, -1.8795166015625, -1.48095703125, -1.0823974609375, -0.683837890625, -0.2852783203125, 0.11328125, 0.5118408203125, 0.910400390625, 1.3089599609375, 1.70751953125, 2.1060791015625, 2.504638671875, 2.9031982421875, 3.3017578125, 3.7003173828125, 4.098876953125, 4.4974365234375, 4.89599609375, 5.2945556640625, 5.693115234375, 6.0916748046875, 6.490234375, 6.8887939453125, 7.287353515625, 7.6859130859375, 8.08447265625, 8.4830322265625, 8.881591796875, 9.2801513671875, 9.6787109375, 10.0772705078125, 10.475830078125, 10.8743896484375, 11.27294921875, 11.6715087890625, 12.070068359375, 12.4686279296875, 12.8671875]}, "gradients/decoder.bert.encoder.layer.15.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 3.0, 5.0, 9.0, 9.0, 4.0, 9.0, 14.0, 21.0, 13.0, 14.0, 25.0, 24.0, 34.0, 34.0, 44.0, 29.0, 28.0, 44.0, 40.0, 48.0, 36.0, 36.0, 47.0, 39.0, 31.0, 53.0, 35.0, 34.0, 23.0, 30.0, 27.0, 34.0, 22.0, 14.0, 20.0, 10.0, 11.0, 12.0, 6.0, 5.0, 12.0, 2.0, 6.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0], "bins": [-7.3828125, -7.16815185546875, -6.9534912109375, -6.73883056640625, -6.524169921875, -6.30950927734375, -6.0948486328125, -5.88018798828125, -5.66552734375, -5.45086669921875, -5.2362060546875, -5.02154541015625, -4.806884765625, -4.59222412109375, -4.3775634765625, -4.16290283203125, -3.9482421875, -3.73358154296875, -3.5189208984375, -3.30426025390625, -3.089599609375, -2.87493896484375, -2.6602783203125, -2.44561767578125, -2.23095703125, -2.01629638671875, -1.8016357421875, -1.58697509765625, -1.372314453125, -1.15765380859375, -0.9429931640625, -0.72833251953125, -0.513671875, -0.29901123046875, -0.0843505859375, 0.13031005859375, 0.344970703125, 0.55963134765625, 0.7742919921875, 0.98895263671875, 1.20361328125, 1.41827392578125, 1.6329345703125, 1.84759521484375, 2.062255859375, 2.27691650390625, 2.4915771484375, 2.70623779296875, 2.9208984375, 3.13555908203125, 3.3502197265625, 3.56488037109375, 3.779541015625, 3.99420166015625, 4.2088623046875, 4.42352294921875, 4.63818359375, 4.85284423828125, 5.0675048828125, 5.28216552734375, 5.496826171875, 5.71148681640625, 5.9261474609375, 6.14080810546875, 6.35546875]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 6.0, 5.0, 13.0, 16.0, 34.0, 52.0, 108.0, 180.0, 324.0, 559.0, 942.0, 1751.0, 3290.0, 6024.0, 11553.0, 21926.0, 42800.0, 82273.0, 159369.0, 298542.0, 522684.0, 775446.0, 836534.0, 626340.0, 376302.0, 204306.0, 106798.0, 55593.0, 28573.0, 14824.0, 7835.0, 4202.0, 2287.0, 1198.0, 719.0, 377.0, 196.0, 123.0, 75.0, 42.0, 30.0, 25.0, 8.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.859375, -12.4599609375, -12.060546875, -11.6611328125, -11.26171875, -10.8623046875, -10.462890625, -10.0634765625, -9.6640625, -9.2646484375, -8.865234375, -8.4658203125, -8.06640625, -7.6669921875, -7.267578125, -6.8681640625, -6.46875, -6.0693359375, -5.669921875, -5.2705078125, -4.87109375, -4.4716796875, -4.072265625, -3.6728515625, -3.2734375, -2.8740234375, -2.474609375, -2.0751953125, -1.67578125, -1.2763671875, -0.876953125, -0.4775390625, -0.078125, 0.3212890625, 0.720703125, 1.1201171875, 1.51953125, 1.9189453125, 2.318359375, 2.7177734375, 3.1171875, 3.5166015625, 3.916015625, 4.3154296875, 4.71484375, 5.1142578125, 5.513671875, 5.9130859375, 6.3125, 6.7119140625, 7.111328125, 7.5107421875, 7.91015625, 8.3095703125, 8.708984375, 9.1083984375, 9.5078125, 9.9072265625, 10.306640625, 10.7060546875, 11.10546875, 11.5048828125, 11.904296875, 12.3037109375, 12.703125]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 10.0, 4.0, 14.0, 16.0, 19.0, 18.0, 20.0, 32.0, 61.0, 52.0, 56.0, 64.0, 85.0, 91.0, 117.0, 132.0, 158.0, 154.0, 202.0, 204.0, 205.0, 217.0, 228.0, 219.0, 211.0, 218.0, 200.0, 158.0, 141.0, 122.0, 126.0, 105.0, 80.0, 75.0, 63.0, 35.0, 42.0, 36.0, 18.0, 13.0, 13.0, 12.0, 6.0, 7.0, 6.0, 6.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.427734375, -3.31829833984375, -3.2088623046875, -3.09942626953125, -2.989990234375, -2.88055419921875, -2.7711181640625, -2.66168212890625, -2.55224609375, -2.44281005859375, -2.3333740234375, -2.22393798828125, -2.114501953125, -2.00506591796875, -1.8956298828125, -1.78619384765625, -1.6767578125, -1.56732177734375, -1.4578857421875, -1.34844970703125, -1.239013671875, -1.12957763671875, -1.0201416015625, -0.91070556640625, -0.80126953125, -0.69183349609375, -0.5823974609375, -0.47296142578125, -0.363525390625, -0.25408935546875, -0.1446533203125, -0.03521728515625, 0.07421875, 0.18365478515625, 0.2930908203125, 0.40252685546875, 0.511962890625, 0.62139892578125, 0.7308349609375, 0.84027099609375, 0.94970703125, 1.05914306640625, 1.1685791015625, 1.27801513671875, 1.387451171875, 1.49688720703125, 1.6063232421875, 1.71575927734375, 1.8251953125, 1.93463134765625, 2.0440673828125, 2.15350341796875, 2.262939453125, 2.37237548828125, 2.4818115234375, 2.59124755859375, 2.70068359375, 2.81011962890625, 2.9195556640625, 3.02899169921875, 3.138427734375, 3.24786376953125, 3.3572998046875, 3.46673583984375, 3.576171875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 6.0, 5.0, 7.0, 4.0, 9.0, 4.0, 18.0, 10.0, 16.0, 27.0, 34.0, 30.0, 43.0, 32.0, 54.0, 65.0, 56.0, 63.0, 78.0, 65.0, 55.0, 45.0, 60.0, 41.0, 43.0, 33.0, 29.0, 17.0, 18.0, 14.0, 11.0, 9.0, 3.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0], "bins": [-19.493425369262695, -19.02005386352539, -18.546682357788086, -18.07331085205078, -17.599939346313477, -17.126567840576172, -16.653194427490234, -16.17982292175293, -15.706451416015625, -15.23307991027832, -14.759708404541016, -14.286336898803711, -13.81296443939209, -13.339592933654785, -12.86622142791748, -12.392849922180176, -11.919478416442871, -11.446106910705566, -10.972735404968262, -10.49936294555664, -10.025991439819336, -9.552619934082031, -9.079248428344727, -8.605876922607422, -8.132505416870117, -7.6591339111328125, -7.18576192855835, -6.712390422821045, -6.239018440246582, -5.765646934509277, -5.292275428771973, -4.818903923034668, -4.345531463623047, -3.872159719467163, -3.3987879753112793, -2.9254164695739746, -2.452044725418091, -1.978672981262207, -1.5053014755249023, -1.0319297313690186, -0.5585579872131348, -0.08518630266189575, 0.38818538188934326, 0.8615570068359375, 1.3349287509918213, 1.808300495147705, 2.2816720008850098, 2.7550437450408936, 3.2284154891967773, 3.701787233352661, 4.175158977508545, 4.64853048324585, 5.1219024658203125, 5.595273971557617, 6.068645477294922, 6.542016983032227, 7.0153889656066895, 7.488760471343994, 7.962132453918457, 8.435503959655762, 8.908875465393066, 9.382247924804688, 9.855619430541992, 10.328990936279297, 10.802362442016602]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 7.0, 1.0, 3.0, 3.0, 6.0, 9.0, 22.0, 18.0, 10.0, 13.0, 19.0, 29.0, 30.0, 23.0, 28.0, 41.0, 24.0, 25.0, 38.0, 39.0, 38.0, 41.0, 35.0, 46.0, 42.0, 38.0, 32.0, 32.0, 31.0, 41.0, 30.0, 24.0, 32.0, 18.0, 24.0, 18.0, 11.0, 14.0, 14.0, 20.0, 6.0, 9.0, 8.0, 3.0, 2.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.207751750946045, -6.95649528503418, -6.705239295959473, -6.453982830047607, -6.202726364135742, -5.951469898223877, -5.700213432312012, -5.448957443237305, -5.1977009773254395, -4.946444511413574, -4.695188522338867, -4.443932056427002, -4.192675590515137, -3.9414191246032715, -3.6901628971099854, -3.438906669616699, -3.187650203704834, -2.9363937377929688, -2.6851375102996826, -2.4338812828063965, -2.1826248168945312, -1.9313684701919556, -1.6801121234893799, -1.4288557767868042, -1.1775994300842285, -0.9263430833816528, -0.6750867366790771, -0.42383038997650146, -0.17257404327392578, 0.0786823034286499, 0.3299386501312256, 0.5811949968338013, 0.8324508666992188, 1.0837072134017944, 1.3349635601043701, 1.5862199068069458, 1.8374762535095215, 2.0887327194213867, 2.339988946914673, 2.591245174407959, 2.842501640319824, 3.0937581062316895, 3.3450143337249756, 3.5962705612182617, 3.847527027130127, 4.098783493041992, 4.350039482116699, 4.6012959480285645, 4.85255241394043, 5.103808879852295, 5.35506534576416, 5.606321334838867, 5.857577800750732, 6.108834266662598, 6.360090255737305, 6.61134672164917, 6.862603187561035, 7.1138596534729, 7.365116119384766, 7.616372108459473, 7.867628574371338, 8.118885040283203, 8.37014102935791, 8.621397972106934, 8.87265396118164]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 7.0, 5.0, 7.0, 22.0, 28.0, 32.0, 82.0, 83.0, 143.0, 195.0, 319.0, 511.0, 694.0, 1169.0, 1751.0, 2719.0, 4550.0, 7331.0, 12201.0, 20497.0, 33898.0, 54905.0, 86150.0, 123158.0, 152781.0, 157805.0, 132202.0, 95216.0, 61966.0, 38542.0, 23239.0, 13752.0, 8485.0, 5193.0, 3231.0, 1942.0, 1260.0, 842.0, 545.0, 357.0, 234.0, 166.0, 100.0, 81.0, 62.0, 35.0, 26.0, 11.0, 11.0, 15.0, 5.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.37890625, -5.20611572265625, -5.0333251953125, -4.86053466796875, -4.687744140625, -4.51495361328125, -4.3421630859375, -4.16937255859375, -3.99658203125, -3.82379150390625, -3.6510009765625, -3.47821044921875, -3.305419921875, -3.13262939453125, -2.9598388671875, -2.78704833984375, -2.6142578125, -2.44146728515625, -2.2686767578125, -2.09588623046875, -1.923095703125, -1.75030517578125, -1.5775146484375, -1.40472412109375, -1.23193359375, -1.05914306640625, -0.8863525390625, -0.71356201171875, -0.540771484375, -0.36798095703125, -0.1951904296875, -0.02239990234375, 0.150390625, 0.32318115234375, 0.4959716796875, 0.66876220703125, 0.841552734375, 1.01434326171875, 1.1871337890625, 1.35992431640625, 1.53271484375, 1.70550537109375, 1.8782958984375, 2.05108642578125, 2.223876953125, 2.39666748046875, 2.5694580078125, 2.74224853515625, 2.9150390625, 3.08782958984375, 3.2606201171875, 3.43341064453125, 3.606201171875, 3.77899169921875, 3.9517822265625, 4.12457275390625, 4.29736328125, 4.47015380859375, 4.6429443359375, 4.81573486328125, 4.988525390625, 5.16131591796875, 5.3341064453125, 5.50689697265625, 5.6796875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 2.0, 2.0, 7.0, 7.0, 7.0, 6.0, 9.0, 15.0, 12.0, 19.0, 21.0, 16.0, 26.0, 26.0, 25.0, 44.0, 26.0, 38.0, 41.0, 33.0, 39.0, 33.0, 40.0, 41.0, 47.0, 47.0, 38.0, 48.0, 39.0, 29.0, 28.0, 21.0, 26.0, 23.0, 20.0, 14.0, 19.0, 16.0, 14.0, 11.0, 10.0, 5.0, 9.0, 4.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-10.1171875, -9.82373046875, -9.5302734375, -9.23681640625, -8.943359375, -8.64990234375, -8.3564453125, -8.06298828125, -7.76953125, -7.47607421875, -7.1826171875, -6.88916015625, -6.595703125, -6.30224609375, -6.0087890625, -5.71533203125, -5.421875, -5.12841796875, -4.8349609375, -4.54150390625, -4.248046875, -3.95458984375, -3.6611328125, -3.36767578125, -3.07421875, -2.78076171875, -2.4873046875, -2.19384765625, -1.900390625, -1.60693359375, -1.3134765625, -1.02001953125, -0.7265625, -0.43310546875, -0.1396484375, 0.15380859375, 0.447265625, 0.74072265625, 1.0341796875, 1.32763671875, 1.62109375, 1.91455078125, 2.2080078125, 2.50146484375, 2.794921875, 3.08837890625, 3.3818359375, 3.67529296875, 3.96875, 4.26220703125, 4.5556640625, 4.84912109375, 5.142578125, 5.43603515625, 5.7294921875, 6.02294921875, 6.31640625, 6.60986328125, 6.9033203125, 7.19677734375, 7.490234375, 7.78369140625, 8.0771484375, 8.37060546875, 8.6640625]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 6.0, 8.0, 9.0, 15.0, 21.0, 33.0, 48.0, 66.0, 94.0, 162.0, 254.0, 464.0, 830.0, 1762.0, 3441.0, 7584.0, 18832.0, 51497.0, 151641.0, 351952.0, 289971.0, 107212.0, 37140.0, 13935.0, 5918.0, 2630.0, 1319.0, 703.0, 375.0, 212.0, 153.0, 90.0, 45.0, 39.0, 30.0, 20.0, 13.0, 8.0, 5.0, 4.0, 6.0, 2.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0], "bins": [-16.109375, -15.659912109375, -15.21044921875, -14.760986328125, -14.3115234375, -13.862060546875, -13.41259765625, -12.963134765625, -12.513671875, -12.064208984375, -11.61474609375, -11.165283203125, -10.7158203125, -10.266357421875, -9.81689453125, -9.367431640625, -8.91796875, -8.468505859375, -8.01904296875, -7.569580078125, -7.1201171875, -6.670654296875, -6.22119140625, -5.771728515625, -5.322265625, -4.872802734375, -4.42333984375, -3.973876953125, -3.5244140625, -3.074951171875, -2.62548828125, -2.176025390625, -1.7265625, -1.277099609375, -0.82763671875, -0.378173828125, 0.0712890625, 0.520751953125, 0.97021484375, 1.419677734375, 1.869140625, 2.318603515625, 2.76806640625, 3.217529296875, 3.6669921875, 4.116455078125, 4.56591796875, 5.015380859375, 5.46484375, 5.914306640625, 6.36376953125, 6.813232421875, 7.2626953125, 7.712158203125, 8.16162109375, 8.611083984375, 9.060546875, 9.510009765625, 9.95947265625, 10.408935546875, 10.8583984375, 11.307861328125, 11.75732421875, 12.206787109375, 12.65625]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 0.0, 7.0, 3.0, 3.0, 6.0, 2.0, 6.0, 6.0, 5.0, 6.0, 10.0, 13.0, 13.0, 14.0, 19.0, 18.0, 17.0, 28.0, 28.0, 38.0, 32.0, 24.0, 26.0, 40.0, 34.0, 42.0, 31.0, 41.0, 41.0, 34.0, 29.0, 34.0, 25.0, 39.0, 25.0, 30.0, 26.0, 30.0, 24.0, 16.0, 19.0, 22.0, 13.0, 16.0, 15.0, 11.0, 7.0, 5.0, 7.0, 9.0, 1.0, 9.0, 0.0, 5.0, 3.0, 1.0, 6.0, 1.0, 0.0, 2.0, 1.0], "bins": [-4.828125, -4.6724853515625, -4.516845703125, -4.3612060546875, -4.20556640625, -4.0499267578125, -3.894287109375, -3.7386474609375, -3.5830078125, -3.4273681640625, -3.271728515625, -3.1160888671875, -2.96044921875, -2.8048095703125, -2.649169921875, -2.4935302734375, -2.337890625, -2.1822509765625, -2.026611328125, -1.8709716796875, -1.71533203125, -1.5596923828125, -1.404052734375, -1.2484130859375, -1.0927734375, -0.9371337890625, -0.781494140625, -0.6258544921875, -0.47021484375, -0.3145751953125, -0.158935546875, -0.0032958984375, 0.15234375, 0.3079833984375, 0.463623046875, 0.6192626953125, 0.77490234375, 0.9305419921875, 1.086181640625, 1.2418212890625, 1.3974609375, 1.5531005859375, 1.708740234375, 1.8643798828125, 2.02001953125, 2.1756591796875, 2.331298828125, 2.4869384765625, 2.642578125, 2.7982177734375, 2.953857421875, 3.1094970703125, 3.26513671875, 3.4207763671875, 3.576416015625, 3.7320556640625, 3.8876953125, 4.0433349609375, 4.198974609375, 4.3546142578125, 4.51025390625, 4.6658935546875, 4.821533203125, 4.9771728515625, 5.1328125]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 5.0, 5.0, 11.0, 17.0, 16.0, 15.0, 39.0, 51.0, 53.0, 89.0, 135.0, 180.0, 238.0, 365.0, 567.0, 786.0, 1285.0, 1972.0, 3024.0, 4988.0, 8512.0, 14225.0, 25016.0, 45501.0, 83416.0, 144604.0, 212515.0, 202097.0, 130125.0, 73387.0, 40222.0, 22260.0, 12765.0, 7467.0, 4624.0, 2720.0, 1715.0, 1128.0, 733.0, 507.0, 369.0, 242.0, 160.0, 124.0, 75.0, 66.0, 37.0, 25.0, 23.0, 21.0, 8.0, 10.0, 6.0, 8.0, 5.0, 1.0, 1.0, 2.0], "bins": [-3.796875, -3.68145751953125, -3.5660400390625, -3.45062255859375, -3.335205078125, -3.21978759765625, -3.1043701171875, -2.98895263671875, -2.87353515625, -2.75811767578125, -2.6427001953125, -2.52728271484375, -2.411865234375, -2.29644775390625, -2.1810302734375, -2.06561279296875, -1.9501953125, -1.83477783203125, -1.7193603515625, -1.60394287109375, -1.488525390625, -1.37310791015625, -1.2576904296875, -1.14227294921875, -1.02685546875, -0.91143798828125, -0.7960205078125, -0.68060302734375, -0.565185546875, -0.44976806640625, -0.3343505859375, -0.21893310546875, -0.103515625, 0.01190185546875, 0.1273193359375, 0.24273681640625, 0.358154296875, 0.47357177734375, 0.5889892578125, 0.70440673828125, 0.81982421875, 0.93524169921875, 1.0506591796875, 1.16607666015625, 1.281494140625, 1.39691162109375, 1.5123291015625, 1.62774658203125, 1.7431640625, 1.85858154296875, 1.9739990234375, 2.08941650390625, 2.204833984375, 2.32025146484375, 2.4356689453125, 2.55108642578125, 2.66650390625, 2.78192138671875, 2.8973388671875, 3.01275634765625, 3.128173828125, 3.24359130859375, 3.3590087890625, 3.47442626953125, 3.58984375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 5.0, 6.0, 10.0, 8.0, 13.0, 14.0, 14.0, 19.0, 40.0, 42.0, 45.0, 60.0, 72.0, 76.0, 80.0, 79.0, 70.0, 48.0, 63.0, 45.0, 54.0, 30.0, 20.0, 26.0, 9.0, 10.0, 10.0, 8.0, 5.0, 0.0, 4.0, 9.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00019502639770507812, -0.0001892372965812683, -0.0001834481954574585, -0.00017765909433364868, -0.00017186999320983887, -0.00016608089208602905, -0.00016029179096221924, -0.00015450268983840942, -0.0001487135887145996, -0.0001429244875907898, -0.00013713538646697998, -0.00013134628534317017, -0.00012555718421936035, -0.00011976808309555054, -0.00011397898197174072, -0.00010818988084793091, -0.0001024007797241211, -9.661167860031128e-05, -9.082257747650146e-05, -8.503347635269165e-05, -7.924437522888184e-05, -7.345527410507202e-05, -6.766617298126221e-05, -6.187707185745239e-05, -5.608797073364258e-05, -5.0298869609832764e-05, -4.450976848602295e-05, -3.8720667362213135e-05, -3.293156623840332e-05, -2.7142465114593506e-05, -2.135336399078369e-05, -1.5564262866973877e-05, -9.775161743164062e-06, -3.986060619354248e-06, 1.8030405044555664e-06, 7.592141628265381e-06, 1.3381242752075195e-05, 1.917034387588501e-05, 2.4959444999694824e-05, 3.074854612350464e-05, 3.653764724731445e-05, 4.232674837112427e-05, 4.811584949493408e-05, 5.3904950618743896e-05, 5.969405174255371e-05, 6.548315286636353e-05, 7.127225399017334e-05, 7.706135511398315e-05, 8.285045623779297e-05, 8.863955736160278e-05, 9.44286584854126e-05, 0.00010021775960922241, 0.00010600686073303223, 0.00011179596185684204, 0.00011758506298065186, 0.00012337416410446167, 0.00012916326522827148, 0.0001349523663520813, 0.0001407414674758911, 0.00014653056859970093, 0.00015231966972351074, 0.00015810877084732056, 0.00016389787197113037, 0.00016968697309494019, 0.00017547607421875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 4.0, 5.0, 7.0, 11.0, 5.0, 11.0, 23.0, 28.0, 40.0, 53.0, 86.0, 127.0, 155.0, 234.0, 341.0, 516.0, 679.0, 1050.0, 1572.0, 2506.0, 3785.0, 5962.0, 9329.0, 14966.0, 24809.0, 39906.0, 63645.0, 95639.0, 131192.0, 154244.0, 149307.0, 120037.0, 83550.0, 54549.0, 33744.0, 20784.0, 12958.0, 8039.0, 5024.0, 3270.0, 2083.0, 1380.0, 900.0, 591.0, 433.0, 278.0, 225.0, 161.0, 111.0, 81.0, 45.0, 27.0, 19.0, 19.0, 8.0, 9.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.72265625, -2.63433837890625, -2.5460205078125, -2.45770263671875, -2.369384765625, -2.28106689453125, -2.1927490234375, -2.10443115234375, -2.01611328125, -1.92779541015625, -1.8394775390625, -1.75115966796875, -1.662841796875, -1.57452392578125, -1.4862060546875, -1.39788818359375, -1.3095703125, -1.22125244140625, -1.1329345703125, -1.04461669921875, -0.956298828125, -0.86798095703125, -0.7796630859375, -0.69134521484375, -0.60302734375, -0.51470947265625, -0.4263916015625, -0.33807373046875, -0.249755859375, -0.16143798828125, -0.0731201171875, 0.01519775390625, 0.103515625, 0.19183349609375, 0.2801513671875, 0.36846923828125, 0.456787109375, 0.54510498046875, 0.6334228515625, 0.72174072265625, 0.81005859375, 0.89837646484375, 0.9866943359375, 1.07501220703125, 1.163330078125, 1.25164794921875, 1.3399658203125, 1.42828369140625, 1.5166015625, 1.60491943359375, 1.6932373046875, 1.78155517578125, 1.869873046875, 1.95819091796875, 2.0465087890625, 2.13482666015625, 2.22314453125, 2.31146240234375, 2.3997802734375, 2.48809814453125, 2.576416015625, 2.66473388671875, 2.7530517578125, 2.84136962890625, 2.9296875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 4.0, 7.0, 6.0, 4.0, 13.0, 13.0, 8.0, 19.0, 22.0, 29.0, 26.0, 23.0, 31.0, 51.0, 37.0, 53.0, 61.0, 51.0, 45.0, 59.0, 58.0, 45.0, 41.0, 36.0, 36.0, 39.0, 32.0, 21.0, 34.0, 15.0, 17.0, 9.0, 13.0, 11.0, 6.0, 4.0, 5.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.9140625, -0.8857574462890625, -0.857452392578125, -0.8291473388671875, -0.80084228515625, -0.7725372314453125, -0.744232177734375, -0.7159271240234375, -0.6876220703125, -0.6593170166015625, -0.631011962890625, -0.6027069091796875, -0.57440185546875, -0.5460968017578125, -0.517791748046875, -0.4894866943359375, -0.461181640625, -0.4328765869140625, -0.404571533203125, -0.3762664794921875, -0.34796142578125, -0.3196563720703125, -0.291351318359375, -0.2630462646484375, -0.2347412109375, -0.2064361572265625, -0.178131103515625, -0.1498260498046875, -0.12152099609375, -0.0932159423828125, -0.064910888671875, -0.0366058349609375, -0.00830078125, 0.0200042724609375, 0.048309326171875, 0.0766143798828125, 0.10491943359375, 0.1332244873046875, 0.161529541015625, 0.1898345947265625, 0.2181396484375, 0.2464447021484375, 0.274749755859375, 0.3030548095703125, 0.33135986328125, 0.3596649169921875, 0.387969970703125, 0.4162750244140625, 0.444580078125, 0.4728851318359375, 0.501190185546875, 0.5294952392578125, 0.55780029296875, 0.5861053466796875, 0.614410400390625, 0.6427154541015625, 0.6710205078125, 0.6993255615234375, 0.727630615234375, 0.7559356689453125, 0.78424072265625, 0.8125457763671875, 0.840850830078125, 0.8691558837890625, 0.8974609375]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 4.0, 7.0, 7.0, 9.0, 6.0, 14.0, 16.0, 21.0, 25.0, 27.0, 38.0, 33.0, 45.0, 57.0, 65.0, 52.0, 75.0, 71.0, 65.0, 47.0, 45.0, 59.0, 52.0, 26.0, 36.0, 24.0, 19.0, 17.0, 15.0, 7.0, 7.0, 8.0, 1.0, 1.0, 4.0, 0.0, 3.0, 1.0, 3.0, 1.0], "bins": [-18.98023796081543, -18.51675796508789, -18.05327796936035, -17.589797973632812, -17.126317977905273, -16.662837982177734, -16.199359893798828, -15.735878944396973, -15.27239990234375, -14.808919906616211, -14.345439910888672, -13.881959915161133, -13.41848087310791, -12.955000877380371, -12.491520881652832, -12.028040885925293, -11.564560890197754, -11.101080894470215, -10.637600898742676, -10.174121856689453, -9.710641860961914, -9.247161865234375, -8.783681869506836, -8.320201873779297, -7.856722354888916, -7.393242359161377, -6.929762840270996, -6.466282844543457, -6.002802848815918, -5.539323329925537, -5.075843334197998, -4.612363815307617, -4.148883819580078, -3.685404062271118, -3.221924304962158, -2.758444309234619, -2.294964551925659, -1.8314847946166992, -1.3680047988891602, -0.9045250415802002, -0.44104528427124023, 0.022434532642364502, 0.48591434955596924, 0.9493942260742188, 1.4128739833831787, 1.8763537406921387, 2.3398337364196777, 2.8033134937286377, 3.2667932510375977, 3.7302730083465576, 4.193752765655518, 4.657232761383057, 5.1207122802734375, 5.584192276000977, 6.047672271728516, 6.511152267456055, 6.9746317863464355, 7.438111782073975, 7.9015913009643555, 8.365071296691895, 8.828551292419434, 9.292030334472656, 9.755510330200195, 10.218990325927734, 10.682470321655273]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 1.0, 1.0, 3.0, 5.0, 4.0, 1.0, 3.0, 9.0, 10.0, 21.0, 15.0, 11.0, 16.0, 17.0, 23.0, 28.0, 27.0, 27.0, 32.0, 29.0, 37.0, 28.0, 35.0, 44.0, 36.0, 38.0, 43.0, 42.0, 41.0, 28.0, 36.0, 31.0, 32.0, 33.0, 25.0, 29.0, 29.0, 19.0, 14.0, 19.0, 12.0, 11.0, 14.0, 16.0, 12.0, 5.0, 4.0, 4.0, 5.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.138815402984619, -6.893415927886963, -6.648016929626465, -6.402617454528809, -6.157217979431152, -5.911818504333496, -5.66641902923584, -5.421020030975342, -5.1756205558776855, -4.930221080780029, -4.684822082519531, -4.439422607421875, -4.194023132324219, -3.9486236572265625, -3.7032244205474854, -3.457825183868408, -3.212425708770752, -2.9670262336730957, -2.7216269969940186, -2.4762277603149414, -2.230828285217285, -1.9854289293289185, -1.7400295734405518, -1.494630217552185, -1.2492308616638184, -1.0038315057754517, -0.758432149887085, -0.5130327939987183, -0.26763343811035156, -0.022234082221984863, 0.22316527366638184, 0.46856462955474854, 0.713963508605957, 0.9593628644943237, 1.2047622203826904, 1.4501615762710571, 1.6955609321594238, 1.9409602880477905, 2.1863596439361572, 2.4317588806152344, 2.6771583557128906, 2.922557830810547, 3.167957067489624, 3.413356304168701, 3.6587557792663574, 3.9041552543640137, 4.149554252624512, 4.394953727722168, 4.640353202819824, 4.8857526779174805, 5.131152153015137, 5.376551151275635, 5.621950626373291, 5.867350101470947, 6.112749099731445, 6.358148574829102, 6.603548049926758, 6.848947525024414, 7.09434700012207, 7.339745998382568, 7.585145473480225, 7.830544948577881, 8.075943946838379, 8.321343421936035, 8.566742897033691]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.weight": {"_type": "histogram", "values": [4.0, 1.0, 4.0, 3.0, 1.0, 13.0, 6.0, 13.0, 28.0, 29.0, 46.0, 69.0, 103.0, 162.0, 244.0, 339.0, 507.0, 773.0, 1215.0, 1866.0, 3026.0, 4780.0, 7550.0, 11820.0, 18677.0, 28825.0, 44325.0, 64865.0, 90200.0, 115120.0, 130975.0, 130598.0, 114964.0, 89974.0, 64487.0, 44104.0, 28647.0, 18278.0, 11701.0, 7190.0, 4637.0, 2927.0, 1990.0, 1193.0, 819.0, 515.0, 310.0, 233.0, 136.0, 72.0, 58.0, 63.0, 31.0, 17.0, 14.0, 9.0, 5.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0], "bins": [-7.72265625, -7.47344970703125, -7.2242431640625, -6.97503662109375, -6.725830078125, -6.47662353515625, -6.2274169921875, -5.97821044921875, -5.72900390625, -5.47979736328125, -5.2305908203125, -4.98138427734375, -4.732177734375, -4.48297119140625, -4.2337646484375, -3.98455810546875, -3.7353515625, -3.48614501953125, -3.2369384765625, -2.98773193359375, -2.738525390625, -2.48931884765625, -2.2401123046875, -1.99090576171875, -1.74169921875, -1.49249267578125, -1.2432861328125, -0.99407958984375, -0.744873046875, -0.49566650390625, -0.2464599609375, 0.00274658203125, 0.251953125, 0.50115966796875, 0.7503662109375, 0.99957275390625, 1.248779296875, 1.49798583984375, 1.7471923828125, 1.99639892578125, 2.24560546875, 2.49481201171875, 2.7440185546875, 2.99322509765625, 3.242431640625, 3.49163818359375, 3.7408447265625, 3.99005126953125, 4.2392578125, 4.48846435546875, 4.7376708984375, 4.98687744140625, 5.236083984375, 5.48529052734375, 5.7344970703125, 5.98370361328125, 6.23291015625, 6.48211669921875, 6.7313232421875, 6.98052978515625, 7.229736328125, 7.47894287109375, 7.7281494140625, 7.97735595703125, 8.2265625]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 2.0, 4.0, 3.0, 1.0, 4.0, 8.0, 9.0, 4.0, 9.0, 14.0, 18.0, 17.0, 23.0, 19.0, 28.0, 25.0, 37.0, 37.0, 35.0, 38.0, 37.0, 42.0, 50.0, 45.0, 39.0, 40.0, 35.0, 37.0, 38.0, 34.0, 32.0, 31.0, 25.0, 37.0, 32.0, 12.0, 23.0, 11.0, 7.0, 15.0, 10.0, 9.0, 16.0, 8.0, 5.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.76953125, -7.48419189453125, -7.1988525390625, -6.91351318359375, -6.628173828125, -6.34283447265625, -6.0574951171875, -5.77215576171875, -5.48681640625, -5.20147705078125, -4.9161376953125, -4.63079833984375, -4.345458984375, -4.06011962890625, -3.7747802734375, -3.48944091796875, -3.2041015625, -2.91876220703125, -2.6334228515625, -2.34808349609375, -2.062744140625, -1.77740478515625, -1.4920654296875, -1.20672607421875, -0.92138671875, -0.63604736328125, -0.3507080078125, -0.06536865234375, 0.219970703125, 0.50531005859375, 0.7906494140625, 1.07598876953125, 1.361328125, 1.64666748046875, 1.9320068359375, 2.21734619140625, 2.502685546875, 2.78802490234375, 3.0733642578125, 3.35870361328125, 3.64404296875, 3.92938232421875, 4.2147216796875, 4.50006103515625, 4.785400390625, 5.07073974609375, 5.3560791015625, 5.64141845703125, 5.9267578125, 6.21209716796875, 6.4974365234375, 6.78277587890625, 7.068115234375, 7.35345458984375, 7.6387939453125, 7.92413330078125, 8.20947265625, 8.49481201171875, 8.7801513671875, 9.06549072265625, 9.350830078125, 9.63616943359375, 9.9215087890625, 10.20684814453125, 10.4921875]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 2.0, 6.0, 4.0, 13.0, 20.0, 25.0, 31.0, 47.0, 67.0, 133.0, 177.0, 257.0, 455.0, 634.0, 1074.0, 1715.0, 2774.0, 4437.0, 7177.0, 11618.0, 18352.0, 29243.0, 44891.0, 66097.0, 91882.0, 115560.0, 131129.0, 131015.0, 115269.0, 90447.0, 64814.0, 43532.0, 28000.0, 17815.0, 11339.0, 6868.0, 4328.0, 2745.0, 1650.0, 1094.0, 659.0, 424.0, 271.0, 163.0, 100.0, 79.0, 41.0, 29.0, 23.0, 15.0, 7.0, 4.0, 4.0, 4.0, 6.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-7.17578125, -6.93634033203125, -6.6968994140625, -6.45745849609375, -6.218017578125, -5.97857666015625, -5.7391357421875, -5.49969482421875, -5.26025390625, -5.02081298828125, -4.7813720703125, -4.54193115234375, -4.302490234375, -4.06304931640625, -3.8236083984375, -3.58416748046875, -3.3447265625, -3.10528564453125, -2.8658447265625, -2.62640380859375, -2.386962890625, -2.14752197265625, -1.9080810546875, -1.66864013671875, -1.42919921875, -1.18975830078125, -0.9503173828125, -0.71087646484375, -0.471435546875, -0.23199462890625, 0.0074462890625, 0.24688720703125, 0.486328125, 0.72576904296875, 0.9652099609375, 1.20465087890625, 1.444091796875, 1.68353271484375, 1.9229736328125, 2.16241455078125, 2.40185546875, 2.64129638671875, 2.8807373046875, 3.12017822265625, 3.359619140625, 3.59906005859375, 3.8385009765625, 4.07794189453125, 4.3173828125, 4.55682373046875, 4.7962646484375, 5.03570556640625, 5.275146484375, 5.51458740234375, 5.7540283203125, 5.99346923828125, 6.23291015625, 6.47235107421875, 6.7117919921875, 6.95123291015625, 7.190673828125, 7.43011474609375, 7.6695556640625, 7.90899658203125, 8.1484375]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 3.0, 3.0, 5.0, 7.0, 10.0, 13.0, 15.0, 20.0, 16.0, 17.0, 24.0, 21.0, 20.0, 34.0, 33.0, 31.0, 43.0, 51.0, 38.0, 39.0, 33.0, 33.0, 51.0, 40.0, 29.0, 40.0, 39.0, 47.0, 37.0, 30.0, 15.0, 32.0, 24.0, 13.0, 18.0, 19.0, 12.0, 10.0, 6.0, 9.0, 9.0, 6.0, 1.0, 5.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-5.953125, -5.78228759765625, -5.6114501953125, -5.44061279296875, -5.269775390625, -5.09893798828125, -4.9281005859375, -4.75726318359375, -4.58642578125, -4.41558837890625, -4.2447509765625, -4.07391357421875, -3.903076171875, -3.73223876953125, -3.5614013671875, -3.39056396484375, -3.2197265625, -3.04888916015625, -2.8780517578125, -2.70721435546875, -2.536376953125, -2.36553955078125, -2.1947021484375, -2.02386474609375, -1.85302734375, -1.68218994140625, -1.5113525390625, -1.34051513671875, -1.169677734375, -0.99884033203125, -0.8280029296875, -0.65716552734375, -0.486328125, -0.31549072265625, -0.1446533203125, 0.02618408203125, 0.197021484375, 0.36785888671875, 0.5386962890625, 0.70953369140625, 0.88037109375, 1.05120849609375, 1.2220458984375, 1.39288330078125, 1.563720703125, 1.73455810546875, 1.9053955078125, 2.07623291015625, 2.2470703125, 2.41790771484375, 2.5887451171875, 2.75958251953125, 2.930419921875, 3.10125732421875, 3.2720947265625, 3.44293212890625, 3.61376953125, 3.78460693359375, 3.9554443359375, 4.12628173828125, 4.297119140625, 4.46795654296875, 4.6387939453125, 4.80963134765625, 4.98046875]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 0.0, 5.0, 4.0, 2.0, 5.0, 8.0, 10.0, 20.0, 14.0, 15.0, 28.0, 36.0, 39.0, 65.0, 84.0, 132.0, 234.0, 304.0, 529.0, 903.0, 1648.0, 2906.0, 5771.0, 11809.0, 24420.0, 50741.0, 99165.0, 167981.0, 218610.0, 197511.0, 128687.0, 69100.0, 34222.0, 16471.0, 7955.0, 4082.0, 2047.0, 1149.0, 650.0, 433.0, 262.0, 178.0, 98.0, 63.0, 45.0, 46.0, 28.0, 21.0, 13.0, 5.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0], "bins": [-6.73828125, -6.5115966796875, -6.284912109375, -6.0582275390625, -5.83154296875, -5.6048583984375, -5.378173828125, -5.1514892578125, -4.9248046875, -4.6981201171875, -4.471435546875, -4.2447509765625, -4.01806640625, -3.7913818359375, -3.564697265625, -3.3380126953125, -3.111328125, -2.8846435546875, -2.657958984375, -2.4312744140625, -2.20458984375, -1.9779052734375, -1.751220703125, -1.5245361328125, -1.2978515625, -1.0711669921875, -0.844482421875, -0.6177978515625, -0.39111328125, -0.1644287109375, 0.062255859375, 0.2889404296875, 0.515625, 0.7423095703125, 0.968994140625, 1.1956787109375, 1.42236328125, 1.6490478515625, 1.875732421875, 2.1024169921875, 2.3291015625, 2.5557861328125, 2.782470703125, 3.0091552734375, 3.23583984375, 3.4625244140625, 3.689208984375, 3.9158935546875, 4.142578125, 4.3692626953125, 4.595947265625, 4.8226318359375, 5.04931640625, 5.2760009765625, 5.502685546875, 5.7293701171875, 5.9560546875, 6.1827392578125, 6.409423828125, 6.6361083984375, 6.86279296875, 7.0894775390625, 7.316162109375, 7.5428466796875, 7.76953125]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 8.0, 4.0, 7.0, 11.0, 16.0, 18.0, 19.0, 28.0, 29.0, 34.0, 41.0, 59.0, 64.0, 75.0, 79.0, 61.0, 78.0, 73.0, 64.0, 57.0, 37.0, 33.0, 33.0, 15.0, 18.0, 18.0, 8.0, 8.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0006952285766601562, -0.0006729438900947571, -0.0006506592035293579, -0.0006283745169639587, -0.0006060898303985596, -0.0005838051438331604, -0.0005615204572677612, -0.0005392357707023621, -0.0005169510841369629, -0.0004946663975715637, -0.00047238171100616455, -0.0004500970244407654, -0.0004278123378753662, -0.00040552765130996704, -0.00038324296474456787, -0.0003609582781791687, -0.00033867359161376953, -0.00031638890504837036, -0.0002941042184829712, -0.000271819531917572, -0.00024953484535217285, -0.00022725015878677368, -0.0002049654722213745, -0.00018268078565597534, -0.00016039609909057617, -0.000138111412525177, -0.00011582672595977783, -9.354203939437866e-05, -7.125735282897949e-05, -4.897266626358032e-05, -2.6687979698181152e-05, -4.403293132781982e-06, 1.7881393432617188e-05, 4.016607999801636e-05, 6.245076656341553e-05, 8.47354531288147e-05, 0.00010702013969421387, 0.00012930482625961304, 0.0001515895128250122, 0.00017387419939041138, 0.00019615888595581055, 0.00021844357252120972, 0.0002407282590866089, 0.00026301294565200806, 0.0002852976322174072, 0.0003075823187828064, 0.00032986700534820557, 0.00035215169191360474, 0.0003744363784790039, 0.0003967210650444031, 0.00041900575160980225, 0.0004412904381752014, 0.0004635751247406006, 0.00048585981130599976, 0.0005081444978713989, 0.0005304291844367981, 0.0005527138710021973, 0.0005749985575675964, 0.0005972832441329956, 0.0006195679306983948, 0.0006418526172637939, 0.0006641373038291931, 0.0006864219903945923, 0.0007087066769599915, 0.0007309913635253906]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 2.0, 1.0, 6.0, 13.0, 20.0, 27.0, 30.0, 51.0, 83.0, 118.0, 193.0, 274.0, 398.0, 603.0, 977.0, 1544.0, 2517.0, 3984.0, 6473.0, 10454.0, 17504.0, 28930.0, 46310.0, 72148.0, 104409.0, 135975.0, 150571.0, 140769.0, 112131.0, 78440.0, 51382.0, 32022.0, 19490.0, 11823.0, 7090.0, 4300.0, 2705.0, 1647.0, 1129.0, 707.0, 448.0, 300.0, 204.0, 118.0, 74.0, 51.0, 42.0, 21.0, 18.0, 15.0, 7.0, 7.0, 3.0, 1.0, 4.0, 2.0], "bins": [-5.31640625, -5.16278076171875, -5.0091552734375, -4.85552978515625, -4.701904296875, -4.54827880859375, -4.3946533203125, -4.24102783203125, -4.08740234375, -3.93377685546875, -3.7801513671875, -3.62652587890625, -3.472900390625, -3.31927490234375, -3.1656494140625, -3.01202392578125, -2.8583984375, -2.70477294921875, -2.5511474609375, -2.39752197265625, -2.243896484375, -2.09027099609375, -1.9366455078125, -1.78302001953125, -1.62939453125, -1.47576904296875, -1.3221435546875, -1.16851806640625, -1.014892578125, -0.86126708984375, -0.7076416015625, -0.55401611328125, -0.400390625, -0.24676513671875, -0.0931396484375, 0.06048583984375, 0.214111328125, 0.36773681640625, 0.5213623046875, 0.67498779296875, 0.82861328125, 0.98223876953125, 1.1358642578125, 1.28948974609375, 1.443115234375, 1.59674072265625, 1.7503662109375, 1.90399169921875, 2.0576171875, 2.21124267578125, 2.3648681640625, 2.51849365234375, 2.672119140625, 2.82574462890625, 2.9793701171875, 3.13299560546875, 3.28662109375, 3.44024658203125, 3.5938720703125, 3.74749755859375, 3.901123046875, 4.05474853515625, 4.2083740234375, 4.36199951171875, 4.515625]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 5.0, 1.0, 1.0, 3.0, 6.0, 2.0, 7.0, 8.0, 10.0, 8.0, 12.0, 7.0, 24.0, 26.0, 24.0, 21.0, 22.0, 30.0, 26.0, 46.0, 43.0, 35.0, 54.0, 49.0, 51.0, 51.0, 44.0, 48.0, 56.0, 38.0, 31.0, 31.0, 30.0, 25.0, 25.0, 24.0, 11.0, 19.0, 15.0, 12.0, 5.0, 5.0, 4.0, 2.0, 2.0, 3.0, 4.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-1.4111328125, -1.3677978515625, -1.324462890625, -1.2811279296875, -1.23779296875, -1.1944580078125, -1.151123046875, -1.1077880859375, -1.064453125, -1.0211181640625, -0.977783203125, -0.9344482421875, -0.89111328125, -0.8477783203125, -0.804443359375, -0.7611083984375, -0.7177734375, -0.6744384765625, -0.631103515625, -0.5877685546875, -0.54443359375, -0.5010986328125, -0.457763671875, -0.4144287109375, -0.37109375, -0.3277587890625, -0.284423828125, -0.2410888671875, -0.19775390625, -0.1544189453125, -0.111083984375, -0.0677490234375, -0.0244140625, 0.0189208984375, 0.062255859375, 0.1055908203125, 0.14892578125, 0.1922607421875, 0.235595703125, 0.2789306640625, 0.322265625, 0.3656005859375, 0.408935546875, 0.4522705078125, 0.49560546875, 0.5389404296875, 0.582275390625, 0.6256103515625, 0.6689453125, 0.7122802734375, 0.755615234375, 0.7989501953125, 0.84228515625, 0.8856201171875, 0.928955078125, 0.9722900390625, 1.015625, 1.0589599609375, 1.102294921875, 1.1456298828125, 1.18896484375, 1.2322998046875, 1.275634765625, 1.3189697265625, 1.3623046875]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 8.0, 3.0, 10.0, 9.0, 7.0, 17.0, 15.0, 24.0, 24.0, 28.0, 30.0, 55.0, 43.0, 66.0, 62.0, 57.0, 67.0, 63.0, 67.0, 56.0, 51.0, 46.0, 42.0, 31.0, 34.0, 31.0, 12.0, 10.0, 13.0, 6.0, 9.0, 8.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0], "bins": [-18.98590087890625, -18.519433975219727, -18.052967071533203, -17.58650016784668, -17.120033264160156, -16.653568267822266, -16.187101364135742, -15.720634460449219, -15.254167556762695, -14.787700653076172, -14.321233749389648, -13.854767799377441, -13.388300895690918, -12.921833992004395, -12.455368041992188, -11.988901138305664, -11.52243423461914, -11.055967330932617, -10.589500427246094, -10.123034477233887, -9.656567573547363, -9.19010066986084, -8.723634719848633, -8.25716781616211, -7.790700912475586, -7.3242340087890625, -6.857767581939697, -6.391301155090332, -5.924834251403809, -5.458367347717285, -4.99190092086792, -4.525434494018555, -4.058968544006348, -3.5925018787384033, -3.126035213470459, -2.6595685482025146, -2.1931018829345703, -1.726635217666626, -1.2601685523986816, -0.7937018871307373, -0.32723522186279297, 0.13923144340515137, 0.6056981086730957, 1.07216477394104, 1.5386314392089844, 2.0050981044769287, 2.471564769744873, 2.9380314350128174, 3.4044981002807617, 3.870964765548706, 4.33743143081665, 4.803897857666016, 5.270364761352539, 5.7368316650390625, 6.203298091888428, 6.669764518737793, 7.136231422424316, 7.60269832611084, 8.069164276123047, 8.53563117980957, 9.002098083496094, 9.468564987182617, 9.93503189086914, 10.401497840881348, 10.867964744567871]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.bias": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 0.0, 2.0, 3.0, 3.0, 7.0, 4.0, 8.0, 3.0, 12.0, 6.0, 16.0, 15.0, 19.0, 18.0, 23.0, 20.0, 25.0, 29.0, 23.0, 25.0, 22.0, 24.0, 36.0, 27.0, 39.0, 18.0, 38.0, 32.0, 40.0, 43.0, 30.0, 37.0, 36.0, 34.0, 39.0, 35.0, 19.0, 29.0, 24.0, 12.0, 18.0, 12.0, 10.0, 13.0, 12.0, 13.0, 8.0, 7.0, 8.0, 5.0, 7.0, 8.0, 6.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-6.928583145141602, -6.702221393585205, -6.475859642028809, -6.24949836730957, -6.023136615753174, -5.796774864196777, -5.570413589477539, -5.344051837921143, -5.117690086364746, -4.89132833480835, -4.664966583251953, -4.438605308532715, -4.212243556976318, -3.985881805419922, -3.7595202922821045, -3.533158779144287, -3.3067970275878906, -3.080435276031494, -2.8540737628936768, -2.6277122497558594, -2.401350498199463, -2.1749887466430664, -1.948627233505249, -1.722265601158142, -1.4959039688110352, -1.2695423364639282, -1.0431807041168213, -0.8168190717697144, -0.5904574394226074, -0.3640958070755005, -0.13773417472839355, 0.08862745761871338, 0.3149886131286621, 0.541350245475769, 0.767711877822876, 0.9940735101699829, 1.2204351425170898, 1.4467967748641968, 1.6731584072113037, 1.8995200395584106, 2.1258816719055176, 2.352243423461914, 2.5786049365997314, 2.804966449737549, 3.0313282012939453, 3.257689952850342, 3.484051465988159, 3.7104129791259766, 3.936774730682373, 4.1631364822387695, 4.389497756958008, 4.615859508514404, 4.842221260070801, 5.068583011627197, 5.294944763183594, 5.521306037902832, 5.7476677894592285, 5.974029541015625, 6.200390815734863, 6.42675256729126, 6.653114318847656, 6.879476070404053, 7.105837821960449, 7.3321990966796875, 7.558560848236084]}, "gradients/decoder.bert.encoder.layer.14.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 5.0, 11.0, 19.0, 26.0, 62.0, 83.0, 146.0, 201.0, 317.0, 506.0, 770.0, 1155.0, 1918.0, 2986.0, 4679.0, 7598.0, 12349.0, 20368.0, 33665.0, 57572.0, 97036.0, 166491.0, 281999.0, 459854.0, 660067.0, 741428.0, 617114.0, 413542.0, 248466.0, 146026.0, 85811.0, 50658.0, 30278.0, 18782.0, 11447.0, 7345.0, 4635.0, 2895.0, 1917.0, 1326.0, 883.0, 595.0, 390.0, 278.0, 180.0, 130.0, 111.0, 53.0, 43.0, 16.0, 21.0, 16.0, 6.0, 7.0, 4.0, 3.0, 2.0], "bins": [-9.0703125, -8.790283203125, -8.51025390625, -8.230224609375, -7.9501953125, -7.670166015625, -7.39013671875, -7.110107421875, -6.830078125, -6.550048828125, -6.27001953125, -5.989990234375, -5.7099609375, -5.429931640625, -5.14990234375, -4.869873046875, -4.58984375, -4.309814453125, -4.02978515625, -3.749755859375, -3.4697265625, -3.189697265625, -2.90966796875, -2.629638671875, -2.349609375, -2.069580078125, -1.78955078125, -1.509521484375, -1.2294921875, -0.949462890625, -0.66943359375, -0.389404296875, -0.109375, 0.170654296875, 0.45068359375, 0.730712890625, 1.0107421875, 1.290771484375, 1.57080078125, 1.850830078125, 2.130859375, 2.410888671875, 2.69091796875, 2.970947265625, 3.2509765625, 3.531005859375, 3.81103515625, 4.091064453125, 4.37109375, 4.651123046875, 4.93115234375, 5.211181640625, 5.4912109375, 5.771240234375, 6.05126953125, 6.331298828125, 6.611328125, 6.891357421875, 7.17138671875, 7.451416015625, 7.7314453125, 8.011474609375, 8.29150390625, 8.571533203125, 8.8515625]}, "gradients/decoder.bert.encoder.layer.14.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 4.0, 4.0, 4.0, 5.0, 2.0, 13.0, 6.0, 14.0, 13.0, 23.0, 20.0, 17.0, 24.0, 21.0, 26.0, 29.0, 27.0, 28.0, 34.0, 34.0, 52.0, 38.0, 38.0, 42.0, 31.0, 26.0, 41.0, 40.0, 44.0, 35.0, 32.0, 21.0, 28.0, 33.0, 22.0, 17.0, 19.0, 12.0, 14.0, 7.0, 17.0, 7.0, 6.0, 12.0, 11.0, 4.0, 2.0, 5.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.70703125, -5.5330810546875, -5.359130859375, -5.1851806640625, -5.01123046875, -4.8372802734375, -4.663330078125, -4.4893798828125, -4.3154296875, -4.1414794921875, -3.967529296875, -3.7935791015625, -3.61962890625, -3.4456787109375, -3.271728515625, -3.0977783203125, -2.923828125, -2.7498779296875, -2.575927734375, -2.4019775390625, -2.22802734375, -2.0540771484375, -1.880126953125, -1.7061767578125, -1.5322265625, -1.3582763671875, -1.184326171875, -1.0103759765625, -0.83642578125, -0.6624755859375, -0.488525390625, -0.3145751953125, -0.140625, 0.0333251953125, 0.207275390625, 0.3812255859375, 0.55517578125, 0.7291259765625, 0.903076171875, 1.0770263671875, 1.2509765625, 1.4249267578125, 1.598876953125, 1.7728271484375, 1.94677734375, 2.1207275390625, 2.294677734375, 2.4686279296875, 2.642578125, 2.8165283203125, 2.990478515625, 3.1644287109375, 3.33837890625, 3.5123291015625, 3.686279296875, 3.8602294921875, 4.0341796875, 4.2081298828125, 4.382080078125, 4.5560302734375, 4.72998046875, 4.9039306640625, 5.077880859375, 5.2518310546875, 5.42578125]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 6.0, 7.0, 4.0, 5.0, 10.0, 15.0, 23.0, 37.0, 80.0, 93.0, 150.0, 245.0, 436.0, 775.0, 1279.0, 2287.0, 4196.0, 7695.0, 14286.0, 27384.0, 52523.0, 101871.0, 196513.0, 364689.0, 609789.0, 823043.0, 784743.0, 542389.0, 313660.0, 166020.0, 86119.0, 44318.0, 22715.0, 12096.0, 6494.0, 3550.0, 2015.0, 1119.0, 652.0, 370.0, 197.0, 138.0, 95.0, 58.0, 33.0, 18.0, 16.0, 12.0, 4.0, 9.0, 4.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-11.1015625, -10.741943359375, -10.38232421875, -10.022705078125, -9.6630859375, -9.303466796875, -8.94384765625, -8.584228515625, -8.224609375, -7.864990234375, -7.50537109375, -7.145751953125, -6.7861328125, -6.426513671875, -6.06689453125, -5.707275390625, -5.34765625, -4.988037109375, -4.62841796875, -4.268798828125, -3.9091796875, -3.549560546875, -3.18994140625, -2.830322265625, -2.470703125, -2.111083984375, -1.75146484375, -1.391845703125, -1.0322265625, -0.672607421875, -0.31298828125, 0.046630859375, 0.40625, 0.765869140625, 1.12548828125, 1.485107421875, 1.8447265625, 2.204345703125, 2.56396484375, 2.923583984375, 3.283203125, 3.642822265625, 4.00244140625, 4.362060546875, 4.7216796875, 5.081298828125, 5.44091796875, 5.800537109375, 6.16015625, 6.519775390625, 6.87939453125, 7.239013671875, 7.5986328125, 7.958251953125, 8.31787109375, 8.677490234375, 9.037109375, 9.396728515625, 9.75634765625, 10.115966796875, 10.4755859375, 10.835205078125, 11.19482421875, 11.554443359375, 11.9140625]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 4.0, 2.0, 6.0, 8.0, 12.0, 13.0, 17.0, 25.0, 17.0, 35.0, 48.0, 44.0, 62.0, 80.0, 91.0, 91.0, 108.0, 134.0, 157.0, 174.0, 202.0, 241.0, 176.0, 214.0, 232.0, 213.0, 204.0, 209.0, 215.0, 195.0, 150.0, 153.0, 99.0, 105.0, 69.0, 65.0, 47.0, 44.0, 26.0, 26.0, 20.0, 12.0, 12.0, 8.0, 5.0, 2.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-3.5703125, -3.469451904296875, -3.36859130859375, -3.267730712890625, -3.1668701171875, -3.066009521484375, -2.96514892578125, -2.864288330078125, -2.763427734375, -2.662567138671875, -2.56170654296875, -2.460845947265625, -2.3599853515625, -2.259124755859375, -2.15826416015625, -2.057403564453125, -1.95654296875, -1.855682373046875, -1.75482177734375, -1.653961181640625, -1.5531005859375, -1.452239990234375, -1.35137939453125, -1.250518798828125, -1.149658203125, -1.048797607421875, -0.94793701171875, -0.847076416015625, -0.7462158203125, -0.645355224609375, -0.54449462890625, -0.443634033203125, -0.3427734375, -0.241912841796875, -0.14105224609375, -0.040191650390625, 0.0606689453125, 0.161529541015625, 0.26239013671875, 0.363250732421875, 0.464111328125, 0.564971923828125, 0.66583251953125, 0.766693115234375, 0.8675537109375, 0.968414306640625, 1.06927490234375, 1.170135498046875, 1.27099609375, 1.371856689453125, 1.47271728515625, 1.573577880859375, 1.6744384765625, 1.775299072265625, 1.87615966796875, 1.977020263671875, 2.077880859375, 2.178741455078125, 2.27960205078125, 2.380462646484375, 2.4813232421875, 2.582183837890625, 2.68304443359375, 2.783905029296875, 2.884765625]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 7.0, 4.0, 5.0, 3.0, 10.0, 8.0, 17.0, 16.0, 14.0, 26.0, 39.0, 40.0, 32.0, 47.0, 49.0, 58.0, 67.0, 76.0, 58.0, 69.0, 58.0, 47.0, 39.0, 42.0, 42.0, 23.0, 19.0, 22.0, 19.0, 10.0, 11.0, 10.0, 7.0, 4.0, 1.0, 7.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.940284729003906, -13.529157638549805, -13.11803150177002, -12.706904411315918, -12.295777320861816, -11.884651184082031, -11.47352409362793, -11.062397003173828, -10.651270866394043, -10.240143775939941, -9.829017639160156, -9.417890548706055, -9.006763458251953, -8.595637321472168, -8.184510231018066, -7.773383617401123, -7.3622565269470215, -6.951129913330078, -6.540002822875977, -6.128876209259033, -5.71774959564209, -5.306622505187988, -4.895495891571045, -4.484369277954102, -4.0732421875, -3.6621153354644775, -3.250988721847534, -2.8398618698120117, -2.4287352561950684, -2.017608404159546, -1.6064815521240234, -1.19535493850708, -0.7842283248901367, -0.3731015622615814, 0.03802520036697388, 0.44915199279785156, 0.8602787256240845, 1.2714054584503174, 1.6825323104858398, 2.093658924102783, 2.5047857761383057, 2.915912628173828, 3.3270392417907715, 3.738166093826294, 4.149292945861816, 4.56041955947876, 4.971546173095703, 5.382673263549805, 5.793799877166748, 6.204926490783691, 6.616053581237793, 7.027180194854736, 7.43830680847168, 7.849433898925781, 8.260560989379883, 8.671687126159668, 9.08281421661377, 9.493941307067871, 9.905067443847656, 10.316194534301758, 10.72732162475586, 11.138447761535645, 11.549574851989746, 11.960700988769531, 12.371828079223633]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 8.0, 6.0, 12.0, 11.0, 16.0, 15.0, 14.0, 27.0, 18.0, 21.0, 25.0, 34.0, 28.0, 39.0, 44.0, 36.0, 37.0, 49.0, 42.0, 41.0, 35.0, 37.0, 50.0, 56.0, 35.0, 34.0, 32.0, 29.0, 26.0, 19.0, 20.0, 13.0, 15.0, 11.0, 17.0, 6.0, 5.0, 11.0, 7.0, 6.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.139094829559326, -6.903526782989502, -6.6679582595825195, -6.432390213012695, -6.196821689605713, -5.961253643035889, -5.725685119628906, -5.490117073059082, -5.254549026489258, -5.018980979919434, -4.783412456512451, -4.547844409942627, -4.3122758865356445, -4.07670783996582, -3.841139554977417, -3.6055712699890137, -3.3700027465820312, -3.134434461593628, -2.8988661766052246, -2.6632981300354004, -2.427729606628418, -2.1921615600585938, -1.9565932750701904, -1.721024990081787, -1.4854567050933838, -1.2498884201049805, -1.0143201351165771, -0.7787519693374634, -0.5431836843490601, -0.30761539936065674, -0.07204723358154297, 0.16352105140686035, 0.39908885955810547, 0.6346571445465088, 0.8702253699302673, 1.1057935953140259, 1.3413618803024292, 1.5769301652908325, 1.8124983310699463, 2.0480666160583496, 2.283634901046753, 2.5192031860351562, 2.7547714710235596, 2.990339756011963, 3.225907802581787, 3.4614763259887695, 3.6970443725585938, 3.932612657546997, 4.1681809425354, 4.403748989105225, 4.639317512512207, 4.874885559082031, 5.110454082489014, 5.346022129058838, 5.58159065246582, 5.8171586990356445, 6.052726745605469, 6.288294792175293, 6.523863315582275, 6.7594313621521, 6.994999885559082, 7.230567932128906, 7.4661359786987305, 7.701704502105713, 7.937273025512695]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 5.0, 5.0, 8.0, 12.0, 14.0, 22.0, 32.0, 42.0, 68.0, 84.0, 132.0, 194.0, 303.0, 384.0, 579.0, 824.0, 1337.0, 1889.0, 3136.0, 5131.0, 8618.0, 14522.0, 25898.0, 45253.0, 76911.0, 120279.0, 162969.0, 176781.0, 148956.0, 102950.0, 62866.0, 36458.0, 20691.0, 12143.0, 7073.0, 4300.0, 2646.0, 1649.0, 1058.0, 708.0, 500.0, 306.0, 240.0, 176.0, 112.0, 86.0, 64.0, 40.0, 36.0, 27.0, 13.0, 18.0, 4.0, 4.0, 2.0, 6.0, 2.0, 1.0, 0.0, 3.0], "bins": [-4.96484375, -4.8062744140625, -4.647705078125, -4.4891357421875, -4.33056640625, -4.1719970703125, -4.013427734375, -3.8548583984375, -3.6962890625, -3.5377197265625, -3.379150390625, -3.2205810546875, -3.06201171875, -2.9034423828125, -2.744873046875, -2.5863037109375, -2.427734375, -2.2691650390625, -2.110595703125, -1.9520263671875, -1.79345703125, -1.6348876953125, -1.476318359375, -1.3177490234375, -1.1591796875, -1.0006103515625, -0.842041015625, -0.6834716796875, -0.52490234375, -0.3663330078125, -0.207763671875, -0.0491943359375, 0.109375, 0.2679443359375, 0.426513671875, 0.5850830078125, 0.74365234375, 0.9022216796875, 1.060791015625, 1.2193603515625, 1.3779296875, 1.5364990234375, 1.695068359375, 1.8536376953125, 2.01220703125, 2.1707763671875, 2.329345703125, 2.4879150390625, 2.646484375, 2.8050537109375, 2.963623046875, 3.1221923828125, 3.28076171875, 3.4393310546875, 3.597900390625, 3.7564697265625, 3.9150390625, 4.0736083984375, 4.232177734375, 4.3907470703125, 4.54931640625, 4.7078857421875, 4.866455078125, 5.0250244140625, 5.18359375]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 6.0, 4.0, 5.0, 9.0, 11.0, 9.0, 13.0, 10.0, 15.0, 18.0, 21.0, 26.0, 30.0, 41.0, 36.0, 38.0, 54.0, 47.0, 52.0, 43.0, 47.0, 50.0, 46.0, 52.0, 43.0, 29.0, 48.0, 28.0, 29.0, 20.0, 21.0, 23.0, 15.0, 17.0, 6.0, 9.0, 9.0, 9.0, 3.0, 7.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.8203125, -8.5372314453125, -8.254150390625, -7.9710693359375, -7.68798828125, -7.4049072265625, -7.121826171875, -6.8387451171875, -6.5556640625, -6.2725830078125, -5.989501953125, -5.7064208984375, -5.42333984375, -5.1402587890625, -4.857177734375, -4.5740966796875, -4.291015625, -4.0079345703125, -3.724853515625, -3.4417724609375, -3.15869140625, -2.8756103515625, -2.592529296875, -2.3094482421875, -2.0263671875, -1.7432861328125, -1.460205078125, -1.1771240234375, -0.89404296875, -0.6109619140625, -0.327880859375, -0.0447998046875, 0.23828125, 0.5213623046875, 0.804443359375, 1.0875244140625, 1.37060546875, 1.6536865234375, 1.936767578125, 2.2198486328125, 2.5029296875, 2.7860107421875, 3.069091796875, 3.3521728515625, 3.63525390625, 3.9183349609375, 4.201416015625, 4.4844970703125, 4.767578125, 5.0506591796875, 5.333740234375, 5.6168212890625, 5.89990234375, 6.1829833984375, 6.466064453125, 6.7491455078125, 7.0322265625, 7.3153076171875, 7.598388671875, 7.8814697265625, 8.16455078125, 8.4476318359375, 8.730712890625, 9.0137939453125, 9.296875]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 6.0, 10.0, 8.0, 18.0, 22.0, 20.0, 29.0, 54.0, 70.0, 88.0, 105.0, 202.0, 278.0, 444.0, 759.0, 1307.0, 2399.0, 4501.0, 9048.0, 19501.0, 43399.0, 97719.0, 205267.0, 287462.0, 200178.0, 95401.0, 42320.0, 18931.0, 8930.0, 4421.0, 2333.0, 1287.0, 760.0, 389.0, 260.0, 192.0, 121.0, 88.0, 74.0, 35.0, 30.0, 24.0, 20.0, 13.0, 15.0, 4.0, 7.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 3.0], "bins": [-9.1953125, -8.920654296875, -8.64599609375, -8.371337890625, -8.0966796875, -7.822021484375, -7.54736328125, -7.272705078125, -6.998046875, -6.723388671875, -6.44873046875, -6.174072265625, -5.8994140625, -5.624755859375, -5.35009765625, -5.075439453125, -4.80078125, -4.526123046875, -4.25146484375, -3.976806640625, -3.7021484375, -3.427490234375, -3.15283203125, -2.878173828125, -2.603515625, -2.328857421875, -2.05419921875, -1.779541015625, -1.5048828125, -1.230224609375, -0.95556640625, -0.680908203125, -0.40625, -0.131591796875, 0.14306640625, 0.417724609375, 0.6923828125, 0.967041015625, 1.24169921875, 1.516357421875, 1.791015625, 2.065673828125, 2.34033203125, 2.614990234375, 2.8896484375, 3.164306640625, 3.43896484375, 3.713623046875, 3.98828125, 4.262939453125, 4.53759765625, 4.812255859375, 5.0869140625, 5.361572265625, 5.63623046875, 5.910888671875, 6.185546875, 6.460205078125, 6.73486328125, 7.009521484375, 7.2841796875, 7.558837890625, 7.83349609375, 8.108154296875, 8.3828125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 3.0, 1.0, 4.0, 3.0, 2.0, 9.0, 8.0, 9.0, 9.0, 9.0, 13.0, 20.0, 22.0, 24.0, 29.0, 33.0, 31.0, 28.0, 39.0, 41.0, 23.0, 48.0, 42.0, 39.0, 59.0, 37.0, 33.0, 44.0, 41.0, 32.0, 27.0, 36.0, 35.0, 22.0, 22.0, 18.0, 15.0, 17.0, 10.0, 11.0, 17.0, 12.0, 9.0, 4.0, 8.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.78515625, -4.63677978515625, -4.4884033203125, -4.34002685546875, -4.191650390625, -4.04327392578125, -3.8948974609375, -3.74652099609375, -3.59814453125, -3.44976806640625, -3.3013916015625, -3.15301513671875, -3.004638671875, -2.85626220703125, -2.7078857421875, -2.55950927734375, -2.4111328125, -2.26275634765625, -2.1143798828125, -1.96600341796875, -1.817626953125, -1.66925048828125, -1.5208740234375, -1.37249755859375, -1.22412109375, -1.07574462890625, -0.9273681640625, -0.77899169921875, -0.630615234375, -0.48223876953125, -0.3338623046875, -0.18548583984375, -0.037109375, 0.11126708984375, 0.2596435546875, 0.40802001953125, 0.556396484375, 0.70477294921875, 0.8531494140625, 1.00152587890625, 1.14990234375, 1.29827880859375, 1.4466552734375, 1.59503173828125, 1.743408203125, 1.89178466796875, 2.0401611328125, 2.18853759765625, 2.3369140625, 2.48529052734375, 2.6336669921875, 2.78204345703125, 2.930419921875, 3.07879638671875, 3.2271728515625, 3.37554931640625, 3.52392578125, 3.67230224609375, 3.8206787109375, 3.96905517578125, 4.117431640625, 4.26580810546875, 4.4141845703125, 4.56256103515625, 4.7109375]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 6.0, 18.0, 15.0, 25.0, 39.0, 55.0, 82.0, 152.0, 228.0, 327.0, 555.0, 865.0, 1370.0, 2219.0, 3477.0, 5655.0, 9406.0, 15627.0, 26624.0, 44688.0, 76406.0, 124199.0, 179110.0, 192496.0, 142902.0, 89957.0, 53642.0, 31530.0, 18353.0, 10845.0, 6743.0, 4115.0, 2541.0, 1515.0, 975.0, 607.0, 433.0, 274.0, 177.0, 104.0, 82.0, 48.0, 29.0, 17.0, 9.0, 7.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.359375, -2.283660888671875, -2.20794677734375, -2.132232666015625, -2.0565185546875, -1.980804443359375, -1.90509033203125, -1.829376220703125, -1.753662109375, -1.677947998046875, -1.60223388671875, -1.526519775390625, -1.4508056640625, -1.375091552734375, -1.29937744140625, -1.223663330078125, -1.14794921875, -1.072235107421875, -0.99652099609375, -0.920806884765625, -0.8450927734375, -0.769378662109375, -0.69366455078125, -0.617950439453125, -0.542236328125, -0.466522216796875, -0.39080810546875, -0.315093994140625, -0.2393798828125, -0.163665771484375, -0.08795166015625, -0.012237548828125, 0.0634765625, 0.139190673828125, 0.21490478515625, 0.290618896484375, 0.3663330078125, 0.442047119140625, 0.51776123046875, 0.593475341796875, 0.669189453125, 0.744903564453125, 0.82061767578125, 0.896331787109375, 0.9720458984375, 1.047760009765625, 1.12347412109375, 1.199188232421875, 1.27490234375, 1.350616455078125, 1.42633056640625, 1.502044677734375, 1.5777587890625, 1.653472900390625, 1.72918701171875, 1.804901123046875, 1.880615234375, 1.956329345703125, 2.03204345703125, 2.107757568359375, 2.1834716796875, 2.259185791015625, 2.33489990234375, 2.410614013671875, 2.486328125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 5.0, 9.0, 7.0, 3.0, 8.0, 12.0, 16.0, 20.0, 13.0, 22.0, 15.0, 35.0, 43.0, 28.0, 54.0, 54.0, 45.0, 59.0, 60.0, 56.0, 63.0, 59.0, 56.0, 47.0, 33.0, 39.0, 23.0, 28.0, 12.0, 14.0, 17.0, 5.0, 10.0, 8.0, 3.0, 8.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012183189392089844, -0.00011802557855844498, -0.00011421926319599152, -0.00011041294783353806, -0.0001066066324710846, -0.00010280031710863113, -9.899400174617767e-05, -9.518768638372421e-05, -9.138137102127075e-05, -8.757505565881729e-05, -8.376874029636383e-05, -7.996242493391037e-05, -7.615610957145691e-05, -7.234979420900345e-05, -6.854347884654999e-05, -6.473716348409653e-05, -6.0930848121643066e-05, -5.7124532759189606e-05, -5.3318217396736145e-05, -4.9511902034282684e-05, -4.5705586671829224e-05, -4.189927130937576e-05, -3.80929559469223e-05, -3.428664058446884e-05, -3.048032522201538e-05, -2.667400985956192e-05, -2.286769449710846e-05, -1.9061379134655e-05, -1.5255063772201538e-05, -1.1448748409748077e-05, -7.642433047294617e-06, -3.836117684841156e-06, -2.9802322387695312e-08, 3.7765130400657654e-06, 7.582828402519226e-06, 1.1389143764972687e-05, 1.5195459127426147e-05, 1.9001774489879608e-05, 2.280808985233307e-05, 2.661440521478653e-05, 3.042072057723999e-05, 3.422703593969345e-05, 3.803335130214691e-05, 4.183966666460037e-05, 4.564598202705383e-05, 4.9452297389507294e-05, 5.3258612751960754e-05, 5.7064928114414215e-05, 6.0871243476867676e-05, 6.467755883932114e-05, 6.84838742017746e-05, 7.229018956422806e-05, 7.609650492668152e-05, 7.990282028913498e-05, 8.370913565158844e-05, 8.75154510140419e-05, 9.132176637649536e-05, 9.512808173894882e-05, 9.893439710140228e-05, 0.00010274071246385574, 0.0001065470278263092, 0.00011035334318876266, 0.00011415965855121613, 0.00011796597391366959, 0.00012177228927612305]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 5.0, 4.0, 3.0, 7.0, 11.0, 23.0, 26.0, 40.0, 89.0, 103.0, 193.0, 328.0, 544.0, 909.0, 1442.0, 2696.0, 4702.0, 8381.0, 15087.0, 27087.0, 47892.0, 80496.0, 124521.0, 166484.0, 176293.0, 146771.0, 101121.0, 61908.0, 35734.0, 19760.0, 11192.0, 6283.0, 3451.0, 1989.0, 1192.0, 726.0, 427.0, 254.0, 152.0, 81.0, 52.0, 36.0, 26.0, 18.0, 11.0, 4.0, 4.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.509765625, -2.43426513671875, -2.3587646484375, -2.28326416015625, -2.207763671875, -2.13226318359375, -2.0567626953125, -1.98126220703125, -1.90576171875, -1.83026123046875, -1.7547607421875, -1.67926025390625, -1.603759765625, -1.52825927734375, -1.4527587890625, -1.37725830078125, -1.3017578125, -1.22625732421875, -1.1507568359375, -1.07525634765625, -0.999755859375, -0.92425537109375, -0.8487548828125, -0.77325439453125, -0.69775390625, -0.62225341796875, -0.5467529296875, -0.47125244140625, -0.395751953125, -0.32025146484375, -0.2447509765625, -0.16925048828125, -0.09375, -0.01824951171875, 0.0572509765625, 0.13275146484375, 0.208251953125, 0.28375244140625, 0.3592529296875, 0.43475341796875, 0.51025390625, 0.58575439453125, 0.6612548828125, 0.73675537109375, 0.812255859375, 0.88775634765625, 0.9632568359375, 1.03875732421875, 1.1142578125, 1.18975830078125, 1.2652587890625, 1.34075927734375, 1.416259765625, 1.49176025390625, 1.5672607421875, 1.64276123046875, 1.71826171875, 1.79376220703125, 1.8692626953125, 1.94476318359375, 2.020263671875, 2.09576416015625, 2.1712646484375, 2.24676513671875, 2.322265625]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 6.0, 4.0, 2.0, 3.0, 6.0, 9.0, 14.0, 8.0, 15.0, 16.0, 32.0, 23.0, 16.0, 24.0, 36.0, 23.0, 44.0, 52.0, 47.0, 49.0, 61.0, 62.0, 58.0, 43.0, 54.0, 36.0, 38.0, 29.0, 22.0, 34.0, 26.0, 14.0, 22.0, 16.0, 10.0, 8.0, 8.0, 9.0, 4.0, 5.0, 6.0, 6.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5888671875, -0.568603515625, -0.54833984375, -0.528076171875, -0.5078125, -0.487548828125, -0.46728515625, -0.447021484375, -0.4267578125, -0.406494140625, -0.38623046875, -0.365966796875, -0.345703125, -0.325439453125, -0.30517578125, -0.284912109375, -0.2646484375, -0.244384765625, -0.22412109375, -0.203857421875, -0.18359375, -0.163330078125, -0.14306640625, -0.122802734375, -0.1025390625, -0.082275390625, -0.06201171875, -0.041748046875, -0.021484375, -0.001220703125, 0.01904296875, 0.039306640625, 0.0595703125, 0.079833984375, 0.10009765625, 0.120361328125, 0.140625, 0.160888671875, 0.18115234375, 0.201416015625, 0.2216796875, 0.241943359375, 0.26220703125, 0.282470703125, 0.302734375, 0.322998046875, 0.34326171875, 0.363525390625, 0.3837890625, 0.404052734375, 0.42431640625, 0.444580078125, 0.46484375, 0.485107421875, 0.50537109375, 0.525634765625, 0.5458984375, 0.566162109375, 0.58642578125, 0.606689453125, 0.626953125, 0.647216796875, 0.66748046875, 0.687744140625, 0.7080078125]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 4.0, 3.0, 10.0, 13.0, 14.0, 17.0, 15.0, 25.0, 31.0, 31.0, 36.0, 40.0, 60.0, 51.0, 59.0, 72.0, 59.0, 63.0, 69.0, 55.0, 43.0, 42.0, 37.0, 28.0, 25.0, 24.0, 15.0, 15.0, 12.0, 11.0, 7.0, 2.0, 1.0, 9.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.246387481689453, -13.84239387512207, -13.438399314880371, -13.034405708312988, -12.630411148071289, -12.226417541503906, -11.822423934936523, -11.418429374694824, -11.014434814453125, -10.610441207885742, -10.206446647644043, -9.80245304107666, -9.398458480834961, -8.994464874267578, -8.590471267700195, -8.186476707458496, -7.782483100891113, -7.378489017486572, -6.974494934082031, -6.570501327514648, -6.166506767272949, -5.762513160705566, -5.358519077301025, -4.954524993896484, -4.550530910491943, -4.146536827087402, -3.7425427436828613, -3.3385488986968994, -2.9345548152923584, -2.5305607318878174, -2.1265668869018555, -1.7225728034973145, -1.318577766418457, -0.9145837426185608, -0.5105897188186646, -0.10659575462341309, 0.29739832878112793, 0.701392412185669, 1.1053862571716309, 1.5093803405761719, 1.913374423980713, 2.317368507385254, 2.721362590789795, 3.125356435775757, 3.529350519180298, 3.933344602584839, 4.337338447570801, 4.741332530975342, 5.145326614379883, 5.549320697784424, 5.953314781188965, 6.357308387756348, 6.761302947998047, 7.16529655456543, 7.569290637969971, 7.973284721374512, 8.377279281616211, 8.781272888183594, 9.185267448425293, 9.589261054992676, 9.993255615234375, 10.397249221801758, 10.80124282836914, 11.20523738861084, 11.609230995178223]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 3.0, 8.0, 10.0, 7.0, 11.0, 15.0, 13.0, 14.0, 24.0, 28.0, 15.0, 23.0, 29.0, 38.0, 28.0, 44.0, 37.0, 34.0, 44.0, 46.0, 36.0, 48.0, 37.0, 47.0, 49.0, 46.0, 36.0, 26.0, 31.0, 23.0, 25.0, 21.0, 12.0, 15.0, 18.0, 10.0, 10.0, 7.0, 7.0, 8.0, 8.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.174775123596191, -6.940577030181885, -6.70637845993042, -6.472180366516113, -6.237981796264648, -6.003783702850342, -5.769585609436035, -5.53538703918457, -5.3011884689331055, -5.066990375518799, -4.832791805267334, -4.598593711853027, -4.3643951416015625, -4.130197048187256, -3.89599871635437, -3.6618003845214844, -3.4276022911071777, -3.193403959274292, -2.9592056274414062, -2.7250075340270996, -2.4908089637756348, -2.256610870361328, -2.0224125385284424, -1.7882142066955566, -1.554015874862671, -1.3198175430297852, -1.0856192111968994, -0.8514209985733032, -0.6172226667404175, -0.38302433490753174, -0.14882612228393555, 0.0853722095489502, 0.31957101821899414, 0.5537693500518799, 0.7879676222801208, 1.0221658945083618, 1.2563642263412476, 1.4905625581741333, 1.7247607707977295, 1.9589591026306152, 2.193157434463501, 2.4273557662963867, 2.6615540981292725, 2.895752429962158, 3.129950523376465, 3.3641490936279297, 3.5983471870422363, 3.832545518875122, 4.066743850708008, 4.3009419441223145, 4.535140514373779, 4.769338607788086, 5.003537178039551, 5.237735271453857, 5.471933364868164, 5.706131935119629, 5.940330505371094, 6.1745285987854, 6.408727169036865, 6.642925262451172, 6.877123832702637, 7.111321926116943, 7.34552001953125, 7.579718589782715, 7.8139166831970215]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 5.0, 4.0, 15.0, 15.0, 28.0, 25.0, 39.0, 70.0, 85.0, 123.0, 190.0, 281.0, 385.0, 598.0, 937.0, 1482.0, 2294.0, 3858.0, 6574.0, 11296.0, 19405.0, 32995.0, 54846.0, 86527.0, 123113.0, 151909.0, 156515.0, 135331.0, 98698.0, 64921.0, 39188.0, 23345.0, 13239.0, 7778.0, 4654.0, 2769.0, 1796.0, 1124.0, 702.0, 461.0, 299.0, 207.0, 137.0, 80.0, 72.0, 43.0, 33.0, 27.0, 13.0, 16.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-8.1484375, -7.8951416015625, -7.641845703125, -7.3885498046875, -7.13525390625, -6.8819580078125, -6.628662109375, -6.3753662109375, -6.1220703125, -5.8687744140625, -5.615478515625, -5.3621826171875, -5.10888671875, -4.8555908203125, -4.602294921875, -4.3489990234375, -4.095703125, -3.8424072265625, -3.589111328125, -3.3358154296875, -3.08251953125, -2.8292236328125, -2.575927734375, -2.3226318359375, -2.0693359375, -1.8160400390625, -1.562744140625, -1.3094482421875, -1.05615234375, -0.8028564453125, -0.549560546875, -0.2962646484375, -0.04296875, 0.2103271484375, 0.463623046875, 0.7169189453125, 0.97021484375, 1.2235107421875, 1.476806640625, 1.7301025390625, 1.9833984375, 2.2366943359375, 2.489990234375, 2.7432861328125, 2.99658203125, 3.2498779296875, 3.503173828125, 3.7564697265625, 4.009765625, 4.2630615234375, 4.516357421875, 4.7696533203125, 5.02294921875, 5.2762451171875, 5.529541015625, 5.7828369140625, 6.0361328125, 6.2894287109375, 6.542724609375, 6.7960205078125, 7.04931640625, 7.3026123046875, 7.555908203125, 7.8092041015625, 8.0625]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 2.0, 1.0, 2.0, 7.0, 4.0, 9.0, 8.0, 12.0, 11.0, 17.0, 20.0, 41.0, 25.0, 33.0, 31.0, 28.0, 33.0, 30.0, 32.0, 49.0, 33.0, 38.0, 47.0, 48.0, 55.0, 44.0, 38.0, 40.0, 42.0, 37.0, 33.0, 26.0, 20.0, 18.0, 19.0, 13.0, 17.0, 8.0, 9.0, 10.0, 7.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.0078125, -7.7337646484375, -7.459716796875, -7.1856689453125, -6.91162109375, -6.6375732421875, -6.363525390625, -6.0894775390625, -5.8154296875, -5.5413818359375, -5.267333984375, -4.9932861328125, -4.71923828125, -4.4451904296875, -4.171142578125, -3.8970947265625, -3.623046875, -3.3489990234375, -3.074951171875, -2.8009033203125, -2.52685546875, -2.2528076171875, -1.978759765625, -1.7047119140625, -1.4306640625, -1.1566162109375, -0.882568359375, -0.6085205078125, -0.33447265625, -0.0604248046875, 0.213623046875, 0.4876708984375, 0.76171875, 1.0357666015625, 1.309814453125, 1.5838623046875, 1.85791015625, 2.1319580078125, 2.406005859375, 2.6800537109375, 2.9541015625, 3.2281494140625, 3.502197265625, 3.7762451171875, 4.05029296875, 4.3243408203125, 4.598388671875, 4.8724365234375, 5.146484375, 5.4205322265625, 5.694580078125, 5.9686279296875, 6.24267578125, 6.5167236328125, 6.790771484375, 7.0648193359375, 7.3388671875, 7.6129150390625, 7.886962890625, 8.1610107421875, 8.43505859375, 8.7091064453125, 8.983154296875, 9.2572021484375, 9.53125]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 6.0, 7.0, 26.0, 20.0, 25.0, 40.0, 64.0, 76.0, 144.0, 211.0, 264.0, 453.0, 676.0, 1002.0, 1764.0, 3036.0, 5662.0, 11066.0, 22429.0, 44044.0, 82641.0, 136404.0, 186678.0, 194450.0, 152652.0, 95703.0, 53097.0, 26515.0, 13419.0, 6847.0, 3670.0, 2048.0, 1180.0, 783.0, 490.0, 340.0, 186.0, 130.0, 94.0, 62.0, 44.0, 32.0, 21.0, 14.0, 17.0, 8.0, 5.0, 6.0, 7.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-9.859375, -9.542724609375, -9.22607421875, -8.909423828125, -8.5927734375, -8.276123046875, -7.95947265625, -7.642822265625, -7.326171875, -7.009521484375, -6.69287109375, -6.376220703125, -6.0595703125, -5.742919921875, -5.42626953125, -5.109619140625, -4.79296875, -4.476318359375, -4.15966796875, -3.843017578125, -3.5263671875, -3.209716796875, -2.89306640625, -2.576416015625, -2.259765625, -1.943115234375, -1.62646484375, -1.309814453125, -0.9931640625, -0.676513671875, -0.35986328125, -0.043212890625, 0.2734375, 0.590087890625, 0.90673828125, 1.223388671875, 1.5400390625, 1.856689453125, 2.17333984375, 2.489990234375, 2.806640625, 3.123291015625, 3.43994140625, 3.756591796875, 4.0732421875, 4.389892578125, 4.70654296875, 5.023193359375, 5.33984375, 5.656494140625, 5.97314453125, 6.289794921875, 6.6064453125, 6.923095703125, 7.23974609375, 7.556396484375, 7.873046875, 8.189697265625, 8.50634765625, 8.822998046875, 9.1396484375, 9.456298828125, 9.77294921875, 10.089599609375, 10.40625]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 5.0, 3.0, 12.0, 5.0, 9.0, 11.0, 14.0, 20.0, 17.0, 19.0, 14.0, 29.0, 31.0, 28.0, 40.0, 39.0, 41.0, 50.0, 47.0, 42.0, 36.0, 48.0, 39.0, 46.0, 38.0, 48.0, 32.0, 39.0, 34.0, 27.0, 17.0, 23.0, 18.0, 17.0, 16.0, 13.0, 9.0, 9.0, 5.0, 7.0, 1.0, 4.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.359375, -5.18548583984375, -5.0115966796875, -4.83770751953125, -4.663818359375, -4.48992919921875, -4.3160400390625, -4.14215087890625, -3.96826171875, -3.79437255859375, -3.6204833984375, -3.44659423828125, -3.272705078125, -3.09881591796875, -2.9249267578125, -2.75103759765625, -2.5771484375, -2.40325927734375, -2.2293701171875, -2.05548095703125, -1.881591796875, -1.70770263671875, -1.5338134765625, -1.35992431640625, -1.18603515625, -1.01214599609375, -0.8382568359375, -0.66436767578125, -0.490478515625, -0.31658935546875, -0.1427001953125, 0.03118896484375, 0.205078125, 0.37896728515625, 0.5528564453125, 0.72674560546875, 0.900634765625, 1.07452392578125, 1.2484130859375, 1.42230224609375, 1.59619140625, 1.77008056640625, 1.9439697265625, 2.11785888671875, 2.291748046875, 2.46563720703125, 2.6395263671875, 2.81341552734375, 2.9873046875, 3.16119384765625, 3.3350830078125, 3.50897216796875, 3.682861328125, 3.85675048828125, 4.0306396484375, 4.20452880859375, 4.37841796875, 4.55230712890625, 4.7261962890625, 4.90008544921875, 5.073974609375, 5.24786376953125, 5.4217529296875, 5.59564208984375, 5.76953125]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 5.0, 12.0, 9.0, 18.0, 30.0, 33.0, 70.0, 118.0, 171.0, 246.0, 422.0, 750.0, 1231.0, 2067.0, 3607.0, 6634.0, 12074.0, 22284.0, 41297.0, 74463.0, 123128.0, 174304.0, 191469.0, 156910.0, 103657.0, 60325.0, 33223.0, 17823.0, 9867.0, 5203.0, 2966.0, 1626.0, 995.0, 555.0, 370.0, 222.0, 143.0, 92.0, 51.0, 34.0, 18.0, 10.0, 7.0, 6.0, 6.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.81640625, -5.64691162109375, -5.4774169921875, -5.30792236328125, -5.138427734375, -4.96893310546875, -4.7994384765625, -4.62994384765625, -4.46044921875, -4.29095458984375, -4.1214599609375, -3.95196533203125, -3.782470703125, -3.61297607421875, -3.4434814453125, -3.27398681640625, -3.1044921875, -2.93499755859375, -2.7655029296875, -2.59600830078125, -2.426513671875, -2.25701904296875, -2.0875244140625, -1.91802978515625, -1.74853515625, -1.57904052734375, -1.4095458984375, -1.24005126953125, -1.070556640625, -0.90106201171875, -0.7315673828125, -0.56207275390625, -0.392578125, -0.22308349609375, -0.0535888671875, 0.11590576171875, 0.285400390625, 0.45489501953125, 0.6243896484375, 0.79388427734375, 0.96337890625, 1.13287353515625, 1.3023681640625, 1.47186279296875, 1.641357421875, 1.81085205078125, 1.9803466796875, 2.14984130859375, 2.3193359375, 2.48883056640625, 2.6583251953125, 2.82781982421875, 2.997314453125, 3.16680908203125, 3.3363037109375, 3.50579833984375, 3.67529296875, 3.84478759765625, 4.0142822265625, 4.18377685546875, 4.353271484375, 4.52276611328125, 4.6922607421875, 4.86175537109375, 5.03125]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 3.0, 8.0, 5.0, 16.0, 14.0, 18.0, 30.0, 28.0, 45.0, 50.0, 68.0, 73.0, 79.0, 72.0, 65.0, 87.0, 58.0, 57.0, 52.0, 50.0, 32.0, 30.0, 21.0, 10.0, 10.0, 4.0, 5.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0005006790161132812, -0.00047975778579711914, -0.00045883655548095703, -0.0004379153251647949, -0.0004169940948486328, -0.0003960728645324707, -0.0003751516342163086, -0.0003542304039001465, -0.0003333091735839844, -0.00031238794326782227, -0.00029146671295166016, -0.00027054548263549805, -0.00024962425231933594, -0.00022870302200317383, -0.00020778179168701172, -0.0001868605613708496, -0.0001659393310546875, -0.0001450181007385254, -0.00012409687042236328, -0.00010317564010620117, -8.225440979003906e-05, -6.133317947387695e-05, -4.0411949157714844e-05, -1.9490718841552734e-05, 1.430511474609375e-06, 2.2351741790771484e-05, 4.3272972106933594e-05, 6.41942024230957e-05, 8.511543273925781e-05, 0.00010603666305541992, 0.00012695789337158203, 0.00014787912368774414, 0.00016880035400390625, 0.00018972158432006836, 0.00021064281463623047, 0.00023156404495239258, 0.0002524852752685547, 0.0002734065055847168, 0.0002943277359008789, 0.000315248966217041, 0.0003361701965332031, 0.00035709142684936523, 0.00037801265716552734, 0.00039893388748168945, 0.00041985511779785156, 0.00044077634811401367, 0.0004616975784301758, 0.0004826188087463379, 0.0005035400390625, 0.0005244612693786621, 0.0005453824996948242, 0.0005663037300109863, 0.0005872249603271484, 0.0006081461906433105, 0.0006290674209594727, 0.0006499886512756348, 0.0006709098815917969, 0.000691831111907959, 0.0007127523422241211, 0.0007336735725402832, 0.0007545948028564453, 0.0007755160331726074, 0.0007964372634887695, 0.0008173584938049316, 0.0008382797241210938]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 7.0, 15.0, 12.0, 31.0, 43.0, 82.0, 95.0, 196.0, 282.0, 465.0, 797.0, 1225.0, 2022.0, 3418.0, 5795.0, 10251.0, 17620.0, 30681.0, 53434.0, 87285.0, 128584.0, 162737.0, 167306.0, 137941.0, 95769.0, 59622.0, 35010.0, 20157.0, 11315.0, 6679.0, 3897.0, 2313.0, 1320.0, 801.0, 495.0, 314.0, 213.0, 130.0, 83.0, 35.0, 27.0, 19.0, 10.0, 7.0, 4.0, 5.0, 4.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.26953125, -4.12286376953125, -3.9761962890625, -3.82952880859375, -3.682861328125, -3.53619384765625, -3.3895263671875, -3.24285888671875, -3.09619140625, -2.94952392578125, -2.8028564453125, -2.65618896484375, -2.509521484375, -2.36285400390625, -2.2161865234375, -2.06951904296875, -1.9228515625, -1.77618408203125, -1.6295166015625, -1.48284912109375, -1.336181640625, -1.18951416015625, -1.0428466796875, -0.89617919921875, -0.74951171875, -0.60284423828125, -0.4561767578125, -0.30950927734375, -0.162841796875, -0.01617431640625, 0.1304931640625, 0.27716064453125, 0.423828125, 0.57049560546875, 0.7171630859375, 0.86383056640625, 1.010498046875, 1.15716552734375, 1.3038330078125, 1.45050048828125, 1.59716796875, 1.74383544921875, 1.8905029296875, 2.03717041015625, 2.183837890625, 2.33050537109375, 2.4771728515625, 2.62384033203125, 2.7705078125, 2.91717529296875, 3.0638427734375, 3.21051025390625, 3.357177734375, 3.50384521484375, 3.6505126953125, 3.79718017578125, 3.94384765625, 4.09051513671875, 4.2371826171875, 4.38385009765625, 4.530517578125, 4.67718505859375, 4.8238525390625, 4.97052001953125, 5.1171875]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 7.0, 9.0, 10.0, 13.0, 24.0, 25.0, 22.0, 21.0, 38.0, 38.0, 47.0, 56.0, 65.0, 68.0, 65.0, 74.0, 63.0, 58.0, 53.0, 36.0, 36.0, 43.0, 35.0, 18.0, 17.0, 23.0, 12.0, 9.0, 6.0, 6.0, 6.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.91796875, -1.8644866943359375, -1.811004638671875, -1.7575225830078125, -1.70404052734375, -1.6505584716796875, -1.597076416015625, -1.5435943603515625, -1.4901123046875, -1.4366302490234375, -1.383148193359375, -1.3296661376953125, -1.27618408203125, -1.2227020263671875, -1.169219970703125, -1.1157379150390625, -1.062255859375, -1.0087738037109375, -0.955291748046875, -0.9018096923828125, -0.84832763671875, -0.7948455810546875, -0.741363525390625, -0.6878814697265625, -0.6343994140625, -0.5809173583984375, -0.527435302734375, -0.4739532470703125, -0.42047119140625, -0.3669891357421875, -0.313507080078125, -0.2600250244140625, -0.20654296875, -0.1530609130859375, -0.099578857421875, -0.0460968017578125, 0.00738525390625, 0.0608673095703125, 0.114349365234375, 0.1678314208984375, 0.2213134765625, 0.2747955322265625, 0.328277587890625, 0.3817596435546875, 0.43524169921875, 0.4887237548828125, 0.542205810546875, 0.5956878662109375, 0.649169921875, 0.7026519775390625, 0.756134033203125, 0.8096160888671875, 0.86309814453125, 0.9165802001953125, 0.970062255859375, 1.0235443115234375, 1.0770263671875, 1.1305084228515625, 1.183990478515625, 1.2374725341796875, 1.29095458984375, 1.3444366455078125, 1.397918701171875, 1.4514007568359375, 1.5048828125]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 0.0, 6.0, 8.0, 10.0, 13.0, 15.0, 22.0, 26.0, 38.0, 37.0, 35.0, 38.0, 43.0, 45.0, 70.0, 74.0, 53.0, 55.0, 65.0, 63.0, 37.0, 48.0, 38.0, 33.0, 25.0, 20.0, 16.0, 19.0, 14.0, 11.0, 2.0, 5.0, 4.0, 5.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.539966583251953, -12.150784492492676, -11.761602401733398, -11.372420310974121, -10.983238220214844, -10.594056129455566, -10.204874038696289, -9.815691947937012, -9.426509857177734, -9.037327766418457, -8.64814567565918, -8.258963584899902, -7.869781494140625, -7.480599403381348, -7.09141731262207, -6.702235221862793, -6.313053131103516, -5.923871040344238, -5.534688949584961, -5.145506858825684, -4.756324768066406, -4.367142677307129, -3.9779605865478516, -3.588778495788574, -3.199596405029297, -2.8104143142700195, -2.421232223510742, -2.032050132751465, -1.6428680419921875, -1.2536859512329102, -0.8645038604736328, -0.47532176971435547, -0.08613967895507812, 0.3030424118041992, 0.6922245025634766, 1.081406593322754, 1.4705886840820312, 1.8597707748413086, 2.248952865600586, 2.6381349563598633, 3.0273170471191406, 3.416499137878418, 3.8056812286376953, 4.194863319396973, 4.58404541015625, 4.973227500915527, 5.362409591674805, 5.751591682434082, 6.140773773193359, 6.529955863952637, 6.919137954711914, 7.308320045471191, 7.697502136230469, 8.086684226989746, 8.475866317749023, 8.8650484085083, 9.254230499267578, 9.643412590026855, 10.032594680786133, 10.42177677154541, 10.810958862304688, 11.200140953063965, 11.589323043823242, 11.97850513458252, 12.367687225341797]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 7.0, 10.0, 7.0, 9.0, 15.0, 17.0, 15.0, 11.0, 19.0, 23.0, 26.0, 32.0, 29.0, 46.0, 32.0, 35.0, 32.0, 43.0, 46.0, 34.0, 44.0, 49.0, 38.0, 35.0, 48.0, 25.0, 26.0, 40.0, 27.0, 30.0, 20.0, 15.0, 21.0, 14.0, 24.0, 9.0, 12.0, 9.0, 5.0, 4.0, 2.0, 3.0, 7.0, 1.0, 1.0, 3.0, 2.0, 3.0], "bins": [-8.424476623535156, -8.190656661987305, -7.956836223602295, -7.723016262054443, -7.489195823669434, -7.255375862121582, -7.0215559005737305, -6.787735939025879, -6.553915500640869, -6.320095539093018, -6.086275100708008, -5.852455139160156, -5.618635177612305, -5.384814739227295, -5.150994777679443, -4.917174339294434, -4.683354377746582, -4.4495344161987305, -4.215713977813721, -3.981894016265869, -3.7480738162994385, -3.514253616333008, -3.2804336547851562, -3.0466134548187256, -2.812793254852295, -2.5789730548858643, -2.3451528549194336, -2.111332893371582, -1.8775126934051514, -1.6436924934387207, -1.4098724126815796, -1.1760523319244385, -0.942232608795166, -0.7084124684333801, -0.47459232807159424, -0.24077218770980835, -0.006952047348022461, 0.2268681526184082, 0.4606882333755493, 0.6945083141326904, 0.9283285140991211, 1.1621487140655518, 1.3959687948226929, 1.629788875579834, 1.8636090755462646, 2.0974292755126953, 2.331249237060547, 2.5650694370269775, 2.798889636993408, 3.032709836959839, 3.2665300369262695, 3.500349998474121, 3.7341701984405518, 3.9679903984069824, 4.201810359954834, 4.435630798339844, 4.669450759887695, 4.903270721435547, 5.137091159820557, 5.370911121368408, 5.604731559753418, 5.8385515213012695, 6.072371482849121, 6.306191444396973, 6.540011882781982]}, "gradients/decoder.bert.encoder.layer.13.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 8.0, 6.0, 5.0, 15.0, 15.0, 33.0, 37.0, 87.0, 95.0, 186.0, 250.0, 384.0, 579.0, 893.0, 1410.0, 2176.0, 3543.0, 5546.0, 8808.0, 13938.0, 22745.0, 37895.0, 62651.0, 106221.0, 179838.0, 304332.0, 492508.0, 688119.0, 736856.0, 583638.0, 378858.0, 226537.0, 134071.0, 79512.0, 47437.0, 28799.0, 17169.0, 10838.0, 6655.0, 4227.0, 2592.0, 1656.0, 1068.0, 720.0, 463.0, 280.0, 225.0, 140.0, 91.0, 44.0, 36.0, 26.0, 15.0, 10.0, 8.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-8.09375, -7.83447265625, -7.5751953125, -7.31591796875, -7.056640625, -6.79736328125, -6.5380859375, -6.27880859375, -6.01953125, -5.76025390625, -5.5009765625, -5.24169921875, -4.982421875, -4.72314453125, -4.4638671875, -4.20458984375, -3.9453125, -3.68603515625, -3.4267578125, -3.16748046875, -2.908203125, -2.64892578125, -2.3896484375, -2.13037109375, -1.87109375, -1.61181640625, -1.3525390625, -1.09326171875, -0.833984375, -0.57470703125, -0.3154296875, -0.05615234375, 0.203125, 0.46240234375, 0.7216796875, 0.98095703125, 1.240234375, 1.49951171875, 1.7587890625, 2.01806640625, 2.27734375, 2.53662109375, 2.7958984375, 3.05517578125, 3.314453125, 3.57373046875, 3.8330078125, 4.09228515625, 4.3515625, 4.61083984375, 4.8701171875, 5.12939453125, 5.388671875, 5.64794921875, 5.9072265625, 6.16650390625, 6.42578125, 6.68505859375, 6.9443359375, 7.20361328125, 7.462890625, 7.72216796875, 7.9814453125, 8.24072265625, 8.5]}, "gradients/decoder.bert.encoder.layer.13.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 8.0, 2.0, 6.0, 8.0, 5.0, 12.0, 10.0, 8.0, 10.0, 15.0, 14.0, 17.0, 31.0, 31.0, 39.0, 40.0, 35.0, 39.0, 39.0, 27.0, 47.0, 33.0, 42.0, 46.0, 40.0, 41.0, 37.0, 42.0, 41.0, 34.0, 35.0, 31.0, 19.0, 21.0, 16.0, 17.0, 18.0, 8.0, 9.0, 2.0, 3.0, 6.0, 7.0, 7.0, 3.0, 2.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.68359375, -5.51318359375, -5.3427734375, -5.17236328125, -5.001953125, -4.83154296875, -4.6611328125, -4.49072265625, -4.3203125, -4.14990234375, -3.9794921875, -3.80908203125, -3.638671875, -3.46826171875, -3.2978515625, -3.12744140625, -2.95703125, -2.78662109375, -2.6162109375, -2.44580078125, -2.275390625, -2.10498046875, -1.9345703125, -1.76416015625, -1.59375, -1.42333984375, -1.2529296875, -1.08251953125, -0.912109375, -0.74169921875, -0.5712890625, -0.40087890625, -0.23046875, -0.06005859375, 0.1103515625, 0.28076171875, 0.451171875, 0.62158203125, 0.7919921875, 0.96240234375, 1.1328125, 1.30322265625, 1.4736328125, 1.64404296875, 1.814453125, 1.98486328125, 2.1552734375, 2.32568359375, 2.49609375, 2.66650390625, 2.8369140625, 3.00732421875, 3.177734375, 3.34814453125, 3.5185546875, 3.68896484375, 3.859375, 4.02978515625, 4.2001953125, 4.37060546875, 4.541015625, 4.71142578125, 4.8818359375, 5.05224609375, 5.22265625]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.weight": {"_type": "histogram", "values": [4.0, 3.0, 2.0, 3.0, 8.0, 12.0, 15.0, 20.0, 26.0, 23.0, 39.0, 68.0, 105.0, 182.0, 269.0, 384.0, 628.0, 1026.0, 1672.0, 2916.0, 4865.0, 8408.0, 14244.0, 25597.0, 46782.0, 84261.0, 153363.0, 273453.0, 458918.0, 670818.0, 772627.0, 653047.0, 437110.0, 258494.0, 144807.0, 79366.0, 43149.0, 24531.0, 13610.0, 7838.0, 4661.0, 2636.0, 1594.0, 975.0, 620.0, 394.0, 266.0, 159.0, 91.0, 66.0, 43.0, 30.0, 18.0, 20.0, 9.0, 8.0, 7.0, 3.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0], "bins": [-9.28125, -8.9764404296875, -8.671630859375, -8.3668212890625, -8.06201171875, -7.7572021484375, -7.452392578125, -7.1475830078125, -6.8427734375, -6.5379638671875, -6.233154296875, -5.9283447265625, -5.62353515625, -5.3187255859375, -5.013916015625, -4.7091064453125, -4.404296875, -4.0994873046875, -3.794677734375, -3.4898681640625, -3.18505859375, -2.8802490234375, -2.575439453125, -2.2706298828125, -1.9658203125, -1.6610107421875, -1.356201171875, -1.0513916015625, -0.74658203125, -0.4417724609375, -0.136962890625, 0.1678466796875, 0.47265625, 0.7774658203125, 1.082275390625, 1.3870849609375, 1.69189453125, 1.9967041015625, 2.301513671875, 2.6063232421875, 2.9111328125, 3.2159423828125, 3.520751953125, 3.8255615234375, 4.13037109375, 4.4351806640625, 4.739990234375, 5.0447998046875, 5.349609375, 5.6544189453125, 5.959228515625, 6.2640380859375, 6.56884765625, 6.8736572265625, 7.178466796875, 7.4832763671875, 7.7880859375, 8.0928955078125, 8.397705078125, 8.7025146484375, 9.00732421875, 9.3121337890625, 9.616943359375, 9.9217529296875, 10.2265625]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 4.0, 7.0, 7.0, 9.0, 8.0, 15.0, 11.0, 28.0, 30.0, 39.0, 39.0, 55.0, 61.0, 65.0, 92.0, 87.0, 122.0, 137.0, 145.0, 176.0, 194.0, 187.0, 214.0, 209.0, 198.0, 216.0, 206.0, 211.0, 182.0, 180.0, 143.0, 130.0, 118.0, 101.0, 95.0, 74.0, 71.0, 53.0, 37.0, 24.0, 18.0, 14.0, 13.0, 20.0, 9.0, 7.0, 8.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.759765625, -2.6719970703125, -2.584228515625, -2.4964599609375, -2.40869140625, -2.3209228515625, -2.233154296875, -2.1453857421875, -2.0576171875, -1.9698486328125, -1.882080078125, -1.7943115234375, -1.70654296875, -1.6187744140625, -1.531005859375, -1.4432373046875, -1.35546875, -1.2677001953125, -1.179931640625, -1.0921630859375, -1.00439453125, -0.9166259765625, -0.828857421875, -0.7410888671875, -0.6533203125, -0.5655517578125, -0.477783203125, -0.3900146484375, -0.30224609375, -0.2144775390625, -0.126708984375, -0.0389404296875, 0.048828125, 0.1365966796875, 0.224365234375, 0.3121337890625, 0.39990234375, 0.4876708984375, 0.575439453125, 0.6632080078125, 0.7509765625, 0.8387451171875, 0.926513671875, 1.0142822265625, 1.10205078125, 1.1898193359375, 1.277587890625, 1.3653564453125, 1.453125, 1.5408935546875, 1.628662109375, 1.7164306640625, 1.80419921875, 1.8919677734375, 1.979736328125, 2.0675048828125, 2.1552734375, 2.2430419921875, 2.330810546875, 2.4185791015625, 2.50634765625, 2.5941162109375, 2.681884765625, 2.7696533203125, 2.857421875]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 4.0, 1.0, 3.0, 6.0, 7.0, 10.0, 15.0, 20.0, 14.0, 18.0, 26.0, 35.0, 29.0, 35.0, 42.0, 51.0, 50.0, 47.0, 50.0, 55.0, 59.0, 52.0, 55.0, 46.0, 49.0, 44.0, 31.0, 19.0, 22.0, 22.0, 14.0, 18.0, 13.0, 9.0, 5.0, 9.0, 6.0, 5.0, 4.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.866893768310547, -10.524741172790527, -10.182588577270508, -9.840435028076172, -9.498282432556152, -9.156129837036133, -8.813977241516113, -8.471824645996094, -8.129672050476074, -7.787519454956055, -7.445366382598877, -7.103213787078857, -6.761061191558838, -6.41890811920166, -6.076755523681641, -5.734602928161621, -5.392449855804443, -5.050297260284424, -4.708144187927246, -4.365991592407227, -4.023838996887207, -3.6816861629486084, -3.3395333290100098, -2.9973807334899902, -2.6552278995513916, -2.313075065612793, -1.9709224700927734, -1.6287696361541748, -1.2866169214248657, -0.9444642066955566, -0.602311372756958, -0.2601587772369385, 0.08199405670166016, 0.4241468012332916, 0.7662995457649231, 1.108452320098877, 1.450605034828186, 1.7927577495574951, 2.1349105834960938, 2.4770631790161133, 2.819216012954712, 3.1613688468933105, 3.50352144241333, 3.8456742763519287, 4.187827110290527, 4.529979705810547, 4.872132301330566, 5.214284896850586, 5.556437969207764, 5.898590564727783, 6.240743637084961, 6.5828962326049805, 6.925048828125, 7.2672014236450195, 7.609354496002197, 7.951507091522217, 8.293660163879395, 8.635812759399414, 8.977965354919434, 9.320117950439453, 9.662271499633789, 10.004424095153809, 10.346576690673828, 10.688729286193848, 11.030881881713867]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 5.0, 9.0, 7.0, 9.0, 10.0, 8.0, 10.0, 14.0, 17.0, 17.0, 24.0, 30.0, 31.0, 37.0, 23.0, 33.0, 33.0, 40.0, 47.0, 41.0, 43.0, 35.0, 38.0, 40.0, 42.0, 34.0, 37.0, 25.0, 30.0, 36.0, 26.0, 19.0, 23.0, 16.0, 26.0, 12.0, 11.0, 18.0, 12.0, 3.0, 9.0, 8.0, 3.0, 2.0, 4.0, 3.0, 0.0, 3.0, 2.0, 1.0], "bins": [-7.118824005126953, -6.918753147125244, -6.718682289123535, -6.518611907958984, -6.318541049957275, -6.118470191955566, -5.918399810791016, -5.718328952789307, -5.518258094787598, -5.318187236785889, -5.11811637878418, -4.918045997619629, -4.71797513961792, -4.517904281616211, -4.31783390045166, -4.117763042449951, -3.917692184448242, -3.717621326446533, -3.5175507068634033, -3.3174800872802734, -3.1174092292785645, -2.9173383712768555, -2.7172677516937256, -2.5171971321105957, -2.3171262741088867, -2.1170554161071777, -1.9169847965240479, -1.7169140577316284, -1.516843318939209, -1.3167725801467896, -1.1167018413543701, -0.9166311025619507, -0.7165603637695312, -0.5164896249771118, -0.3164188861846924, -0.11634814739227295, 0.08372259140014648, 0.2837933301925659, 0.48386406898498535, 0.6839348077774048, 0.8840055465698242, 1.0840762853622437, 1.284147024154663, 1.4842177629470825, 1.684288501739502, 1.8843592405319214, 2.084429979324341, 2.2845005989074707, 2.4845714569091797, 2.6846423149108887, 2.8847129344940186, 3.0847835540771484, 3.2848544120788574, 3.4849252700805664, 3.6849958896636963, 3.885066509246826, 4.085137367248535, 4.285208225250244, 4.485279083251953, 4.685349464416504, 4.885420322418213, 5.085491180419922, 5.285561561584473, 5.485632419586182, 5.685703277587891]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 8.0, 15.0, 21.0, 30.0, 36.0, 53.0, 104.0, 104.0, 154.0, 243.0, 365.0, 518.0, 771.0, 1127.0, 1820.0, 2968.0, 5226.0, 9643.0, 18799.0, 37490.0, 73431.0, 133011.0, 195864.0, 209987.0, 159607.0, 94305.0, 49064.0, 24835.0, 12500.0, 6535.0, 3713.0, 2159.0, 1264.0, 881.0, 597.0, 418.0, 316.0, 186.0, 118.0, 94.0, 61.0, 47.0, 29.0, 15.0, 14.0, 5.0, 9.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.13671875, -4.96661376953125, -4.7965087890625, -4.62640380859375, -4.456298828125, -4.28619384765625, -4.1160888671875, -3.94598388671875, -3.77587890625, -3.60577392578125, -3.4356689453125, -3.26556396484375, -3.095458984375, -2.92535400390625, -2.7552490234375, -2.58514404296875, -2.4150390625, -2.24493408203125, -2.0748291015625, -1.90472412109375, -1.734619140625, -1.56451416015625, -1.3944091796875, -1.22430419921875, -1.05419921875, -0.88409423828125, -0.7139892578125, -0.54388427734375, -0.373779296875, -0.20367431640625, -0.0335693359375, 0.13653564453125, 0.306640625, 0.47674560546875, 0.6468505859375, 0.81695556640625, 0.987060546875, 1.15716552734375, 1.3272705078125, 1.49737548828125, 1.66748046875, 1.83758544921875, 2.0076904296875, 2.17779541015625, 2.347900390625, 2.51800537109375, 2.6881103515625, 2.85821533203125, 3.0283203125, 3.19842529296875, 3.3685302734375, 3.53863525390625, 3.708740234375, 3.87884521484375, 4.0489501953125, 4.21905517578125, 4.38916015625, 4.55926513671875, 4.7293701171875, 4.89947509765625, 5.069580078125, 5.23968505859375, 5.4097900390625, 5.57989501953125, 5.75]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 2.0, 6.0, 5.0, 7.0, 4.0, 6.0, 14.0, 12.0, 14.0, 10.0, 17.0, 17.0, 23.0, 23.0, 21.0, 21.0, 26.0, 25.0, 38.0, 41.0, 37.0, 31.0, 49.0, 41.0, 32.0, 35.0, 30.0, 30.0, 38.0, 26.0, 28.0, 23.0, 31.0, 27.0, 27.0, 28.0, 27.0, 17.0, 16.0, 17.0, 17.0, 20.0, 7.0, 9.0, 10.0, 9.0, 2.0, 3.0, 4.0, 3.0, 0.0, 3.0], "bins": [-7.51953125, -7.31396484375, -7.1083984375, -6.90283203125, -6.697265625, -6.49169921875, -6.2861328125, -6.08056640625, -5.875, -5.66943359375, -5.4638671875, -5.25830078125, -5.052734375, -4.84716796875, -4.6416015625, -4.43603515625, -4.23046875, -4.02490234375, -3.8193359375, -3.61376953125, -3.408203125, -3.20263671875, -2.9970703125, -2.79150390625, -2.5859375, -2.38037109375, -2.1748046875, -1.96923828125, -1.763671875, -1.55810546875, -1.3525390625, -1.14697265625, -0.94140625, -0.73583984375, -0.5302734375, -0.32470703125, -0.119140625, 0.08642578125, 0.2919921875, 0.49755859375, 0.703125, 0.90869140625, 1.1142578125, 1.31982421875, 1.525390625, 1.73095703125, 1.9365234375, 2.14208984375, 2.34765625, 2.55322265625, 2.7587890625, 2.96435546875, 3.169921875, 3.37548828125, 3.5810546875, 3.78662109375, 3.9921875, 4.19775390625, 4.4033203125, 4.60888671875, 4.814453125, 5.02001953125, 5.2255859375, 5.43115234375, 5.63671875]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 4.0, 4.0, 10.0, 17.0, 10.0, 42.0, 49.0, 53.0, 96.0, 125.0, 237.0, 327.0, 578.0, 1019.0, 1821.0, 3613.0, 7752.0, 18167.0, 46055.0, 120476.0, 278462.0, 316430.0, 152879.0, 58644.0, 22674.0, 9643.0, 4234.0, 2194.0, 1136.0, 664.0, 403.0, 247.0, 157.0, 110.0, 75.0, 43.0, 32.0, 21.0, 17.0, 12.0, 4.0, 5.0, 4.0, 6.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.109375, -7.821044921875, -7.53271484375, -7.244384765625, -6.9560546875, -6.667724609375, -6.37939453125, -6.091064453125, -5.802734375, -5.514404296875, -5.22607421875, -4.937744140625, -4.6494140625, -4.361083984375, -4.07275390625, -3.784423828125, -3.49609375, -3.207763671875, -2.91943359375, -2.631103515625, -2.3427734375, -2.054443359375, -1.76611328125, -1.477783203125, -1.189453125, -0.901123046875, -0.61279296875, -0.324462890625, -0.0361328125, 0.252197265625, 0.54052734375, 0.828857421875, 1.1171875, 1.405517578125, 1.69384765625, 1.982177734375, 2.2705078125, 2.558837890625, 2.84716796875, 3.135498046875, 3.423828125, 3.712158203125, 4.00048828125, 4.288818359375, 4.5771484375, 4.865478515625, 5.15380859375, 5.442138671875, 5.73046875, 6.018798828125, 6.30712890625, 6.595458984375, 6.8837890625, 7.172119140625, 7.46044921875, 7.748779296875, 8.037109375, 8.325439453125, 8.61376953125, 8.902099609375, 9.1904296875, 9.478759765625, 9.76708984375, 10.055419921875, 10.34375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 7.0, 7.0, 5.0, 10.0, 12.0, 14.0, 14.0, 21.0, 26.0, 21.0, 31.0, 27.0, 28.0, 29.0, 30.0, 32.0, 43.0, 41.0, 42.0, 48.0, 34.0, 46.0, 32.0, 31.0, 41.0, 36.0, 34.0, 30.0, 24.0, 27.0, 23.0, 25.0, 24.0, 26.0, 15.0, 8.0, 11.0, 14.0, 8.0, 5.0, 6.0, 3.0, 3.0, 5.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.2421875, -4.10302734375, -3.9638671875, -3.82470703125, -3.685546875, -3.54638671875, -3.4072265625, -3.26806640625, -3.12890625, -2.98974609375, -2.8505859375, -2.71142578125, -2.572265625, -2.43310546875, -2.2939453125, -2.15478515625, -2.015625, -1.87646484375, -1.7373046875, -1.59814453125, -1.458984375, -1.31982421875, -1.1806640625, -1.04150390625, -0.90234375, -0.76318359375, -0.6240234375, -0.48486328125, -0.345703125, -0.20654296875, -0.0673828125, 0.07177734375, 0.2109375, 0.35009765625, 0.4892578125, 0.62841796875, 0.767578125, 0.90673828125, 1.0458984375, 1.18505859375, 1.32421875, 1.46337890625, 1.6025390625, 1.74169921875, 1.880859375, 2.02001953125, 2.1591796875, 2.29833984375, 2.4375, 2.57666015625, 2.7158203125, 2.85498046875, 2.994140625, 3.13330078125, 3.2724609375, 3.41162109375, 3.55078125, 3.68994140625, 3.8291015625, 3.96826171875, 4.107421875, 4.24658203125, 4.3857421875, 4.52490234375, 4.6640625]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 3.0, 12.0, 8.0, 8.0, 18.0, 38.0, 39.0, 42.0, 72.0, 106.0, 133.0, 200.0, 308.0, 458.0, 702.0, 1100.0, 1712.0, 3091.0, 5646.0, 11598.0, 27527.0, 70096.0, 186104.0, 349501.0, 233836.0, 91248.0, 34548.0, 14566.0, 6683.0, 3509.0, 2014.0, 1253.0, 778.0, 502.0, 355.0, 240.0, 151.0, 110.0, 76.0, 49.0, 36.0, 28.0, 19.0, 15.0, 6.0, 5.0, 6.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.36328125, -4.225341796875, -4.08740234375, -3.949462890625, -3.8115234375, -3.673583984375, -3.53564453125, -3.397705078125, -3.259765625, -3.121826171875, -2.98388671875, -2.845947265625, -2.7080078125, -2.570068359375, -2.43212890625, -2.294189453125, -2.15625, -2.018310546875, -1.88037109375, -1.742431640625, -1.6044921875, -1.466552734375, -1.32861328125, -1.190673828125, -1.052734375, -0.914794921875, -0.77685546875, -0.638916015625, -0.5009765625, -0.363037109375, -0.22509765625, -0.087158203125, 0.05078125, 0.188720703125, 0.32666015625, 0.464599609375, 0.6025390625, 0.740478515625, 0.87841796875, 1.016357421875, 1.154296875, 1.292236328125, 1.43017578125, 1.568115234375, 1.7060546875, 1.843994140625, 1.98193359375, 2.119873046875, 2.2578125, 2.395751953125, 2.53369140625, 2.671630859375, 2.8095703125, 2.947509765625, 3.08544921875, 3.223388671875, 3.361328125, 3.499267578125, 3.63720703125, 3.775146484375, 3.9130859375, 4.051025390625, 4.18896484375, 4.326904296875, 4.46484375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 8.0, 9.0, 7.0, 14.0, 20.0, 37.0, 81.0, 72.0, 134.0, 111.0, 143.0, 107.0, 93.0, 64.0, 38.0, 26.0, 16.0, 8.0, 7.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.000263214111328125, -0.00025552138686180115, -0.0002478286623954773, -0.00024013593792915344, -0.0002324432134628296, -0.00022475048899650574, -0.00021705776453018188, -0.00020936504006385803, -0.00020167231559753418, -0.00019397959113121033, -0.00018628686666488647, -0.00017859414219856262, -0.00017090141773223877, -0.00016320869326591492, -0.00015551596879959106, -0.0001478232443332672, -0.00014013051986694336, -0.0001324377954006195, -0.00012474507093429565, -0.0001170523464679718, -0.00010935962200164795, -0.0001016668975353241, -9.397417306900024e-05, -8.628144860267639e-05, -7.858872413635254e-05, -7.089599967002869e-05, -6.320327520370483e-05, -5.551055073738098e-05, -4.781782627105713e-05, -4.0125101804733276e-05, -3.2432377338409424e-05, -2.473965287208557e-05, -1.704692840576172e-05, -9.354203939437866e-06, -1.6614794731140137e-06, 6.031244993209839e-06, 1.3723969459533691e-05, 2.1416693925857544e-05, 2.9109418392181396e-05, 3.680214285850525e-05, 4.44948673248291e-05, 5.2187591791152954e-05, 5.988031625747681e-05, 6.757304072380066e-05, 7.526576519012451e-05, 8.295848965644836e-05, 9.065121412277222e-05, 9.834393858909607e-05, 0.00010603666305541992, 0.00011372938752174377, 0.00012142211198806763, 0.00012911483645439148, 0.00013680756092071533, 0.00014450028538703918, 0.00015219300985336304, 0.0001598857343196869, 0.00016757845878601074, 0.0001752711832523346, 0.00018296390771865845, 0.0001906566321849823, 0.00019834935665130615, 0.00020604208111763, 0.00021373480558395386, 0.0002214275300502777, 0.00022912025451660156]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 1.0, 2.0, 2.0, 5.0, 6.0, 2.0, 10.0, 14.0, 18.0, 21.0, 36.0, 26.0, 54.0, 59.0, 110.0, 122.0, 168.0, 254.0, 301.0, 421.0, 551.0, 863.0, 1233.0, 2008.0, 3624.0, 7886.0, 24153.0, 88454.0, 280332.0, 386006.0, 176286.0, 48434.0, 13889.0, 5261.0, 2650.0, 1577.0, 1038.0, 714.0, 511.0, 376.0, 283.0, 221.0, 145.0, 96.0, 85.0, 71.0, 41.0, 29.0, 31.0, 23.0, 17.0, 9.0, 11.0, 8.0, 7.0, 4.0, 5.0, 3.0, 0.0, 0.0, 3.0], "bins": [-5.30859375, -5.14410400390625, -4.9796142578125, -4.81512451171875, -4.650634765625, -4.48614501953125, -4.3216552734375, -4.15716552734375, -3.99267578125, -3.82818603515625, -3.6636962890625, -3.49920654296875, -3.334716796875, -3.17022705078125, -3.0057373046875, -2.84124755859375, -2.6767578125, -2.51226806640625, -2.3477783203125, -2.18328857421875, -2.018798828125, -1.85430908203125, -1.6898193359375, -1.52532958984375, -1.36083984375, -1.19635009765625, -1.0318603515625, -0.86737060546875, -0.702880859375, -0.53839111328125, -0.3739013671875, -0.20941162109375, -0.044921875, 0.11956787109375, 0.2840576171875, 0.44854736328125, 0.613037109375, 0.77752685546875, 0.9420166015625, 1.10650634765625, 1.27099609375, 1.43548583984375, 1.5999755859375, 1.76446533203125, 1.928955078125, 2.09344482421875, 2.2579345703125, 2.42242431640625, 2.5869140625, 2.75140380859375, 2.9158935546875, 3.08038330078125, 3.244873046875, 3.40936279296875, 3.5738525390625, 3.73834228515625, 3.90283203125, 4.06732177734375, 4.2318115234375, 4.39630126953125, 4.560791015625, 4.72528076171875, 4.8897705078125, 5.05426025390625, 5.21875]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 9.0, 15.0, 27.0, 38.0, 79.0, 109.0, 135.0, 149.0, 140.0, 96.0, 79.0, 50.0, 26.0, 14.0, 6.0, 5.0, 3.0, 7.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.8798828125, -1.823883056640625, -1.76788330078125, -1.711883544921875, -1.6558837890625, -1.599884033203125, -1.54388427734375, -1.487884521484375, -1.431884765625, -1.375885009765625, -1.31988525390625, -1.263885498046875, -1.2078857421875, -1.151885986328125, -1.09588623046875, -1.039886474609375, -0.98388671875, -0.927886962890625, -0.87188720703125, -0.815887451171875, -0.7598876953125, -0.703887939453125, -0.64788818359375, -0.591888427734375, -0.535888671875, -0.479888916015625, -0.42388916015625, -0.367889404296875, -0.3118896484375, -0.255889892578125, -0.19989013671875, -0.143890380859375, -0.087890625, -0.031890869140625, 0.02410888671875, 0.080108642578125, 0.1361083984375, 0.192108154296875, 0.24810791015625, 0.304107666015625, 0.360107421875, 0.416107177734375, 0.47210693359375, 0.528106689453125, 0.5841064453125, 0.640106201171875, 0.69610595703125, 0.752105712890625, 0.80810546875, 0.864105224609375, 0.92010498046875, 0.976104736328125, 1.0321044921875, 1.088104248046875, 1.14410400390625, 1.200103759765625, 1.256103515625, 1.312103271484375, 1.36810302734375, 1.424102783203125, 1.4801025390625, 1.536102294921875, 1.59210205078125, 1.648101806640625, 1.7041015625]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 13.0, 6.0, 15.0, 20.0, 19.0, 26.0, 25.0, 18.0, 33.0, 43.0, 46.0, 50.0, 56.0, 59.0, 48.0, 63.0, 60.0, 53.0, 54.0, 40.0, 48.0, 36.0, 20.0, 24.0, 26.0, 17.0, 14.0, 11.0, 11.0, 11.0, 7.0, 10.0, 6.0, 1.0, 4.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.571693420410156, -11.223751068115234, -10.875808715820312, -10.52786636352539, -10.179924011230469, -9.831981658935547, -9.484039306640625, -9.136096954345703, -8.788154602050781, -8.44021224975586, -8.092269897460938, -7.744327545166016, -7.396385192871094, -7.048442840576172, -6.70050048828125, -6.352558135986328, -6.004615783691406, -5.656673431396484, -5.3087310791015625, -4.960788726806641, -4.612846374511719, -4.264904022216797, -3.916961669921875, -3.569019317626953, -3.2210769653320312, -2.8731346130371094, -2.5251922607421875, -2.1772499084472656, -1.8293075561523438, -1.4813652038574219, -1.1334228515625, -0.7854804992675781, -0.43753910064697266, -0.08959674835205078, 0.2583456039428711, 0.606287956237793, 0.9542303085327148, 1.3021726608276367, 1.6501150131225586, 1.9980573654174805, 2.3459997177124023, 2.693942070007324, 3.041884422302246, 3.389826774597168, 3.73776912689209, 4.085711479187012, 4.433653831481934, 4.7815961837768555, 5.129538536071777, 5.477480888366699, 5.825423240661621, 6.173365592956543, 6.521307945251465, 6.869250297546387, 7.217192649841309, 7.5651350021362305, 7.913077354431152, 8.261019706726074, 8.608962059020996, 8.956904411315918, 9.30484676361084, 9.652789115905762, 10.000731468200684, 10.348673820495605, 10.696616172790527]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 5.0, 6.0, 6.0, 12.0, 6.0, 9.0, 13.0, 6.0, 19.0, 15.0, 16.0, 24.0, 27.0, 44.0, 24.0, 32.0, 36.0, 38.0, 40.0, 39.0, 34.0, 41.0, 41.0, 48.0, 36.0, 37.0, 27.0, 40.0, 25.0, 35.0, 35.0, 24.0, 19.0, 23.0, 15.0, 18.0, 12.0, 18.0, 16.0, 8.0, 4.0, 11.0, 5.0, 5.0, 0.0, 4.0, 4.0, 1.0, 2.0, 3.0], "bins": [-7.158749103546143, -6.960467338562012, -6.762185573577881, -6.56390380859375, -6.365622043609619, -6.167340278625488, -5.969058990478516, -5.770776748657227, -5.572495460510254, -5.374213695526123, -5.175931930541992, -4.977650165557861, -4.7793684005737305, -4.5810866355896, -4.382804870605469, -4.184523582458496, -3.986241340637207, -3.787959575653076, -3.5896778106689453, -3.3913960456848145, -3.1931142807006836, -2.9948325157165527, -2.796550989151001, -2.59826922416687, -2.3999874591827393, -2.2017056941986084, -2.0034239292144775, -1.8051422834396362, -1.6068605184555054, -1.4085787534713745, -1.2102971076965332, -1.0120153427124023, -0.8137340545654297, -0.6154522895812988, -0.41717058420181274, -0.21888887882232666, -0.0206071138381958, 0.17767465114593506, 0.37595629692077637, 0.5742380619049072, 0.7725198268890381, 0.970801591873169, 1.1690833568572998, 1.3673650026321411, 1.565646767616272, 1.7639285326004028, 1.9622101783752441, 2.160491943359375, 2.358773708343506, 2.5570554733276367, 2.7553372383117676, 2.9536190032958984, 3.1519007682800293, 3.35018253326416, 3.548464059829712, 3.7467458248138428, 3.9450275897979736, 4.143309116363525, 4.341590881347656, 4.539872646331787, 4.738154411315918, 4.936436176300049, 5.13471794128418, 5.3329997062683105, 5.531281471252441]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 7.0, 9.0, 18.0, 17.0, 19.0, 27.0, 62.0, 77.0, 113.0, 193.0, 305.0, 401.0, 693.0, 1041.0, 1733.0, 2661.0, 4255.0, 6756.0, 10694.0, 16621.0, 25957.0, 38952.0, 56550.0, 77120.0, 99180.0, 116674.0, 123568.0, 117279.0, 100003.0, 78358.0, 56824.0, 39405.0, 26182.0, 17016.0, 11009.0, 6781.0, 4415.0, 2842.0, 1718.0, 1148.0, 673.0, 404.0, 255.0, 174.0, 109.0, 77.0, 65.0, 41.0, 31.0, 15.0, 16.0, 7.0, 3.0, 3.0, 4.0, 1.0, 1.0, 2.0], "bins": [-6.0078125, -5.82305908203125, -5.6383056640625, -5.45355224609375, -5.268798828125, -5.08404541015625, -4.8992919921875, -4.71453857421875, -4.52978515625, -4.34503173828125, -4.1602783203125, -3.97552490234375, -3.790771484375, -3.60601806640625, -3.4212646484375, -3.23651123046875, -3.0517578125, -2.86700439453125, -2.6822509765625, -2.49749755859375, -2.312744140625, -2.12799072265625, -1.9432373046875, -1.75848388671875, -1.57373046875, -1.38897705078125, -1.2042236328125, -1.01947021484375, -0.834716796875, -0.64996337890625, -0.4652099609375, -0.28045654296875, -0.095703125, 0.08905029296875, 0.2738037109375, 0.45855712890625, 0.643310546875, 0.82806396484375, 1.0128173828125, 1.19757080078125, 1.38232421875, 1.56707763671875, 1.7518310546875, 1.93658447265625, 2.121337890625, 2.30609130859375, 2.4908447265625, 2.67559814453125, 2.8603515625, 3.04510498046875, 3.2298583984375, 3.41461181640625, 3.599365234375, 3.78411865234375, 3.9688720703125, 4.15362548828125, 4.33837890625, 4.52313232421875, 4.7078857421875, 4.89263916015625, 5.077392578125, 5.26214599609375, 5.4468994140625, 5.63165283203125, 5.81640625]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 2.0, 5.0, 6.0, 11.0, 5.0, 5.0, 9.0, 12.0, 13.0, 16.0, 20.0, 16.0, 23.0, 19.0, 35.0, 30.0, 37.0, 29.0, 38.0, 44.0, 41.0, 34.0, 41.0, 50.0, 41.0, 37.0, 38.0, 47.0, 32.0, 27.0, 29.0, 34.0, 15.0, 26.0, 24.0, 12.0, 15.0, 13.0, 17.0, 5.0, 10.0, 8.0, 7.0, 9.0, 9.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-7.21875, -6.99462890625, -6.7705078125, -6.54638671875, -6.322265625, -6.09814453125, -5.8740234375, -5.64990234375, -5.42578125, -5.20166015625, -4.9775390625, -4.75341796875, -4.529296875, -4.30517578125, -4.0810546875, -3.85693359375, -3.6328125, -3.40869140625, -3.1845703125, -2.96044921875, -2.736328125, -2.51220703125, -2.2880859375, -2.06396484375, -1.83984375, -1.61572265625, -1.3916015625, -1.16748046875, -0.943359375, -0.71923828125, -0.4951171875, -0.27099609375, -0.046875, 0.17724609375, 0.4013671875, 0.62548828125, 0.849609375, 1.07373046875, 1.2978515625, 1.52197265625, 1.74609375, 1.97021484375, 2.1943359375, 2.41845703125, 2.642578125, 2.86669921875, 3.0908203125, 3.31494140625, 3.5390625, 3.76318359375, 3.9873046875, 4.21142578125, 4.435546875, 4.65966796875, 4.8837890625, 5.10791015625, 5.33203125, 5.55615234375, 5.7802734375, 6.00439453125, 6.228515625, 6.45263671875, 6.6767578125, 6.90087890625, 7.125]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 6.0, 6.0, 10.0, 22.0, 17.0, 37.0, 62.0, 75.0, 118.0, 189.0, 309.0, 474.0, 752.0, 1291.0, 2286.0, 3877.0, 7381.0, 13186.0, 24328.0, 43186.0, 73154.0, 113349.0, 151865.0, 169692.0, 153474.0, 114845.0, 74610.0, 44252.0, 24654.0, 13690.0, 7512.0, 4176.0, 2276.0, 1380.0, 759.0, 454.0, 277.0, 180.0, 110.0, 79.0, 46.0, 40.0, 27.0, 14.0, 10.0, 7.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.703125, -8.4434814453125, -8.183837890625, -7.9241943359375, -7.66455078125, -7.4049072265625, -7.145263671875, -6.8856201171875, -6.6259765625, -6.3663330078125, -6.106689453125, -5.8470458984375, -5.58740234375, -5.3277587890625, -5.068115234375, -4.8084716796875, -4.548828125, -4.2891845703125, -4.029541015625, -3.7698974609375, -3.51025390625, -3.2506103515625, -2.990966796875, -2.7313232421875, -2.4716796875, -2.2120361328125, -1.952392578125, -1.6927490234375, -1.43310546875, -1.1734619140625, -0.913818359375, -0.6541748046875, -0.39453125, -0.1348876953125, 0.124755859375, 0.3843994140625, 0.64404296875, 0.9036865234375, 1.163330078125, 1.4229736328125, 1.6826171875, 1.9422607421875, 2.201904296875, 2.4615478515625, 2.72119140625, 2.9808349609375, 3.240478515625, 3.5001220703125, 3.759765625, 4.0194091796875, 4.279052734375, 4.5386962890625, 4.79833984375, 5.0579833984375, 5.317626953125, 5.5772705078125, 5.8369140625, 6.0965576171875, 6.356201171875, 6.6158447265625, 6.87548828125, 7.1351318359375, 7.394775390625, 7.6544189453125, 7.9140625]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 2.0, 4.0, 6.0, 4.0, 8.0, 6.0, 10.0, 8.0, 17.0, 13.0, 13.0, 18.0, 21.0, 30.0, 29.0, 31.0, 34.0, 37.0, 31.0, 43.0, 32.0, 31.0, 37.0, 41.0, 31.0, 31.0, 34.0, 48.0, 42.0, 33.0, 26.0, 34.0, 28.0, 27.0, 22.0, 25.0, 15.0, 16.0, 19.0, 11.0, 13.0, 8.0, 11.0, 9.0, 1.0, 5.0, 3.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-4.66796875, -4.5281982421875, -4.388427734375, -4.2486572265625, -4.10888671875, -3.9691162109375, -3.829345703125, -3.6895751953125, -3.5498046875, -3.4100341796875, -3.270263671875, -3.1304931640625, -2.99072265625, -2.8509521484375, -2.711181640625, -2.5714111328125, -2.431640625, -2.2918701171875, -2.152099609375, -2.0123291015625, -1.87255859375, -1.7327880859375, -1.593017578125, -1.4532470703125, -1.3134765625, -1.1737060546875, -1.033935546875, -0.8941650390625, -0.75439453125, -0.6146240234375, -0.474853515625, -0.3350830078125, -0.1953125, -0.0555419921875, 0.084228515625, 0.2239990234375, 0.36376953125, 0.5035400390625, 0.643310546875, 0.7830810546875, 0.9228515625, 1.0626220703125, 1.202392578125, 1.3421630859375, 1.48193359375, 1.6217041015625, 1.761474609375, 1.9012451171875, 2.041015625, 2.1807861328125, 2.320556640625, 2.4603271484375, 2.60009765625, 2.7398681640625, 2.879638671875, 3.0194091796875, 3.1591796875, 3.2989501953125, 3.438720703125, 3.5784912109375, 3.71826171875, 3.8580322265625, 3.997802734375, 4.1375732421875, 4.27734375]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 5.0, 7.0, 5.0, 7.0, 19.0, 23.0, 42.0, 47.0, 84.0, 120.0, 177.0, 272.0, 417.0, 661.0, 1028.0, 1669.0, 2677.0, 4360.0, 7193.0, 11435.0, 19345.0, 31278.0, 49744.0, 76799.0, 110031.0, 139863.0, 152909.0, 137617.0, 105133.0, 72695.0, 46957.0, 29619.0, 17953.0, 10841.0, 6524.0, 4072.0, 2517.0, 1559.0, 1017.0, 676.0, 402.0, 278.0, 169.0, 123.0, 68.0, 46.0, 29.0, 22.0, 13.0, 6.0, 7.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.283203125, -3.171661376953125, -3.06011962890625, -2.948577880859375, -2.8370361328125, -2.725494384765625, -2.61395263671875, -2.502410888671875, -2.390869140625, -2.279327392578125, -2.16778564453125, -2.056243896484375, -1.9447021484375, -1.833160400390625, -1.72161865234375, -1.610076904296875, -1.49853515625, -1.386993408203125, -1.27545166015625, -1.163909912109375, -1.0523681640625, -0.940826416015625, -0.82928466796875, -0.717742919921875, -0.606201171875, -0.494659423828125, -0.38311767578125, -0.271575927734375, -0.1600341796875, -0.048492431640625, 0.06304931640625, 0.174591064453125, 0.2861328125, 0.397674560546875, 0.50921630859375, 0.620758056640625, 0.7322998046875, 0.843841552734375, 0.95538330078125, 1.066925048828125, 1.178466796875, 1.290008544921875, 1.40155029296875, 1.513092041015625, 1.6246337890625, 1.736175537109375, 1.84771728515625, 1.959259033203125, 2.07080078125, 2.182342529296875, 2.29388427734375, 2.405426025390625, 2.5169677734375, 2.628509521484375, 2.74005126953125, 2.851593017578125, 2.963134765625, 3.074676513671875, 3.18621826171875, 3.297760009765625, 3.4093017578125, 3.520843505859375, 3.63238525390625, 3.743927001953125, 3.85546875]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 4.0, 5.0, 3.0, 8.0, 12.0, 12.0, 11.0, 21.0, 19.0, 18.0, 34.0, 34.0, 30.0, 54.0, 47.0, 48.0, 51.0, 60.0, 69.0, 53.0, 65.0, 63.0, 48.0, 35.0, 34.0, 29.0, 18.0, 30.0, 16.0, 19.0, 14.0, 6.0, 7.0, 7.0, 6.0, 4.0, 1.0, 2.0, 3.0, 4.0, 2.0], "bins": [-0.0005145072937011719, -0.0005019828677177429, -0.000489458441734314, -0.000476934015750885, -0.00046440958976745605, -0.0004518851637840271, -0.00043936073780059814, -0.0004268363118171692, -0.00041431188583374023, -0.0004017874598503113, -0.0003892630338668823, -0.00037673860788345337, -0.0003642141819000244, -0.00035168975591659546, -0.0003391653299331665, -0.00032664090394973755, -0.0003141164779663086, -0.00030159205198287964, -0.0002890676259994507, -0.00027654320001602173, -0.0002640187740325928, -0.0002514943480491638, -0.00023896992206573486, -0.0002264454960823059, -0.00021392107009887695, -0.000201396644115448, -0.00018887221813201904, -0.0001763477921485901, -0.00016382336616516113, -0.00015129894018173218, -0.00013877451419830322, -0.00012625008821487427, -0.00011372566223144531, -0.00010120123624801636, -8.86768102645874e-05, -7.615238428115845e-05, -6.362795829772949e-05, -5.110353231430054e-05, -3.857910633087158e-05, -2.6054680347442627e-05, -1.3530254364013672e-05, -1.0058283805847168e-06, 1.1518597602844238e-05, 2.4043023586273193e-05, 3.656744956970215e-05, 4.9091875553131104e-05, 6.161630153656006e-05, 7.414072751998901e-05, 8.666515350341797e-05, 9.918957948684692e-05, 0.00011171400547027588, 0.00012423843145370483, 0.0001367628574371338, 0.00014928728342056274, 0.0001618117094039917, 0.00017433613538742065, 0.0001868605613708496, 0.00019938498735427856, 0.00021190941333770752, 0.00022443383932113647, 0.00023695826530456543, 0.0002494826912879944, 0.00026200711727142334, 0.0002745315432548523, 0.00028705596923828125]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 8.0, 17.0, 11.0, 25.0, 38.0, 57.0, 86.0, 178.0, 289.0, 483.0, 831.0, 1510.0, 2662.0, 4837.0, 9217.0, 17901.0, 33906.0, 63845.0, 110386.0, 166724.0, 196716.0, 172682.0, 118251.0, 68929.0, 37210.0, 19544.0, 10067.0, 5386.0, 2981.0, 1614.0, 867.0, 534.0, 280.0, 183.0, 113.0, 67.0, 37.0, 47.0, 17.0, 7.0, 6.0, 5.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.57421875, -4.4293212890625, -4.284423828125, -4.1395263671875, -3.99462890625, -3.8497314453125, -3.704833984375, -3.5599365234375, -3.4150390625, -3.2701416015625, -3.125244140625, -2.9803466796875, -2.83544921875, -2.6905517578125, -2.545654296875, -2.4007568359375, -2.255859375, -2.1109619140625, -1.966064453125, -1.8211669921875, -1.67626953125, -1.5313720703125, -1.386474609375, -1.2415771484375, -1.0966796875, -0.9517822265625, -0.806884765625, -0.6619873046875, -0.51708984375, -0.3721923828125, -0.227294921875, -0.0823974609375, 0.0625, 0.2073974609375, 0.352294921875, 0.4971923828125, 0.64208984375, 0.7869873046875, 0.931884765625, 1.0767822265625, 1.2216796875, 1.3665771484375, 1.511474609375, 1.6563720703125, 1.80126953125, 1.9461669921875, 2.091064453125, 2.2359619140625, 2.380859375, 2.5257568359375, 2.670654296875, 2.8155517578125, 2.96044921875, 3.1053466796875, 3.250244140625, 3.3951416015625, 3.5400390625, 3.6849365234375, 3.829833984375, 3.9747314453125, 4.11962890625, 4.2645263671875, 4.409423828125, 4.5543212890625, 4.69921875]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 5.0, 5.0, 4.0, 11.0, 8.0, 5.0, 11.0, 12.0, 15.0, 16.0, 18.0, 22.0, 27.0, 39.0, 44.0, 40.0, 40.0, 41.0, 62.0, 59.0, 43.0, 52.0, 49.0, 48.0, 40.0, 45.0, 34.0, 27.0, 30.0, 22.0, 30.0, 18.0, 12.0, 12.0, 11.0, 9.0, 13.0, 2.0, 6.0, 9.0, 2.0, 2.0, 4.0, 1.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.99853515625, -0.9681015014648438, -0.9376678466796875, -0.9072341918945312, -0.876800537109375, -0.8463668823242188, -0.8159332275390625, -0.7854995727539062, -0.75506591796875, -0.7246322631835938, -0.6941986083984375, -0.6637649536132812, -0.633331298828125, -0.6028976440429688, -0.5724639892578125, -0.5420303344726562, -0.5115966796875, -0.48116302490234375, -0.4507293701171875, -0.42029571533203125, -0.389862060546875, -0.35942840576171875, -0.3289947509765625, -0.29856109619140625, -0.26812744140625, -0.23769378662109375, -0.2072601318359375, -0.17682647705078125, -0.146392822265625, -0.11595916748046875, -0.0855255126953125, -0.05509185791015625, -0.024658203125, 0.00577545166015625, 0.0362091064453125, 0.06664276123046875, 0.097076416015625, 0.12751007080078125, 0.1579437255859375, 0.18837738037109375, 0.21881103515625, 0.24924468994140625, 0.2796783447265625, 0.31011199951171875, 0.340545654296875, 0.37097930908203125, 0.4014129638671875, 0.43184661865234375, 0.4622802734375, 0.49271392822265625, 0.5231475830078125, 0.5535812377929688, 0.584014892578125, 0.6144485473632812, 0.6448822021484375, 0.6753158569335938, 0.70574951171875, 0.7361831665039062, 0.7666168212890625, 0.7970504760742188, 0.827484130859375, 0.8579177856445312, 0.8883514404296875, 0.9187850952148438, 0.94921875]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 4.0, 3.0, 7.0, 13.0, 12.0, 14.0, 18.0, 30.0, 33.0, 21.0, 37.0, 44.0, 37.0, 58.0, 45.0, 68.0, 62.0, 56.0, 44.0, 66.0, 58.0, 39.0, 35.0, 38.0, 27.0, 18.0, 22.0, 14.0, 14.0, 12.0, 8.0, 12.0, 4.0, 10.0, 3.0, 5.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.416698455810547, -11.070732116699219, -10.724766731262207, -10.378800392150879, -10.03283405303955, -9.686868667602539, -9.340902328491211, -8.994935989379883, -8.648969650268555, -8.303003311157227, -7.957037448883057, -7.611071586608887, -7.265105247497559, -6.919139385223389, -6.573173522949219, -6.227207183837891, -5.881241798400879, -5.535275936126709, -5.189309597015381, -4.843343734741211, -4.497377395629883, -4.151411533355713, -3.805445671081543, -3.459479570388794, -3.113513469696045, -2.767547369003296, -2.421581268310547, -2.075615406036377, -1.729649305343628, -1.383683204650879, -1.037717342376709, -0.69175124168396, -0.34578514099121094, 0.00018090009689331055, 0.34614694118499756, 0.692112922668457, 1.038079023361206, 1.384045124053955, 1.730010986328125, 2.075977087020874, 2.421943187713623, 2.767909288406372, 3.113875389099121, 3.459841251373291, 3.80580735206604, 4.151773452758789, 4.497739315032959, 4.843705177307129, 5.189671516418457, 5.535637378692627, 5.881603717803955, 6.227569580078125, 6.573535919189453, 6.919501781463623, 7.265467643737793, 7.611433982849121, 7.957399845123291, 8.303365707397461, 8.649332046508789, 8.995298385620117, 9.341263771057129, 9.687230110168457, 10.033195495605469, 10.379161834716797, 10.725128173828125]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 3.0, 4.0, 6.0, 4.0, 5.0, 12.0, 16.0, 20.0, 22.0, 24.0, 20.0, 38.0, 34.0, 33.0, 40.0, 51.0, 39.0, 44.0, 57.0, 56.0, 47.0, 45.0, 23.0, 33.0, 45.0, 38.0, 39.0, 45.0, 34.0, 17.0, 19.0, 20.0, 14.0, 16.0, 11.0, 8.0, 7.0, 2.0, 7.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.361013412475586, -8.113677024841309, -7.866341590881348, -7.61900520324707, -7.371669292449951, -7.124333381652832, -6.876997470855713, -6.629661560058594, -6.382325172424316, -6.134989261627197, -5.887653350830078, -5.640316963195801, -5.392981052398682, -5.1456451416015625, -4.898309230804443, -4.650973320007324, -4.403636932373047, -4.156301021575928, -3.9089648723602295, -3.6616289615631104, -3.414292812347412, -3.166956901550293, -2.919620990753174, -2.6722848415374756, -2.4249491691589355, -2.1776132583618164, -1.9302771091461182, -1.682941198348999, -1.4356050491333008, -1.1882691383361816, -0.940933108329773, -0.6935970783233643, -0.446260929107666, -0.19892491400241852, 0.04841110110282898, 0.2957471013069153, 0.543083131313324, 0.7904191017150879, 1.0377551317214966, 1.2850911617279053, 1.532427191734314, 1.7797632217407227, 2.027099132537842, 2.27443528175354, 2.521771192550659, 2.7691073417663574, 3.0164432525634766, 3.2637791633605957, 3.511115312576294, 3.758451223373413, 4.005787372589111, 4.2531232833862305, 4.50045919418335, 4.747795104980469, 4.995131492614746, 5.242467403411865, 5.489803314208984, 5.7371392250061035, 5.984475135803223, 6.2318115234375, 6.479147434234619, 6.726483345031738, 6.973819255828857, 7.221155166625977, 7.468491554260254]}, "gradients/decoder.bert.encoder.layer.12.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 2.0, 8.0, 8.0, 14.0, 23.0, 30.0, 55.0, 119.0, 169.0, 233.0, 414.0, 676.0, 1124.0, 1917.0, 3302.0, 5731.0, 10424.0, 19163.0, 36468.0, 71243.0, 142327.0, 288019.0, 558395.0, 892536.0, 921983.0, 601782.0, 315178.0, 157232.0, 78000.0, 40341.0, 20937.0, 11385.0, 6274.0, 3535.0, 2005.0, 1253.0, 744.0, 434.0, 272.0, 193.0, 123.0, 64.0, 50.0, 29.0, 25.0, 15.0, 8.0, 6.0, 5.0, 5.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.84375, -9.52685546875, -9.2099609375, -8.89306640625, -8.576171875, -8.25927734375, -7.9423828125, -7.62548828125, -7.30859375, -6.99169921875, -6.6748046875, -6.35791015625, -6.041015625, -5.72412109375, -5.4072265625, -5.09033203125, -4.7734375, -4.45654296875, -4.1396484375, -3.82275390625, -3.505859375, -3.18896484375, -2.8720703125, -2.55517578125, -2.23828125, -1.92138671875, -1.6044921875, -1.28759765625, -0.970703125, -0.65380859375, -0.3369140625, -0.02001953125, 0.296875, 0.61376953125, 0.9306640625, 1.24755859375, 1.564453125, 1.88134765625, 2.1982421875, 2.51513671875, 2.83203125, 3.14892578125, 3.4658203125, 3.78271484375, 4.099609375, 4.41650390625, 4.7333984375, 5.05029296875, 5.3671875, 5.68408203125, 6.0009765625, 6.31787109375, 6.634765625, 6.95166015625, 7.2685546875, 7.58544921875, 7.90234375, 8.21923828125, 8.5361328125, 8.85302734375, 9.169921875, 9.48681640625, 9.8037109375, 10.12060546875, 10.4375]}, "gradients/decoder.bert.encoder.layer.12.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 5.0, 7.0, 4.0, 9.0, 14.0, 24.0, 16.0, 31.0, 22.0, 28.0, 30.0, 43.0, 36.0, 38.0, 46.0, 36.0, 43.0, 43.0, 40.0, 32.0, 51.0, 42.0, 45.0, 37.0, 48.0, 40.0, 30.0, 22.0, 29.0, 17.0, 15.0, 16.0, 19.0, 6.0, 9.0, 9.0, 7.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.78125, -5.6080322265625, -5.434814453125, -5.2615966796875, -5.08837890625, -4.9151611328125, -4.741943359375, -4.5687255859375, -4.3955078125, -4.2222900390625, -4.049072265625, -3.8758544921875, -3.70263671875, -3.5294189453125, -3.356201171875, -3.1829833984375, -3.009765625, -2.8365478515625, -2.663330078125, -2.4901123046875, -2.31689453125, -2.1436767578125, -1.970458984375, -1.7972412109375, -1.6240234375, -1.4508056640625, -1.277587890625, -1.1043701171875, -0.93115234375, -0.7579345703125, -0.584716796875, -0.4114990234375, -0.23828125, -0.0650634765625, 0.108154296875, 0.2813720703125, 0.45458984375, 0.6278076171875, 0.801025390625, 0.9742431640625, 1.1474609375, 1.3206787109375, 1.493896484375, 1.6671142578125, 1.84033203125, 2.0135498046875, 2.186767578125, 2.3599853515625, 2.533203125, 2.7064208984375, 2.879638671875, 3.0528564453125, 3.22607421875, 3.3992919921875, 3.572509765625, 3.7457275390625, 3.9189453125, 4.0921630859375, 4.265380859375, 4.4385986328125, 4.61181640625, 4.7850341796875, 4.958251953125, 5.1314697265625, 5.3046875]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 10.0, 9.0, 15.0, 17.0, 36.0, 48.0, 63.0, 111.0, 170.0, 271.0, 429.0, 715.0, 1236.0, 2087.0, 3749.0, 6885.0, 12810.0, 24460.0, 47976.0, 93440.0, 183395.0, 348800.0, 608011.0, 853223.0, 817280.0, 549646.0, 307073.0, 160905.0, 82480.0, 41739.0, 21769.0, 11421.0, 6032.0, 3313.0, 1892.0, 1114.0, 655.0, 360.0, 229.0, 138.0, 80.0, 65.0, 38.0, 29.0, 21.0, 15.0, 6.0, 6.0, 6.0, 6.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-10.859375, -10.529296875, -10.19921875, -9.869140625, -9.5390625, -9.208984375, -8.87890625, -8.548828125, -8.21875, -7.888671875, -7.55859375, -7.228515625, -6.8984375, -6.568359375, -6.23828125, -5.908203125, -5.578125, -5.248046875, -4.91796875, -4.587890625, -4.2578125, -3.927734375, -3.59765625, -3.267578125, -2.9375, -2.607421875, -2.27734375, -1.947265625, -1.6171875, -1.287109375, -0.95703125, -0.626953125, -0.296875, 0.033203125, 0.36328125, 0.693359375, 1.0234375, 1.353515625, 1.68359375, 2.013671875, 2.34375, 2.673828125, 3.00390625, 3.333984375, 3.6640625, 3.994140625, 4.32421875, 4.654296875, 4.984375, 5.314453125, 5.64453125, 5.974609375, 6.3046875, 6.634765625, 6.96484375, 7.294921875, 7.625, 7.955078125, 8.28515625, 8.615234375, 8.9453125, 9.275390625, 9.60546875, 9.935546875, 10.265625]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 9.0, 2.0, 13.0, 16.0, 20.0, 19.0, 20.0, 36.0, 53.0, 61.0, 74.0, 85.0, 122.0, 138.0, 150.0, 156.0, 206.0, 233.0, 251.0, 262.0, 255.0, 257.0, 234.0, 261.0, 197.0, 191.0, 168.0, 135.0, 99.0, 83.0, 64.0, 41.0, 40.0, 39.0, 20.0, 15.0, 14.0, 10.0, 8.0, 7.0, 6.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.306640625, -3.2080078125, -3.109375, -3.0107421875, -2.912109375, -2.8134765625, -2.71484375, -2.6162109375, -2.517578125, -2.4189453125, -2.3203125, -2.2216796875, -2.123046875, -2.0244140625, -1.92578125, -1.8271484375, -1.728515625, -1.6298828125, -1.53125, -1.4326171875, -1.333984375, -1.2353515625, -1.13671875, -1.0380859375, -0.939453125, -0.8408203125, -0.7421875, -0.6435546875, -0.544921875, -0.4462890625, -0.34765625, -0.2490234375, -0.150390625, -0.0517578125, 0.046875, 0.1455078125, 0.244140625, 0.3427734375, 0.44140625, 0.5400390625, 0.638671875, 0.7373046875, 0.8359375, 0.9345703125, 1.033203125, 1.1318359375, 1.23046875, 1.3291015625, 1.427734375, 1.5263671875, 1.625, 1.7236328125, 1.822265625, 1.9208984375, 2.01953125, 2.1181640625, 2.216796875, 2.3154296875, 2.4140625, 2.5126953125, 2.611328125, 2.7099609375, 2.80859375, 2.9072265625, 3.005859375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 7.0, 7.0, 8.0, 13.0, 17.0, 19.0, 18.0, 23.0, 30.0, 35.0, 41.0, 34.0, 39.0, 51.0, 65.0, 50.0, 56.0, 65.0, 47.0, 44.0, 50.0, 44.0, 33.0, 38.0, 27.0, 16.0, 21.0, 21.0, 19.0, 15.0, 8.0, 7.0, 8.0, 8.0, 4.0, 1.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.058485984802246, -9.7316312789917, -9.404777526855469, -9.077922821044922, -8.751068115234375, -8.424213409423828, -8.097358703613281, -7.770504951477051, -7.443650245666504, -7.116795539855957, -6.789941310882568, -6.46308708190918, -6.136232376098633, -5.809377670288086, -5.482523441314697, -5.155669212341309, -4.828814506530762, -4.501959800720215, -4.175105571746826, -3.8482511043548584, -3.5213966369628906, -3.194542169570923, -2.867687702178955, -2.5408332347869873, -2.2139787673950195, -1.8871243000030518, -1.560269832611084, -1.2334153652191162, -0.9065608978271484, -0.5797064304351807, -0.2528519630432129, 0.07400250434875488, 0.40085697174072266, 0.7277114391326904, 1.0545659065246582, 1.381420373916626, 1.7082748413085938, 2.0351293087005615, 2.3619837760925293, 2.688838243484497, 3.015692710876465, 3.3425471782684326, 3.6694016456604004, 3.996256113052368, 4.323110580444336, 4.649965286254883, 4.9768195152282715, 5.30367374420166, 5.630528450012207, 5.957383155822754, 6.284237384796143, 6.611091613769531, 6.937946319580078, 7.264801025390625, 7.591655254364014, 7.918509483337402, 8.24536418914795, 8.572218894958496, 8.899072647094727, 9.225927352905273, 9.55278205871582, 9.879636764526367, 10.206491470336914, 10.533345222473145, 10.860199928283691]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 6.0, 6.0, 2.0, 5.0, 11.0, 11.0, 17.0, 15.0, 17.0, 20.0, 29.0, 28.0, 35.0, 30.0, 35.0, 44.0, 41.0, 37.0, 49.0, 36.0, 54.0, 46.0, 46.0, 39.0, 39.0, 23.0, 39.0, 28.0, 25.0, 34.0, 22.0, 27.0, 22.0, 16.0, 13.0, 12.0, 9.0, 8.0, 6.0, 7.0, 4.0, 7.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-7.039731502532959, -6.835515975952148, -6.63129997253418, -6.427084445953369, -6.222868919372559, -6.01865291595459, -5.814437389373779, -5.610221862792969, -5.406005859375, -5.2017903327941895, -4.997574329376221, -4.79335880279541, -4.5891432762146, -4.384927749633789, -4.18071174621582, -3.9764962196350098, -3.772280693054199, -3.5680649280548096, -3.363849401473999, -3.1596336364746094, -2.955418109893799, -2.751202344894409, -2.5469865798950195, -2.342771053314209, -2.1385552883148193, -1.9343396425247192, -1.7301239967346191, -1.5259082317352295, -1.3216925859451294, -1.1174769401550293, -0.9132611751556396, -0.7090455293655396, -0.5048298835754395, -0.30061420798301697, -0.09639853239059448, 0.10781717300415039, 0.3120328187942505, 0.5162484645843506, 0.7204642295837402, 0.9246798753738403, 1.1288955211639404, 1.3331111669540405, 1.5373268127441406, 1.7415425777435303, 1.9457582235336304, 2.1499738693237305, 2.35418963432312, 2.5584053993225098, 2.7626209259033203, 2.96683669090271, 3.1710522174835205, 3.37526798248291, 3.5794835090637207, 3.7836992740631104, 3.9879150390625, 4.1921305656433105, 4.396346092224121, 4.600561618804932, 4.8047776222229, 5.008993148803711, 5.2132086753845215, 5.417424201965332, 5.621640205383301, 5.825855731964111, 6.03007173538208]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 5.0, 9.0, 12.0, 16.0, 13.0, 26.0, 30.0, 45.0, 62.0, 96.0, 138.0, 221.0, 282.0, 498.0, 793.0, 1277.0, 2109.0, 3977.0, 7883.0, 16124.0, 33453.0, 70449.0, 137646.0, 217921.0, 230630.0, 159375.0, 84183.0, 41190.0, 19282.0, 9492.0, 4835.0, 2555.0, 1482.0, 853.0, 565.0, 353.0, 220.0, 125.0, 110.0, 66.0, 43.0, 42.0, 25.0, 23.0, 5.0, 6.0, 7.0, 8.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.84765625, -5.671142578125, -5.49462890625, -5.318115234375, -5.1416015625, -4.965087890625, -4.78857421875, -4.612060546875, -4.435546875, -4.259033203125, -4.08251953125, -3.906005859375, -3.7294921875, -3.552978515625, -3.37646484375, -3.199951171875, -3.0234375, -2.846923828125, -2.67041015625, -2.493896484375, -2.3173828125, -2.140869140625, -1.96435546875, -1.787841796875, -1.611328125, -1.434814453125, -1.25830078125, -1.081787109375, -0.9052734375, -0.728759765625, -0.55224609375, -0.375732421875, -0.19921875, -0.022705078125, 0.15380859375, 0.330322265625, 0.5068359375, 0.683349609375, 0.85986328125, 1.036376953125, 1.212890625, 1.389404296875, 1.56591796875, 1.742431640625, 1.9189453125, 2.095458984375, 2.27197265625, 2.448486328125, 2.625, 2.801513671875, 2.97802734375, 3.154541015625, 3.3310546875, 3.507568359375, 3.68408203125, 3.860595703125, 4.037109375, 4.213623046875, 4.39013671875, 4.566650390625, 4.7431640625, 4.919677734375, 5.09619140625, 5.272705078125, 5.44921875]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 6.0, 5.0, 8.0, 7.0, 9.0, 9.0, 14.0, 12.0, 22.0, 21.0, 26.0, 28.0, 32.0, 31.0, 39.0, 42.0, 45.0, 45.0, 44.0, 39.0, 37.0, 46.0, 54.0, 42.0, 34.0, 38.0, 31.0, 31.0, 26.0, 25.0, 24.0, 22.0, 15.0, 18.0, 14.0, 10.0, 9.0, 13.0, 8.0, 8.0, 5.0, 6.0, 6.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-7.89453125, -7.66717529296875, -7.4398193359375, -7.21246337890625, -6.985107421875, -6.75775146484375, -6.5303955078125, -6.30303955078125, -6.07568359375, -5.84832763671875, -5.6209716796875, -5.39361572265625, -5.166259765625, -4.93890380859375, -4.7115478515625, -4.48419189453125, -4.2568359375, -4.02947998046875, -3.8021240234375, -3.57476806640625, -3.347412109375, -3.12005615234375, -2.8927001953125, -2.66534423828125, -2.43798828125, -2.21063232421875, -1.9832763671875, -1.75592041015625, -1.528564453125, -1.30120849609375, -1.0738525390625, -0.84649658203125, -0.619140625, -0.39178466796875, -0.1644287109375, 0.06292724609375, 0.290283203125, 0.51763916015625, 0.7449951171875, 0.97235107421875, 1.19970703125, 1.42706298828125, 1.6544189453125, 1.88177490234375, 2.109130859375, 2.33648681640625, 2.5638427734375, 2.79119873046875, 3.0185546875, 3.24591064453125, 3.4732666015625, 3.70062255859375, 3.927978515625, 4.15533447265625, 4.3826904296875, 4.61004638671875, 4.83740234375, 5.06475830078125, 5.2921142578125, 5.51947021484375, 5.746826171875, 5.97418212890625, 6.2015380859375, 6.42889404296875, 6.65625]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 4.0, 4.0, 8.0, 16.0, 13.0, 18.0, 17.0, 25.0, 31.0, 64.0, 75.0, 122.0, 176.0, 245.0, 392.0, 562.0, 947.0, 1653.0, 2827.0, 5380.0, 10926.0, 23824.0, 56534.0, 138850.0, 287931.0, 281792.0, 134677.0, 54788.0, 23310.0, 10831.0, 5237.0, 2972.0, 1581.0, 968.0, 542.0, 378.0, 266.0, 174.0, 119.0, 91.0, 47.0, 32.0, 34.0, 26.0, 18.0, 9.0, 5.0, 2.0, 7.0, 7.0, 3.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.1015625, -7.840087890625, -7.57861328125, -7.317138671875, -7.0556640625, -6.794189453125, -6.53271484375, -6.271240234375, -6.009765625, -5.748291015625, -5.48681640625, -5.225341796875, -4.9638671875, -4.702392578125, -4.44091796875, -4.179443359375, -3.91796875, -3.656494140625, -3.39501953125, -3.133544921875, -2.8720703125, -2.610595703125, -2.34912109375, -2.087646484375, -1.826171875, -1.564697265625, -1.30322265625, -1.041748046875, -0.7802734375, -0.518798828125, -0.25732421875, 0.004150390625, 0.265625, 0.527099609375, 0.78857421875, 1.050048828125, 1.3115234375, 1.572998046875, 1.83447265625, 2.095947265625, 2.357421875, 2.618896484375, 2.88037109375, 3.141845703125, 3.4033203125, 3.664794921875, 3.92626953125, 4.187744140625, 4.44921875, 4.710693359375, 4.97216796875, 5.233642578125, 5.4951171875, 5.756591796875, 6.01806640625, 6.279541015625, 6.541015625, 6.802490234375, 7.06396484375, 7.325439453125, 7.5869140625, 7.848388671875, 8.10986328125, 8.371337890625, 8.6328125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 3.0, 4.0, 6.0, 4.0, 6.0, 11.0, 6.0, 7.0, 15.0, 16.0, 14.0, 26.0, 17.0, 23.0, 28.0, 27.0, 36.0, 28.0, 27.0, 41.0, 27.0, 41.0, 32.0, 46.0, 39.0, 42.0, 42.0, 45.0, 34.0, 31.0, 37.0, 26.0, 30.0, 20.0, 18.0, 20.0, 21.0, 15.0, 22.0, 11.0, 8.0, 12.0, 6.0, 6.0, 2.0, 7.0, 4.0, 5.0, 1.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-3.974609375, -3.851348876953125, -3.72808837890625, -3.604827880859375, -3.4815673828125, -3.358306884765625, -3.23504638671875, -3.111785888671875, -2.988525390625, -2.865264892578125, -2.74200439453125, -2.618743896484375, -2.4954833984375, -2.372222900390625, -2.24896240234375, -2.125701904296875, -2.00244140625, -1.879180908203125, -1.75592041015625, -1.632659912109375, -1.5093994140625, -1.386138916015625, -1.26287841796875, -1.139617919921875, -1.016357421875, -0.893096923828125, -0.76983642578125, -0.646575927734375, -0.5233154296875, -0.400054931640625, -0.27679443359375, -0.153533935546875, -0.0302734375, 0.092987060546875, 0.21624755859375, 0.339508056640625, 0.4627685546875, 0.586029052734375, 0.70928955078125, 0.832550048828125, 0.955810546875, 1.079071044921875, 1.20233154296875, 1.325592041015625, 1.4488525390625, 1.572113037109375, 1.69537353515625, 1.818634033203125, 1.94189453125, 2.065155029296875, 2.18841552734375, 2.311676025390625, 2.4349365234375, 2.558197021484375, 2.68145751953125, 2.804718017578125, 2.927978515625, 3.051239013671875, 3.17449951171875, 3.297760009765625, 3.4210205078125, 3.544281005859375, 3.66754150390625, 3.790802001953125, 3.9140625]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 3.0, 4.0, 4.0, 8.0, 10.0, 6.0, 10.0, 23.0, 37.0, 46.0, 63.0, 69.0, 114.0, 138.0, 194.0, 290.0, 392.0, 610.0, 789.0, 1202.0, 1816.0, 2705.0, 4054.0, 6774.0, 10859.0, 18451.0, 32108.0, 56797.0, 103452.0, 177006.0, 227192.0, 170724.0, 99449.0, 55022.0, 30873.0, 17917.0, 10730.0, 6418.0, 4001.0, 2647.0, 1679.0, 1130.0, 818.0, 541.0, 359.0, 296.0, 219.0, 134.0, 119.0, 76.0, 64.0, 36.0, 27.0, 18.0, 23.0, 7.0, 4.0, 9.0, 3.0, 1.0, 2.0, 1.0, 2.0], "bins": [-2.47265625, -2.394073486328125, -2.31549072265625, -2.236907958984375, -2.1583251953125, -2.079742431640625, -2.00115966796875, -1.922576904296875, -1.843994140625, -1.765411376953125, -1.68682861328125, -1.608245849609375, -1.5296630859375, -1.451080322265625, -1.37249755859375, -1.293914794921875, -1.21533203125, -1.136749267578125, -1.05816650390625, -0.979583740234375, -0.9010009765625, -0.822418212890625, -0.74383544921875, -0.665252685546875, -0.586669921875, -0.508087158203125, -0.42950439453125, -0.350921630859375, -0.2723388671875, -0.193756103515625, -0.11517333984375, -0.036590576171875, 0.0419921875, 0.120574951171875, 0.19915771484375, 0.277740478515625, 0.3563232421875, 0.434906005859375, 0.51348876953125, 0.592071533203125, 0.670654296875, 0.749237060546875, 0.82781982421875, 0.906402587890625, 0.9849853515625, 1.063568115234375, 1.14215087890625, 1.220733642578125, 1.29931640625, 1.377899169921875, 1.45648193359375, 1.535064697265625, 1.6136474609375, 1.692230224609375, 1.77081298828125, 1.849395751953125, 1.927978515625, 2.006561279296875, 2.08514404296875, 2.163726806640625, 2.2423095703125, 2.320892333984375, 2.39947509765625, 2.478057861328125, 2.556640625]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 0.0, 5.0, 2.0, 2.0, 5.0, 5.0, 14.0, 14.0, 16.0, 25.0, 34.0, 45.0, 49.0, 55.0, 65.0, 94.0, 83.0, 77.0, 85.0, 74.0, 50.0, 43.0, 41.0, 25.0, 33.0, 15.0, 9.0, 5.0, 9.0, 11.0, 7.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00013530254364013672, -0.00013064779341220856, -0.0001259930431842804, -0.00012133829295635223, -0.00011668354272842407, -0.00011202879250049591, -0.00010737404227256775, -0.00010271929204463959, -9.806454181671143e-05, -9.340979158878326e-05, -8.87550413608551e-05, -8.410029113292694e-05, -7.944554090499878e-05, -7.479079067707062e-05, -7.013604044914246e-05, -6.54812902212143e-05, -6.082653999328613e-05, -5.617178976535797e-05, -5.151703953742981e-05, -4.686228930950165e-05, -4.2207539081573486e-05, -3.7552788853645325e-05, -3.289803862571716e-05, -2.8243288397789e-05, -2.358853816986084e-05, -1.8933787941932678e-05, -1.4279037714004517e-05, -9.624287486076355e-06, -4.969537258148193e-06, -3.1478703022003174e-07, 4.33996319770813e-06, 8.994713425636292e-06, 1.3649463653564453e-05, 1.8304213881492615e-05, 2.2958964109420776e-05, 2.7613714337348938e-05, 3.22684645652771e-05, 3.692321479320526e-05, 4.157796502113342e-05, 4.6232715249061584e-05, 5.0887465476989746e-05, 5.554221570491791e-05, 6.019696593284607e-05, 6.485171616077423e-05, 6.950646638870239e-05, 7.416121661663055e-05, 7.881596684455872e-05, 8.347071707248688e-05, 8.812546730041504e-05, 9.27802175283432e-05, 9.743496775627136e-05, 0.00010208971798419952, 0.00010674446821212769, 0.00011139921844005585, 0.00011605396866798401, 0.00012070871889591217, 0.00012536346912384033, 0.0001300182193517685, 0.00013467296957969666, 0.00013932771980762482, 0.00014398247003555298, 0.00014863722026348114, 0.0001532919704914093, 0.00015794672071933746, 0.00016260147094726562]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 3.0, 7.0, 11.0, 12.0, 25.0, 37.0, 53.0, 70.0, 103.0, 147.0, 238.0, 314.0, 591.0, 838.0, 1230.0, 1955.0, 3012.0, 5140.0, 9008.0, 15996.0, 30253.0, 59942.0, 116122.0, 195561.0, 230537.0, 172987.0, 96941.0, 48975.0, 25197.0, 13461.0, 7534.0, 4500.0, 2773.0, 1698.0, 1120.0, 692.0, 500.0, 303.0, 188.0, 151.0, 97.0, 82.0, 51.0, 33.0, 21.0, 17.0, 8.0, 12.0, 5.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.716796875, -2.630157470703125, -2.54351806640625, -2.456878662109375, -2.3702392578125, -2.283599853515625, -2.19696044921875, -2.110321044921875, -2.023681640625, -1.937042236328125, -1.85040283203125, -1.763763427734375, -1.6771240234375, -1.590484619140625, -1.50384521484375, -1.417205810546875, -1.33056640625, -1.243927001953125, -1.15728759765625, -1.070648193359375, -0.9840087890625, -0.897369384765625, -0.81072998046875, -0.724090576171875, -0.637451171875, -0.550811767578125, -0.46417236328125, -0.377532958984375, -0.2908935546875, -0.204254150390625, -0.11761474609375, -0.030975341796875, 0.0556640625, 0.142303466796875, 0.22894287109375, 0.315582275390625, 0.4022216796875, 0.488861083984375, 0.57550048828125, 0.662139892578125, 0.748779296875, 0.835418701171875, 0.92205810546875, 1.008697509765625, 1.0953369140625, 1.181976318359375, 1.26861572265625, 1.355255126953125, 1.44189453125, 1.528533935546875, 1.61517333984375, 1.701812744140625, 1.7884521484375, 1.875091552734375, 1.96173095703125, 2.048370361328125, 2.135009765625, 2.221649169921875, 2.30828857421875, 2.394927978515625, 2.4815673828125, 2.568206787109375, 2.65484619140625, 2.741485595703125, 2.828125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 4.0, 6.0, 9.0, 15.0, 12.0, 21.0, 26.0, 27.0, 40.0, 51.0, 60.0, 78.0, 72.0, 59.0, 71.0, 72.0, 64.0, 63.0, 58.0, 43.0, 27.0, 36.0, 19.0, 15.0, 13.0, 11.0, 7.0, 3.0, 4.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.86669921875, -0.838775634765625, -0.81085205078125, -0.782928466796875, -0.7550048828125, -0.727081298828125, -0.69915771484375, -0.671234130859375, -0.643310546875, -0.615386962890625, -0.58746337890625, -0.559539794921875, -0.5316162109375, -0.503692626953125, -0.47576904296875, -0.447845458984375, -0.419921875, -0.391998291015625, -0.36407470703125, -0.336151123046875, -0.3082275390625, -0.280303955078125, -0.25238037109375, -0.224456787109375, -0.196533203125, -0.168609619140625, -0.14068603515625, -0.112762451171875, -0.0848388671875, -0.056915283203125, -0.02899169921875, -0.001068115234375, 0.02685546875, 0.054779052734375, 0.08270263671875, 0.110626220703125, 0.1385498046875, 0.166473388671875, 0.19439697265625, 0.222320556640625, 0.250244140625, 0.278167724609375, 0.30609130859375, 0.334014892578125, 0.3619384765625, 0.389862060546875, 0.41778564453125, 0.445709228515625, 0.4736328125, 0.501556396484375, 0.52947998046875, 0.557403564453125, 0.5853271484375, 0.613250732421875, 0.64117431640625, 0.669097900390625, 0.697021484375, 0.724945068359375, 0.75286865234375, 0.780792236328125, 0.8087158203125, 0.836639404296875, 0.86456298828125, 0.892486572265625, 0.92041015625]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 7.0, 9.0, 11.0, 13.0, 13.0, 21.0, 25.0, 27.0, 38.0, 26.0, 44.0, 41.0, 47.0, 54.0, 64.0, 61.0, 62.0, 52.0, 46.0, 58.0, 42.0, 32.0, 40.0, 28.0, 24.0, 16.0, 23.0, 19.0, 14.0, 8.0, 9.0, 5.0, 8.0, 3.0, 2.0, 5.0, 5.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.569692611694336, -10.22970199584961, -9.8897123336792, -9.549721717834473, -9.209731101989746, -8.86974048614502, -8.52975082397461, -8.189760208129883, -7.849769592285156, -7.509779453277588, -7.169788837432861, -6.829798698425293, -6.489808082580566, -6.149817943572998, -5.80982780456543, -5.469837188720703, -5.129847049713135, -4.789856910705566, -4.44986629486084, -4.1098761558532715, -3.769885540008545, -3.4298954010009766, -3.089905023574829, -2.7499146461486816, -2.409924268722534, -2.0699338912963867, -1.7299435138702393, -1.3899532556533813, -1.0499628782272339, -0.7099725008010864, -0.3699822425842285, -0.029991865158081055, 0.3099985122680664, 0.6499888896942139, 0.9899792075157166, 1.3299695253372192, 1.6699599027633667, 2.0099501609802246, 2.349940538406372, 2.6899309158325195, 3.029921293258667, 3.3699116706848145, 3.709902048110962, 4.049892425537109, 4.389882564544678, 4.729873180389404, 5.069863319396973, 5.409853935241699, 5.749844074249268, 6.089834213256836, 6.4298248291015625, 6.769814968109131, 7.109805583953857, 7.449795722961426, 7.789786338806152, 8.129776000976562, 8.469766616821289, 8.809757232666016, 9.149746894836426, 9.489737510681152, 9.829728126525879, 10.169718742370605, 10.509708404541016, 10.849699020385742, 11.189689636230469]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 7.0, 6.0, 4.0, 3.0, 5.0, 14.0, 13.0, 9.0, 22.0, 15.0, 23.0, 28.0, 31.0, 24.0, 41.0, 40.0, 42.0, 37.0, 41.0, 40.0, 50.0, 51.0, 48.0, 35.0, 47.0, 29.0, 32.0, 37.0, 26.0, 29.0, 27.0, 25.0, 25.0, 20.0, 16.0, 14.0, 9.0, 10.0, 7.0, 8.0, 4.0, 5.0, 6.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-6.939610958099365, -6.736649036407471, -6.533687114715576, -6.330724716186523, -6.127762794494629, -5.924800872802734, -5.72183895111084, -5.518877029418945, -5.315915107727051, -5.112953186035156, -4.909991264343262, -4.707029342651367, -4.5040669441223145, -4.30110502243042, -4.098143100738525, -3.895181179046631, -3.692218780517578, -3.4892568588256836, -3.28629469871521, -3.0833327770233154, -2.880370616912842, -2.6774086952209473, -2.4744467735290527, -2.271484851837158, -2.0685226917266846, -1.8655606508255005, -1.6625986099243164, -1.4596366882324219, -1.2566746473312378, -1.0537126064300537, -0.8507506847381592, -0.6477886438369751, -0.4448270797729492, -0.24186506867408752, -0.03890305757522583, 0.16405892372131348, 0.36702096462249756, 0.5699830055236816, 0.7729449272155762, 0.9759069681167603, 1.1788690090179443, 1.3818310499191284, 1.5847930908203125, 1.787755012512207, 1.9907170534133911, 2.193679094314575, 2.3966410160064697, 2.5996031761169434, 2.802565097808838, 3.0055270195007324, 3.208489179611206, 3.4114511013031006, 3.614413261413574, 3.8173751831054688, 4.020337104797363, 4.223299026489258, 4.426260948181152, 4.629222869873047, 4.832184791564941, 5.035146713256836, 5.238109111785889, 5.441071033477783, 5.644032955169678, 5.846994876861572, 6.049957275390625]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 6.0, 3.0, 15.0, 18.0, 26.0, 41.0, 63.0, 94.0, 173.0, 237.0, 403.0, 610.0, 1059.0, 1722.0, 2980.0, 4978.0, 8442.0, 14240.0, 23931.0, 39258.0, 61559.0, 91051.0, 121824.0, 142317.0, 143440.0, 125145.0, 95260.0, 64905.0, 41619.0, 25329.0, 15426.0, 9033.0, 5319.0, 3239.0, 1881.0, 1137.0, 672.0, 432.0, 267.0, 155.0, 85.0, 58.0, 44.0, 28.0, 18.0, 10.0, 9.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.296875, -6.09417724609375, -5.8914794921875, -5.68878173828125, -5.486083984375, -5.28338623046875, -5.0806884765625, -4.87799072265625, -4.67529296875, -4.47259521484375, -4.2698974609375, -4.06719970703125, -3.864501953125, -3.66180419921875, -3.4591064453125, -3.25640869140625, -3.0537109375, -2.85101318359375, -2.6483154296875, -2.44561767578125, -2.242919921875, -2.04022216796875, -1.8375244140625, -1.63482666015625, -1.43212890625, -1.22943115234375, -1.0267333984375, -0.82403564453125, -0.621337890625, -0.41864013671875, -0.2159423828125, -0.01324462890625, 0.189453125, 0.39215087890625, 0.5948486328125, 0.79754638671875, 1.000244140625, 1.20294189453125, 1.4056396484375, 1.60833740234375, 1.81103515625, 2.01373291015625, 2.2164306640625, 2.41912841796875, 2.621826171875, 2.82452392578125, 3.0272216796875, 3.22991943359375, 3.4326171875, 3.63531494140625, 3.8380126953125, 4.04071044921875, 4.243408203125, 4.44610595703125, 4.6488037109375, 4.85150146484375, 5.05419921875, 5.25689697265625, 5.4595947265625, 5.66229248046875, 5.864990234375, 6.06768798828125, 6.2703857421875, 6.47308349609375, 6.67578125]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 9.0, 6.0, 6.0, 6.0, 11.0, 13.0, 18.0, 13.0, 14.0, 27.0, 26.0, 30.0, 36.0, 44.0, 30.0, 39.0, 39.0, 42.0, 47.0, 48.0, 46.0, 33.0, 50.0, 47.0, 36.0, 37.0, 26.0, 38.0, 24.0, 28.0, 30.0, 20.0, 16.0, 15.0, 16.0, 15.0, 5.0, 2.0, 4.0, 5.0, 5.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0], "bins": [-8.703125, -8.467529296875, -8.23193359375, -7.996337890625, -7.7607421875, -7.525146484375, -7.28955078125, -7.053955078125, -6.818359375, -6.582763671875, -6.34716796875, -6.111572265625, -5.8759765625, -5.640380859375, -5.40478515625, -5.169189453125, -4.93359375, -4.697998046875, -4.46240234375, -4.226806640625, -3.9912109375, -3.755615234375, -3.52001953125, -3.284423828125, -3.048828125, -2.813232421875, -2.57763671875, -2.342041015625, -2.1064453125, -1.870849609375, -1.63525390625, -1.399658203125, -1.1640625, -0.928466796875, -0.69287109375, -0.457275390625, -0.2216796875, 0.013916015625, 0.24951171875, 0.485107421875, 0.720703125, 0.956298828125, 1.19189453125, 1.427490234375, 1.6630859375, 1.898681640625, 2.13427734375, 2.369873046875, 2.60546875, 2.841064453125, 3.07666015625, 3.312255859375, 3.5478515625, 3.783447265625, 4.01904296875, 4.254638671875, 4.490234375, 4.725830078125, 4.96142578125, 5.197021484375, 5.4326171875, 5.668212890625, 5.90380859375, 6.139404296875, 6.375]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 7.0, 13.0, 16.0, 15.0, 41.0, 41.0, 83.0, 127.0, 192.0, 327.0, 517.0, 893.0, 1574.0, 2675.0, 5187.0, 9335.0, 17714.0, 31916.0, 56993.0, 94969.0, 139322.0, 171948.0, 169747.0, 134694.0, 90356.0, 54075.0, 29948.0, 15993.0, 8822.0, 4788.0, 2627.0, 1505.0, 846.0, 476.0, 282.0, 179.0, 102.0, 75.0, 49.0, 31.0, 19.0, 13.0, 11.0, 6.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.4453125, -7.2047119140625, -6.964111328125, -6.7235107421875, -6.48291015625, -6.2423095703125, -6.001708984375, -5.7611083984375, -5.5205078125, -5.2799072265625, -5.039306640625, -4.7987060546875, -4.55810546875, -4.3175048828125, -4.076904296875, -3.8363037109375, -3.595703125, -3.3551025390625, -3.114501953125, -2.8739013671875, -2.63330078125, -2.3927001953125, -2.152099609375, -1.9114990234375, -1.6708984375, -1.4302978515625, -1.189697265625, -0.9490966796875, -0.70849609375, -0.4678955078125, -0.227294921875, 0.0133056640625, 0.25390625, 0.4945068359375, 0.735107421875, 0.9757080078125, 1.21630859375, 1.4569091796875, 1.697509765625, 1.9381103515625, 2.1787109375, 2.4193115234375, 2.659912109375, 2.9005126953125, 3.14111328125, 3.3817138671875, 3.622314453125, 3.8629150390625, 4.103515625, 4.3441162109375, 4.584716796875, 4.8253173828125, 5.06591796875, 5.3065185546875, 5.547119140625, 5.7877197265625, 6.0283203125, 6.2689208984375, 6.509521484375, 6.7501220703125, 6.99072265625, 7.2313232421875, 7.471923828125, 7.7125244140625, 7.953125]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 3.0, 8.0, 3.0, 6.0, 4.0, 9.0, 13.0, 9.0, 12.0, 19.0, 15.0, 15.0, 15.0, 20.0, 20.0, 27.0, 30.0, 28.0, 25.0, 42.0, 40.0, 42.0, 33.0, 39.0, 34.0, 44.0, 47.0, 41.0, 36.0, 26.0, 30.0, 34.0, 32.0, 30.0, 34.0, 22.0, 12.0, 17.0, 13.0, 15.0, 10.0, 10.0, 10.0, 8.0, 4.0, 7.0, 6.0, 2.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.015625, -3.88885498046875, -3.7620849609375, -3.63531494140625, -3.508544921875, -3.38177490234375, -3.2550048828125, -3.12823486328125, -3.00146484375, -2.87469482421875, -2.7479248046875, -2.62115478515625, -2.494384765625, -2.36761474609375, -2.2408447265625, -2.11407470703125, -1.9873046875, -1.86053466796875, -1.7337646484375, -1.60699462890625, -1.480224609375, -1.35345458984375, -1.2266845703125, -1.09991455078125, -0.97314453125, -0.84637451171875, -0.7196044921875, -0.59283447265625, -0.466064453125, -0.33929443359375, -0.2125244140625, -0.08575439453125, 0.041015625, 0.16778564453125, 0.2945556640625, 0.42132568359375, 0.548095703125, 0.67486572265625, 0.8016357421875, 0.92840576171875, 1.05517578125, 1.18194580078125, 1.3087158203125, 1.43548583984375, 1.562255859375, 1.68902587890625, 1.8157958984375, 1.94256591796875, 2.0693359375, 2.19610595703125, 2.3228759765625, 2.44964599609375, 2.576416015625, 2.70318603515625, 2.8299560546875, 2.95672607421875, 3.08349609375, 3.21026611328125, 3.3370361328125, 3.46380615234375, 3.590576171875, 3.71734619140625, 3.8441162109375, 3.97088623046875, 4.09765625]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 3.0, 6.0, 12.0, 7.0, 23.0, 30.0, 36.0, 46.0, 85.0, 131.0, 153.0, 221.0, 354.0, 569.0, 729.0, 1242.0, 2040.0, 3613.0, 7029.0, 14667.0, 32529.0, 70873.0, 140004.0, 218780.0, 231322.0, 162096.0, 85146.0, 39654.0, 18167.0, 8472.0, 4125.0, 2297.0, 1344.0, 905.0, 586.0, 404.0, 271.0, 193.0, 128.0, 94.0, 55.0, 37.0, 20.0, 23.0, 16.0, 9.0, 7.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.87109375, -4.714599609375, -4.55810546875, -4.401611328125, -4.2451171875, -4.088623046875, -3.93212890625, -3.775634765625, -3.619140625, -3.462646484375, -3.30615234375, -3.149658203125, -2.9931640625, -2.836669921875, -2.68017578125, -2.523681640625, -2.3671875, -2.210693359375, -2.05419921875, -1.897705078125, -1.7412109375, -1.584716796875, -1.42822265625, -1.271728515625, -1.115234375, -0.958740234375, -0.80224609375, -0.645751953125, -0.4892578125, -0.332763671875, -0.17626953125, -0.019775390625, 0.13671875, 0.293212890625, 0.44970703125, 0.606201171875, 0.7626953125, 0.919189453125, 1.07568359375, 1.232177734375, 1.388671875, 1.545166015625, 1.70166015625, 1.858154296875, 2.0146484375, 2.171142578125, 2.32763671875, 2.484130859375, 2.640625, 2.797119140625, 2.95361328125, 3.110107421875, 3.2666015625, 3.423095703125, 3.57958984375, 3.736083984375, 3.892578125, 4.049072265625, 4.20556640625, 4.362060546875, 4.5185546875, 4.675048828125, 4.83154296875, 4.988037109375, 5.14453125]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 1.0, 4.0, 3.0, 5.0, 5.0, 9.0, 15.0, 12.0, 23.0, 21.0, 43.0, 72.0, 59.0, 87.0, 76.0, 96.0, 78.0, 82.0, 75.0, 58.0, 46.0, 34.0, 33.0, 14.0, 10.0, 10.0, 9.0, 10.0, 5.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.00064849853515625, -0.0006302446126937866, -0.0006119906902313232, -0.0005937367677688599, -0.0005754828453063965, -0.0005572289228439331, -0.0005389750003814697, -0.0005207210779190063, -0.000502467155456543, -0.0004842132329940796, -0.0004659593105316162, -0.00044770538806915283, -0.00042945146560668945, -0.0004111975431442261, -0.0003929436206817627, -0.0003746896982192993, -0.00035643577575683594, -0.00033818185329437256, -0.0003199279308319092, -0.0003016740083694458, -0.0002834200859069824, -0.00026516616344451904, -0.00024691224098205566, -0.00022865831851959229, -0.0002104043960571289, -0.00019215047359466553, -0.00017389655113220215, -0.00015564262866973877, -0.0001373887062072754, -0.00011913478374481201, -0.00010088086128234863, -8.262693881988525e-05, -6.437301635742188e-05, -4.6119093894958496e-05, -2.7865171432495117e-05, -9.611248970031738e-06, 8.64267349243164e-06, 2.689659595489502e-05, 4.51505184173584e-05, 6.340444087982178e-05, 8.165836334228516e-05, 9.991228580474854e-05, 0.00011816620826721191, 0.0001364201307296753, 0.00015467405319213867, 0.00017292797565460205, 0.00019118189811706543, 0.0002094358205795288, 0.0002276897430419922, 0.00024594366550445557, 0.00026419758796691895, 0.0002824515104293823, 0.0003007054328918457, 0.0003189593553543091, 0.00033721327781677246, 0.00035546720027923584, 0.0003737211227416992, 0.0003919750452041626, 0.000410228967666626, 0.00042848289012908936, 0.00044673681259155273, 0.0004649907350540161, 0.0004832446575164795, 0.0005014985799789429, 0.0005197525024414062]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 5.0, 7.0, 15.0, 22.0, 26.0, 47.0, 57.0, 75.0, 128.0, 177.0, 260.0, 373.0, 538.0, 831.0, 1399.0, 2476.0, 4196.0, 7743.0, 15395.0, 30826.0, 61711.0, 112978.0, 175230.0, 208052.0, 178337.0, 116817.0, 63714.0, 32580.0, 15804.0, 7922.0, 4217.0, 2530.0, 1401.0, 876.0, 574.0, 388.0, 252.0, 177.0, 120.0, 84.0, 47.0, 38.0, 27.0, 23.0, 17.0, 14.0, 12.0, 8.0, 4.0, 4.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.30078125, -4.16436767578125, -4.0279541015625, -3.89154052734375, -3.755126953125, -3.61871337890625, -3.4822998046875, -3.34588623046875, -3.20947265625, -3.07305908203125, -2.9366455078125, -2.80023193359375, -2.663818359375, -2.52740478515625, -2.3909912109375, -2.25457763671875, -2.1181640625, -1.98175048828125, -1.8453369140625, -1.70892333984375, -1.572509765625, -1.43609619140625, -1.2996826171875, -1.16326904296875, -1.02685546875, -0.89044189453125, -0.7540283203125, -0.61761474609375, -0.481201171875, -0.34478759765625, -0.2083740234375, -0.07196044921875, 0.064453125, 0.20086669921875, 0.3372802734375, 0.47369384765625, 0.610107421875, 0.74652099609375, 0.8829345703125, 1.01934814453125, 1.15576171875, 1.29217529296875, 1.4285888671875, 1.56500244140625, 1.701416015625, 1.83782958984375, 1.9742431640625, 2.11065673828125, 2.2470703125, 2.38348388671875, 2.5198974609375, 2.65631103515625, 2.792724609375, 2.92913818359375, 3.0655517578125, 3.20196533203125, 3.33837890625, 3.47479248046875, 3.6112060546875, 3.74761962890625, 3.884033203125, 4.02044677734375, 4.1568603515625, 4.29327392578125, 4.4296875]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 6.0, 8.0, 5.0, 20.0, 16.0, 32.0, 36.0, 42.0, 58.0, 56.0, 64.0, 66.0, 70.0, 78.0, 67.0, 66.0, 63.0, 62.0, 42.0, 36.0, 24.0, 27.0, 14.0, 11.0, 6.0, 9.0, 5.0, 6.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0498046875, -1.008087158203125, -0.96636962890625, -0.924652099609375, -0.8829345703125, -0.841217041015625, -0.79949951171875, -0.757781982421875, -0.716064453125, -0.674346923828125, -0.63262939453125, -0.590911865234375, -0.5491943359375, -0.507476806640625, -0.46575927734375, -0.424041748046875, -0.38232421875, -0.340606689453125, -0.29888916015625, -0.257171630859375, -0.2154541015625, -0.173736572265625, -0.13201904296875, -0.090301513671875, -0.048583984375, -0.006866455078125, 0.03485107421875, 0.076568603515625, 0.1182861328125, 0.160003662109375, 0.20172119140625, 0.243438720703125, 0.28515625, 0.326873779296875, 0.36859130859375, 0.410308837890625, 0.4520263671875, 0.493743896484375, 0.53546142578125, 0.577178955078125, 0.618896484375, 0.660614013671875, 0.70233154296875, 0.744049072265625, 0.7857666015625, 0.827484130859375, 0.86920166015625, 0.910919189453125, 0.95263671875, 0.994354248046875, 1.03607177734375, 1.077789306640625, 1.1195068359375, 1.161224365234375, 1.20294189453125, 1.244659423828125, 1.286376953125, 1.328094482421875, 1.36981201171875, 1.411529541015625, 1.4532470703125, 1.494964599609375, 1.53668212890625, 1.578399658203125, 1.6201171875]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 8.0, 4.0, 8.0, 14.0, 9.0, 6.0, 9.0, 21.0, 26.0, 24.0, 27.0, 39.0, 36.0, 46.0, 47.0, 38.0, 58.0, 51.0, 52.0, 61.0, 52.0, 44.0, 54.0, 46.0, 46.0, 16.0, 29.0, 28.0, 19.0, 15.0, 9.0, 11.0, 18.0, 10.0, 6.0, 3.0, 6.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.436745643615723, -9.117323875427246, -8.797903060913086, -8.47848129272461, -8.159059524536133, -7.839638710021973, -7.520216941833496, -7.200795650482178, -6.881374359130859, -6.561953067779541, -6.242531776428223, -5.923110008239746, -5.603688716888428, -5.284267425537109, -4.964845657348633, -4.6454243659973145, -4.326003074645996, -4.006581783294678, -3.6871602535247803, -3.367738723754883, -3.0483174324035645, -2.728896141052246, -2.4094746112823486, -2.090053081512451, -1.7706317901611328, -1.451210379600525, -1.131788969039917, -0.8123675584793091, -0.49294614791870117, -0.17352473735809326, 0.14589667320251465, 0.4653182029724121, 0.7847385406494141, 1.104159951210022, 1.4235813617706299, 1.7430027723312378, 2.0624241828918457, 2.381845474243164, 2.7012670040130615, 3.020688533782959, 3.3401098251342773, 3.6595311164855957, 3.978952646255493, 4.298374176025391, 4.617795467376709, 4.937216758728027, 5.256638526916504, 5.576059818267822, 5.895481109619141, 6.214902400970459, 6.534323692321777, 6.853745460510254, 7.173166751861572, 7.492588043212891, 7.812009811401367, 8.131431579589844, 8.450852394104004, 8.77027416229248, 9.08969497680664, 9.409116744995117, 9.728538513183594, 10.047959327697754, 10.36738109588623, 10.68680191040039, 11.006223678588867]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 6.0, 5.0, 2.0, 6.0, 9.0, 11.0, 13.0, 16.0, 12.0, 25.0, 21.0, 29.0, 28.0, 41.0, 31.0, 31.0, 45.0, 45.0, 46.0, 39.0, 58.0, 44.0, 44.0, 43.0, 37.0, 37.0, 39.0, 38.0, 22.0, 23.0, 29.0, 21.0, 24.0, 14.0, 15.0, 10.0, 13.0, 8.0, 6.0, 10.0, 4.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.0410990715026855, -6.825225353240967, -6.609351634979248, -6.393477916717529, -6.177604675292969, -5.96173095703125, -5.745857238769531, -5.5299835205078125, -5.314109802246094, -5.098236083984375, -4.882362365722656, -4.6664886474609375, -4.450614929199219, -4.2347412109375, -4.0188679695129395, -3.8029942512512207, -3.587120532989502, -3.371246814727783, -3.1553730964660645, -2.939499616622925, -2.723625898361206, -2.5077521800994873, -2.2918787002563477, -2.076004981994629, -1.8601312637329102, -1.6442575454711914, -1.4283839464187622, -1.212510347366333, -0.9966366291046143, -0.7807629108428955, -0.5648893117904663, -0.3490157127380371, -0.13314151763916016, 0.08273214101791382, 0.2986057996749878, 0.5144794583320618, 0.7303531169891357, 0.9462268352508545, 1.1621004343032837, 1.377974033355713, 1.5938477516174316, 1.8097214698791504, 2.025595188140869, 2.241468667984009, 2.4573423862457275, 2.6732161045074463, 2.889089584350586, 3.1049633026123047, 3.3208370208740234, 3.536710739135742, 3.752584457397461, 3.9684579372406006, 4.184331893920898, 4.400205612182617, 4.616078853607178, 4.8319525718688965, 5.047826290130615, 5.263700008392334, 5.479573726654053, 5.6954474449157715, 5.911320686340332, 6.127194404602051, 6.3430681228637695, 6.558941841125488, 6.774815559387207]}, "gradients/decoder.bert.encoder.layer.11.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 3.0, 4.0, 5.0, 8.0, 11.0, 13.0, 18.0, 22.0, 26.0, 56.0, 69.0, 81.0, 148.0, 171.0, 287.0, 477.0, 683.0, 1079.0, 1834.0, 2926.0, 5066.0, 8923.0, 16487.0, 30499.0, 59987.0, 118933.0, 238500.0, 465918.0, 802926.0, 959200.0, 702516.0, 381856.0, 192645.0, 95919.0, 49304.0, 25651.0, 13567.0, 7686.0, 4277.0, 2471.0, 1479.0, 929.0, 568.0, 330.0, 254.0, 186.0, 105.0, 69.0, 46.0, 31.0, 19.0, 8.0, 6.0, 4.0, 5.0, 3.0, 2.0, 1.0], "bins": [-11.1328125, -10.81787109375, -10.5029296875, -10.18798828125, -9.873046875, -9.55810546875, -9.2431640625, -8.92822265625, -8.61328125, -8.29833984375, -7.9833984375, -7.66845703125, -7.353515625, -7.03857421875, -6.7236328125, -6.40869140625, -6.09375, -5.77880859375, -5.4638671875, -5.14892578125, -4.833984375, -4.51904296875, -4.2041015625, -3.88916015625, -3.57421875, -3.25927734375, -2.9443359375, -2.62939453125, -2.314453125, -1.99951171875, -1.6845703125, -1.36962890625, -1.0546875, -0.73974609375, -0.4248046875, -0.10986328125, 0.205078125, 0.52001953125, 0.8349609375, 1.14990234375, 1.46484375, 1.77978515625, 2.0947265625, 2.40966796875, 2.724609375, 3.03955078125, 3.3544921875, 3.66943359375, 3.984375, 4.29931640625, 4.6142578125, 4.92919921875, 5.244140625, 5.55908203125, 5.8740234375, 6.18896484375, 6.50390625, 6.81884765625, 7.1337890625, 7.44873046875, 7.763671875, 8.07861328125, 8.3935546875, 8.70849609375, 9.0234375]}, "gradients/decoder.bert.encoder.layer.11.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 6.0, 6.0, 7.0, 11.0, 14.0, 12.0, 20.0, 19.0, 23.0, 29.0, 31.0, 19.0, 32.0, 37.0, 35.0, 56.0, 48.0, 38.0, 53.0, 39.0, 45.0, 56.0, 50.0, 49.0, 41.0, 28.0, 26.0, 28.0, 19.0, 15.0, 25.0, 15.0, 24.0, 12.0, 7.0, 3.0, 9.0, 1.0, 8.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.46875, -5.302978515625, -5.13720703125, -4.971435546875, -4.8056640625, -4.639892578125, -4.47412109375, -4.308349609375, -4.142578125, -3.976806640625, -3.81103515625, -3.645263671875, -3.4794921875, -3.313720703125, -3.14794921875, -2.982177734375, -2.81640625, -2.650634765625, -2.48486328125, -2.319091796875, -2.1533203125, -1.987548828125, -1.82177734375, -1.656005859375, -1.490234375, -1.324462890625, -1.15869140625, -0.992919921875, -0.8271484375, -0.661376953125, -0.49560546875, -0.329833984375, -0.1640625, 0.001708984375, 0.16748046875, 0.333251953125, 0.4990234375, 0.664794921875, 0.83056640625, 0.996337890625, 1.162109375, 1.327880859375, 1.49365234375, 1.659423828125, 1.8251953125, 1.990966796875, 2.15673828125, 2.322509765625, 2.48828125, 2.654052734375, 2.81982421875, 2.985595703125, 3.1513671875, 3.317138671875, 3.48291015625, 3.648681640625, 3.814453125, 3.980224609375, 4.14599609375, 4.311767578125, 4.4775390625, 4.643310546875, 4.80908203125, 4.974853515625, 5.140625]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 4.0, 7.0, 13.0, 7.0, 13.0, 30.0, 43.0, 47.0, 104.0, 161.0, 240.0, 344.0, 596.0, 1018.0, 1823.0, 3079.0, 5688.0, 11113.0, 22175.0, 46412.0, 97765.0, 208197.0, 426807.0, 768023.0, 984909.0, 774820.0, 433811.0, 212800.0, 99308.0, 46984.0, 22776.0, 11503.0, 5951.0, 3261.0, 1748.0, 1010.0, 622.0, 371.0, 246.0, 146.0, 119.0, 60.0, 44.0, 32.0, 18.0, 8.0, 11.0, 11.0, 3.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0], "bins": [-12.1171875, -11.755615234375, -11.39404296875, -11.032470703125, -10.6708984375, -10.309326171875, -9.94775390625, -9.586181640625, -9.224609375, -8.863037109375, -8.50146484375, -8.139892578125, -7.7783203125, -7.416748046875, -7.05517578125, -6.693603515625, -6.33203125, -5.970458984375, -5.60888671875, -5.247314453125, -4.8857421875, -4.524169921875, -4.16259765625, -3.801025390625, -3.439453125, -3.077880859375, -2.71630859375, -2.354736328125, -1.9931640625, -1.631591796875, -1.27001953125, -0.908447265625, -0.546875, -0.185302734375, 0.17626953125, 0.537841796875, 0.8994140625, 1.260986328125, 1.62255859375, 1.984130859375, 2.345703125, 2.707275390625, 3.06884765625, 3.430419921875, 3.7919921875, 4.153564453125, 4.51513671875, 4.876708984375, 5.23828125, 5.599853515625, 5.96142578125, 6.322998046875, 6.6845703125, 7.046142578125, 7.40771484375, 7.769287109375, 8.130859375, 8.492431640625, 8.85400390625, 9.215576171875, 9.5771484375, 9.938720703125, 10.30029296875, 10.661865234375, 11.0234375]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 4.0, 2.0, 5.0, 8.0, 10.0, 16.0, 11.0, 22.0, 36.0, 36.0, 52.0, 76.0, 97.0, 126.0, 133.0, 155.0, 168.0, 228.0, 231.0, 260.0, 277.0, 273.0, 300.0, 265.0, 225.0, 174.0, 189.0, 142.0, 115.0, 114.0, 70.0, 66.0, 40.0, 44.0, 30.0, 14.0, 12.0, 19.0, 15.0, 10.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.505859375, -3.406280517578125, -3.30670166015625, -3.207122802734375, -3.1075439453125, -3.007965087890625, -2.90838623046875, -2.808807373046875, -2.709228515625, -2.609649658203125, -2.51007080078125, -2.410491943359375, -2.3109130859375, -2.211334228515625, -2.11175537109375, -2.012176513671875, -1.91259765625, -1.813018798828125, -1.71343994140625, -1.613861083984375, -1.5142822265625, -1.414703369140625, -1.31512451171875, -1.215545654296875, -1.115966796875, -1.016387939453125, -0.91680908203125, -0.817230224609375, -0.7176513671875, -0.618072509765625, -0.51849365234375, -0.418914794921875, -0.3193359375, -0.219757080078125, -0.12017822265625, -0.020599365234375, 0.0789794921875, 0.178558349609375, 0.27813720703125, 0.377716064453125, 0.477294921875, 0.576873779296875, 0.67645263671875, 0.776031494140625, 0.8756103515625, 0.975189208984375, 1.07476806640625, 1.174346923828125, 1.27392578125, 1.373504638671875, 1.47308349609375, 1.572662353515625, 1.6722412109375, 1.771820068359375, 1.87139892578125, 1.970977783203125, 2.070556640625, 2.170135498046875, 2.26971435546875, 2.369293212890625, 2.4688720703125, 2.568450927734375, 2.66802978515625, 2.767608642578125, 2.8671875]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 4.0, 3.0, 5.0, 9.0, 12.0, 21.0, 21.0, 23.0, 29.0, 31.0, 40.0, 39.0, 49.0, 40.0, 59.0, 65.0, 56.0, 55.0, 52.0, 49.0, 45.0, 47.0, 43.0, 37.0, 35.0, 20.0, 24.0, 15.0, 13.0, 9.0, 9.0, 19.0, 3.0, 6.0, 6.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.409107208251953, -9.07264232635498, -8.736177444458008, -8.399711608886719, -8.063246726989746, -7.726781845092773, -7.390316963195801, -7.05385160446167, -6.717386245727539, -6.380921363830566, -6.0444560050964355, -5.707991123199463, -5.371525764465332, -5.035060882568359, -4.698596000671387, -4.362130641937256, -4.025665760040283, -3.6892006397247314, -3.3527355194091797, -3.016270637512207, -2.679805278778076, -2.3433403968811035, -2.0068752765655518, -1.67041015625, -1.3339450359344482, -0.9974799156188965, -0.6610148549079895, -0.3245497941970825, 0.011915326118469238, 0.348380446434021, 0.6848454475402832, 1.021310567855835, 1.3577756881713867, 1.6942408084869385, 2.0307059288024902, 2.367170810699463, 2.7036361694335938, 3.0401010513305664, 3.376566171646118, 3.71303129196167, 4.049496650695801, 4.385961532592773, 4.722426891326904, 5.058891773223877, 5.395357131958008, 5.7318220138549805, 6.068286895751953, 6.404752254486084, 6.741217136383057, 7.077682018280029, 7.41414737701416, 7.750612258911133, 8.087077140808105, 8.423542976379395, 8.760007858276367, 9.09647274017334, 9.432937622070312, 9.769402503967285, 10.105867385864258, 10.442333221435547, 10.77879810333252, 11.115262985229492, 11.451727867126465, 11.788192749023438, 12.124658584594727]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 7.0, 3.0, 10.0, 8.0, 3.0, 4.0, 17.0, 11.0, 12.0, 15.0, 14.0, 31.0, 23.0, 25.0, 30.0, 38.0, 31.0, 41.0, 50.0, 50.0, 44.0, 38.0, 46.0, 39.0, 39.0, 43.0, 40.0, 32.0, 46.0, 38.0, 25.0, 20.0, 18.0, 16.0, 20.0, 16.0, 12.0, 14.0, 13.0, 8.0, 7.0, 4.0, 2.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-6.220620632171631, -6.032851219177246, -5.845081329345703, -5.657311916351318, -5.469542503356934, -5.281772613525391, -5.094003200531006, -4.906233787536621, -4.718463897705078, -4.530694484710693, -4.34292459487915, -4.155155181884766, -3.967385768890381, -3.779616117477417, -3.591846466064453, -3.4040770530700684, -3.2163076400756836, -3.0285379886627197, -2.840768575668335, -2.652998924255371, -2.4652295112609863, -2.2774598598480225, -2.0896902084350586, -1.9019206762313843, -1.71415114402771, -1.5263816118240356, -1.3386120796203613, -1.1508424282073975, -0.9630728960037231, -0.7753033638000488, -0.587533712387085, -0.39976418018341064, -0.21199464797973633, -0.024225085973739624, 0.16354447603225708, 0.35131406784057617, 0.5390836000442505, 0.7268531322479248, 0.9146227836608887, 1.102392315864563, 1.2901618480682373, 1.4779313802719116, 1.665700912475586, 1.8534705638885498, 2.0412402153015137, 2.2290096282958984, 2.4167792797088623, 2.604548931121826, 2.792318344116211, 2.980087995529175, 3.1678574085235596, 3.3556270599365234, 3.543396472930908, 3.731166124343872, 3.918935775756836, 4.106705188751221, 4.2944746017456055, 4.48224401473999, 4.670013904571533, 4.857783317565918, 5.045552730560303, 5.2333221435546875, 5.4210920333862305, 5.608861446380615, 5.796631336212158]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 4.0, 5.0, 8.0, 9.0, 13.0, 19.0, 24.0, 42.0, 72.0, 98.0, 149.0, 238.0, 345.0, 554.0, 838.0, 1316.0, 2138.0, 3398.0, 5113.0, 8335.0, 13137.0, 20051.0, 30887.0, 46337.0, 66731.0, 91252.0, 114666.0, 130123.0, 127782.0, 110807.0, 86775.0, 62808.0, 43430.0, 28919.0, 18798.0, 12133.0, 7692.0, 4947.0, 3073.0, 2012.0, 1195.0, 899.0, 484.0, 330.0, 202.0, 129.0, 87.0, 60.0, 44.0, 26.0, 10.0, 8.0, 8.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0], "bins": [-2.64453125, -2.561676025390625, -2.47882080078125, -2.395965576171875, -2.3131103515625, -2.230255126953125, -2.14739990234375, -2.064544677734375, -1.981689453125, -1.898834228515625, -1.81597900390625, -1.733123779296875, -1.6502685546875, -1.567413330078125, -1.48455810546875, -1.401702880859375, -1.31884765625, -1.235992431640625, -1.15313720703125, -1.070281982421875, -0.9874267578125, -0.904571533203125, -0.82171630859375, -0.738861083984375, -0.656005859375, -0.573150634765625, -0.49029541015625, -0.407440185546875, -0.3245849609375, -0.241729736328125, -0.15887451171875, -0.076019287109375, 0.0068359375, 0.089691162109375, 0.17254638671875, 0.255401611328125, 0.3382568359375, 0.421112060546875, 0.50396728515625, 0.586822509765625, 0.669677734375, 0.752532958984375, 0.83538818359375, 0.918243408203125, 1.0010986328125, 1.083953857421875, 1.16680908203125, 1.249664306640625, 1.33251953125, 1.415374755859375, 1.49822998046875, 1.581085205078125, 1.6639404296875, 1.746795654296875, 1.82965087890625, 1.912506103515625, 1.995361328125, 2.078216552734375, 2.16107177734375, 2.243927001953125, 2.3267822265625, 2.409637451171875, 2.49249267578125, 2.575347900390625, 2.658203125]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 2.0, 3.0, 7.0, 1.0, 7.0, 3.0, 10.0, 13.0, 11.0, 15.0, 11.0, 14.0, 20.0, 25.0, 34.0, 30.0, 27.0, 33.0, 31.0, 38.0, 36.0, 41.0, 46.0, 43.0, 38.0, 46.0, 37.0, 45.0, 32.0, 42.0, 28.0, 34.0, 24.0, 22.0, 36.0, 18.0, 20.0, 13.0, 10.0, 14.0, 13.0, 9.0, 8.0, 3.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.35546875, -6.1517333984375, -5.947998046875, -5.7442626953125, -5.54052734375, -5.3367919921875, -5.133056640625, -4.9293212890625, -4.7255859375, -4.5218505859375, -4.318115234375, -4.1143798828125, -3.91064453125, -3.7069091796875, -3.503173828125, -3.2994384765625, -3.095703125, -2.8919677734375, -2.688232421875, -2.4844970703125, -2.28076171875, -2.0770263671875, -1.873291015625, -1.6695556640625, -1.4658203125, -1.2620849609375, -1.058349609375, -0.8546142578125, -0.65087890625, -0.4471435546875, -0.243408203125, -0.0396728515625, 0.1640625, 0.3677978515625, 0.571533203125, 0.7752685546875, 0.97900390625, 1.1827392578125, 1.386474609375, 1.5902099609375, 1.7939453125, 1.9976806640625, 2.201416015625, 2.4051513671875, 2.60888671875, 2.8126220703125, 3.016357421875, 3.2200927734375, 3.423828125, 3.6275634765625, 3.831298828125, 4.0350341796875, 4.23876953125, 4.4425048828125, 4.646240234375, 4.8499755859375, 5.0537109375, 5.2574462890625, 5.461181640625, 5.6649169921875, 5.86865234375, 6.0723876953125, 6.276123046875, 6.4798583984375, 6.68359375]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 6.0, 8.0, 15.0, 16.0, 24.0, 31.0, 47.0, 75.0, 123.0, 213.0, 371.0, 620.0, 1026.0, 1617.0, 2968.0, 5409.0, 9626.0, 17606.0, 32989.0, 62038.0, 113318.0, 185624.0, 223820.0, 171164.0, 100684.0, 54503.0, 29462.0, 15457.0, 8611.0, 4690.0, 2635.0, 1524.0, 911.0, 523.0, 298.0, 173.0, 105.0, 75.0, 55.0, 36.0, 23.0, 13.0, 9.0, 8.0, 3.0, 1.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.40234375, -5.24530029296875, -5.0882568359375, -4.93121337890625, -4.774169921875, -4.61712646484375, -4.4600830078125, -4.30303955078125, -4.14599609375, -3.98895263671875, -3.8319091796875, -3.67486572265625, -3.517822265625, -3.36077880859375, -3.2037353515625, -3.04669189453125, -2.8896484375, -2.73260498046875, -2.5755615234375, -2.41851806640625, -2.261474609375, -2.10443115234375, -1.9473876953125, -1.79034423828125, -1.63330078125, -1.47625732421875, -1.3192138671875, -1.16217041015625, -1.005126953125, -0.84808349609375, -0.6910400390625, -0.53399658203125, -0.376953125, -0.21990966796875, -0.0628662109375, 0.09417724609375, 0.251220703125, 0.40826416015625, 0.5653076171875, 0.72235107421875, 0.87939453125, 1.03643798828125, 1.1934814453125, 1.35052490234375, 1.507568359375, 1.66461181640625, 1.8216552734375, 1.97869873046875, 2.1357421875, 2.29278564453125, 2.4498291015625, 2.60687255859375, 2.763916015625, 2.92095947265625, 3.0780029296875, 3.23504638671875, 3.39208984375, 3.54913330078125, 3.7061767578125, 3.86322021484375, 4.020263671875, 4.17730712890625, 4.3343505859375, 4.49139404296875, 4.6484375]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 1.0, 11.0, 8.0, 7.0, 8.0, 8.0, 14.0, 13.0, 23.0, 23.0, 23.0, 35.0, 19.0, 33.0, 36.0, 31.0, 44.0, 49.0, 48.0, 45.0, 55.0, 53.0, 47.0, 54.0, 41.0, 37.0, 38.0, 34.0, 25.0, 23.0, 23.0, 19.0, 17.0, 16.0, 9.0, 10.0, 9.0, 3.0, 3.0, 8.0, 3.0, 3.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.828125, -4.68878173828125, -4.5494384765625, -4.41009521484375, -4.270751953125, -4.13140869140625, -3.9920654296875, -3.85272216796875, -3.71337890625, -3.57403564453125, -3.4346923828125, -3.29534912109375, -3.156005859375, -3.01666259765625, -2.8773193359375, -2.73797607421875, -2.5986328125, -2.45928955078125, -2.3199462890625, -2.18060302734375, -2.041259765625, -1.90191650390625, -1.7625732421875, -1.62322998046875, -1.48388671875, -1.34454345703125, -1.2052001953125, -1.06585693359375, -0.926513671875, -0.78717041015625, -0.6478271484375, -0.50848388671875, -0.369140625, -0.22979736328125, -0.0904541015625, 0.04888916015625, 0.188232421875, 0.32757568359375, 0.4669189453125, 0.60626220703125, 0.74560546875, 0.88494873046875, 1.0242919921875, 1.16363525390625, 1.302978515625, 1.44232177734375, 1.5816650390625, 1.72100830078125, 1.8603515625, 1.99969482421875, 2.1390380859375, 2.27838134765625, 2.417724609375, 2.55706787109375, 2.6964111328125, 2.83575439453125, 2.97509765625, 3.11444091796875, 3.2537841796875, 3.39312744140625, 3.532470703125, 3.67181396484375, 3.8111572265625, 3.95050048828125, 4.08984375]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.weight": {"_type": "histogram", "values": [5.0, 1.0, 5.0, 5.0, 8.0, 7.0, 14.0, 22.0, 33.0, 46.0, 64.0, 74.0, 150.0, 206.0, 303.0, 477.0, 702.0, 1161.0, 1820.0, 2999.0, 5015.0, 8478.0, 14666.0, 25752.0, 45747.0, 80872.0, 136567.0, 198150.0, 197710.0, 137923.0, 81478.0, 45953.0, 25967.0, 14775.0, 8523.0, 5007.0, 2955.0, 1780.0, 1095.0, 687.0, 466.0, 276.0, 196.0, 126.0, 88.0, 80.0, 46.0, 27.0, 18.0, 15.0, 8.0, 8.0, 7.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.7158203125, -1.6545562744140625, -1.593292236328125, -1.5320281982421875, -1.47076416015625, -1.4095001220703125, -1.348236083984375, -1.2869720458984375, -1.2257080078125, -1.1644439697265625, -1.103179931640625, -1.0419158935546875, -0.98065185546875, -0.9193878173828125, -0.858123779296875, -0.7968597412109375, -0.735595703125, -0.6743316650390625, -0.613067626953125, -0.5518035888671875, -0.49053955078125, -0.4292755126953125, -0.368011474609375, -0.3067474365234375, -0.2454833984375, -0.1842193603515625, -0.122955322265625, -0.0616912841796875, -0.00042724609375, 0.0608367919921875, 0.122100830078125, 0.1833648681640625, 0.24462890625, 0.3058929443359375, 0.367156982421875, 0.4284210205078125, 0.48968505859375, 0.5509490966796875, 0.612213134765625, 0.6734771728515625, 0.7347412109375, 0.7960052490234375, 0.857269287109375, 0.9185333251953125, 0.97979736328125, 1.0410614013671875, 1.102325439453125, 1.1635894775390625, 1.224853515625, 1.2861175537109375, 1.347381591796875, 1.4086456298828125, 1.46990966796875, 1.5311737060546875, 1.592437744140625, 1.6537017822265625, 1.7149658203125, 1.7762298583984375, 1.837493896484375, 1.8987579345703125, 1.96002197265625, 2.0212860107421875, 2.082550048828125, 2.1438140869140625, 2.205078125]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 6.0, 7.0, 4.0, 6.0, 13.0, 8.0, 14.0, 12.0, 19.0, 21.0, 31.0, 41.0, 35.0, 49.0, 46.0, 46.0, 56.0, 50.0, 56.0, 58.0, 43.0, 68.0, 44.0, 53.0, 37.0, 35.0, 22.0, 21.0, 16.0, 14.0, 13.0, 15.0, 10.0, 4.0, 9.0, 4.0, 2.0, 2.0, 4.0, 3.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-8.279085159301758e-05, -8.005835115909576e-05, -7.732585072517395e-05, -7.459335029125214e-05, -7.186084985733032e-05, -6.912834942340851e-05, -6.63958489894867e-05, -6.366334855556488e-05, -6.0930848121643066e-05, -5.819834768772125e-05, -5.546584725379944e-05, -5.2733346819877625e-05, -5.000084638595581e-05, -4.7268345952033997e-05, -4.453584551811218e-05, -4.180334508419037e-05, -3.9070844650268555e-05, -3.633834421634674e-05, -3.360584378242493e-05, -3.087334334850311e-05, -2.81408429145813e-05, -2.5408342480659485e-05, -2.267584204673767e-05, -1.9943341612815857e-05, -1.7210841178894043e-05, -1.4478340744972229e-05, -1.1745840311050415e-05, -9.013339877128601e-06, -6.280839443206787e-06, -3.548339009284973e-06, -8.158385753631592e-07, 1.9166618585586548e-06, 4.649162292480469e-06, 7.381662726402283e-06, 1.0114163160324097e-05, 1.284666359424591e-05, 1.5579164028167725e-05, 1.831166446208954e-05, 2.1044164896011353e-05, 2.3776665329933167e-05, 2.650916576385498e-05, 2.9241666197776794e-05, 3.197416663169861e-05, 3.470666706562042e-05, 3.7439167499542236e-05, 4.017166793346405e-05, 4.2904168367385864e-05, 4.563666880130768e-05, 4.836916923522949e-05, 5.1101669669151306e-05, 5.383417010307312e-05, 5.6566670536994934e-05, 5.929917097091675e-05, 6.203167140483856e-05, 6.476417183876038e-05, 6.749667227268219e-05, 7.0229172706604e-05, 7.296167314052582e-05, 7.569417357444763e-05, 7.842667400836945e-05, 8.115917444229126e-05, 8.389167487621307e-05, 8.662417531013489e-05, 8.93566757440567e-05, 9.208917617797852e-05]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.weight": {"_type": "histogram", "values": [4.0, 4.0, 1.0, 5.0, 5.0, 10.0, 14.0, 21.0, 31.0, 45.0, 49.0, 93.0, 125.0, 208.0, 305.0, 449.0, 698.0, 1117.0, 1773.0, 2795.0, 4578.0, 7646.0, 12153.0, 19389.0, 31172.0, 47170.0, 70305.0, 98198.0, 123818.0, 139512.0, 133533.0, 111280.0, 83073.0, 56898.0, 37738.0, 24158.0, 15096.0, 9359.0, 5791.0, 3676.0, 2299.0, 1452.0, 900.0, 571.0, 361.0, 225.0, 156.0, 107.0, 58.0, 43.0, 42.0, 13.0, 20.0, 10.0, 6.0, 4.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.3193359375, -1.27496337890625, -1.2305908203125, -1.18621826171875, -1.141845703125, -1.09747314453125, -1.0531005859375, -1.00872802734375, -0.96435546875, -0.91998291015625, -0.8756103515625, -0.83123779296875, -0.786865234375, -0.74249267578125, -0.6981201171875, -0.65374755859375, -0.609375, -0.56500244140625, -0.5206298828125, -0.47625732421875, -0.431884765625, -0.38751220703125, -0.3431396484375, -0.29876708984375, -0.25439453125, -0.21002197265625, -0.1656494140625, -0.12127685546875, -0.076904296875, -0.03253173828125, 0.0118408203125, 0.05621337890625, 0.1005859375, 0.14495849609375, 0.1893310546875, 0.23370361328125, 0.278076171875, 0.32244873046875, 0.3668212890625, 0.41119384765625, 0.45556640625, 0.49993896484375, 0.5443115234375, 0.58868408203125, 0.633056640625, 0.67742919921875, 0.7218017578125, 0.76617431640625, 0.810546875, 0.85491943359375, 0.8992919921875, 0.94366455078125, 0.988037109375, 1.03240966796875, 1.0767822265625, 1.12115478515625, 1.16552734375, 1.20989990234375, 1.2542724609375, 1.29864501953125, 1.343017578125, 1.38739013671875, 1.4317626953125, 1.47613525390625, 1.5205078125]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 6.0, 8.0, 8.0, 11.0, 13.0, 18.0, 24.0, 22.0, 22.0, 20.0, 25.0, 38.0, 43.0, 48.0, 54.0, 49.0, 53.0, 67.0, 63.0, 61.0, 56.0, 46.0, 47.0, 40.0, 27.0, 22.0, 27.0, 19.0, 14.0, 6.0, 11.0, 3.0, 4.0, 5.0, 10.0, 5.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.53564453125, -0.5194625854492188, -0.5032806396484375, -0.48709869384765625, -0.470916748046875, -0.45473480224609375, -0.4385528564453125, -0.42237091064453125, -0.40618896484375, -0.39000701904296875, -0.3738250732421875, -0.35764312744140625, -0.341461181640625, -0.32527923583984375, -0.3090972900390625, -0.29291534423828125, -0.2767333984375, -0.26055145263671875, -0.2443695068359375, -0.22818756103515625, -0.212005615234375, -0.19582366943359375, -0.1796417236328125, -0.16345977783203125, -0.14727783203125, -0.13109588623046875, -0.1149139404296875, -0.09873199462890625, -0.082550048828125, -0.06636810302734375, -0.0501861572265625, -0.03400421142578125, -0.017822265625, -0.00164031982421875, 0.0145416259765625, 0.03072357177734375, 0.046905517578125, 0.06308746337890625, 0.0792694091796875, 0.09545135498046875, 0.11163330078125, 0.12781524658203125, 0.1439971923828125, 0.16017913818359375, 0.176361083984375, 0.19254302978515625, 0.2087249755859375, 0.22490692138671875, 0.2410888671875, 0.25727081298828125, 0.2734527587890625, 0.28963470458984375, 0.305816650390625, 0.32199859619140625, 0.3381805419921875, 0.35436248779296875, 0.37054443359375, 0.38672637939453125, 0.4029083251953125, 0.41909027099609375, 0.435272216796875, 0.45145416259765625, 0.4676361083984375, 0.48381805419921875, 0.5]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 4.0, 9.0, 3.0, 11.0, 14.0, 17.0, 27.0, 25.0, 23.0, 38.0, 35.0, 41.0, 54.0, 47.0, 49.0, 67.0, 60.0, 52.0, 47.0, 49.0, 47.0, 50.0, 35.0, 35.0, 35.0, 18.0, 20.0, 16.0, 15.0, 9.0, 14.0, 9.0, 9.0, 7.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.170534133911133, -8.839683532714844, -8.508831977844238, -8.17798137664795, -7.847130298614502, -7.516279220581055, -7.185428142547607, -6.85457706451416, -6.523726463317871, -6.192875385284424, -5.862024307250977, -5.5311737060546875, -5.20032262802124, -4.869471549987793, -4.538620471954346, -4.207769393920898, -3.876918315887451, -3.546067237854004, -3.2152163982391357, -2.8843653202056885, -2.5535144805908203, -2.222663402557373, -1.8918123245239258, -1.5609614849090576, -1.2301104068756104, -0.8992594480514526, -0.5684084296226501, -0.23755741119384766, 0.09329354763031006, 0.4241445064544678, 0.754995584487915, 1.0858464241027832, 1.4166975021362305, 1.7475484609603882, 2.078399419784546, 2.409250497817993, 2.7401013374328613, 3.0709524154663086, 3.401803493499756, 3.732654333114624, 4.063505172729492, 4.3943562507629395, 4.725207328796387, 5.056057929992676, 5.386909008026123, 5.71776008605957, 6.048611164093018, 6.379462242126465, 6.710313320159912, 7.041164398193359, 7.372015476226807, 7.702866554260254, 8.033717155456543, 8.364568710327148, 8.695419311523438, 9.026269912719727, 9.357121467590332, 9.687972068786621, 10.018823623657227, 10.349674224853516, 10.680525779724121, 11.01137638092041, 11.342227935791016, 11.673078536987305, 12.003929138183594]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 4.0, 8.0, 8.0, 4.0, 10.0, 16.0, 9.0, 11.0, 19.0, 19.0, 21.0, 26.0, 29.0, 33.0, 32.0, 35.0, 49.0, 53.0, 40.0, 46.0, 34.0, 46.0, 41.0, 40.0, 47.0, 29.0, 46.0, 42.0, 33.0, 21.0, 16.0, 19.0, 20.0, 15.0, 18.0, 13.0, 15.0, 9.0, 6.0, 7.0, 5.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-6.102931499481201, -5.916293621063232, -5.729656219482422, -5.543018341064453, -5.356380462646484, -5.169742584228516, -4.983105182647705, -4.796467304229736, -4.609829902648926, -4.423192024230957, -4.2365546226501465, -4.049916744232178, -3.863278865814209, -3.6766412258148193, -3.4900035858154297, -3.303365707397461, -3.116727828979492, -2.9300901889801025, -2.743452310562134, -2.556814670562744, -2.3701767921447754, -2.1835391521453857, -1.996901512145996, -1.810263752937317, -1.6236259937286377, -1.4369882345199585, -1.2503504753112793, -1.0637128353118896, -0.8770750761032104, -0.6904373168945312, -0.5037996768951416, -0.3171619176864624, -0.130523681640625, 0.05611404776573181, 0.24275177717208862, 0.42938947677612305, 0.6160272359848022, 0.8026649951934814, 0.9893026351928711, 1.1759403944015503, 1.3625781536102295, 1.5492159128189087, 1.735853672027588, 1.9224913120269775, 2.109128952026367, 2.295766830444336, 2.4824044704437256, 2.6690421104431152, 2.855679988861084, 3.0423176288604736, 3.2289555072784424, 3.415593147277832, 3.602231025695801, 3.7888686656951904, 3.97550630569458, 4.162144184112549, 4.348781585693359, 4.535419464111328, 4.722056865692139, 4.908694744110107, 5.095332622528076, 5.281970024108887, 5.4686079025268555, 5.655245780944824, 5.841883659362793]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 6.0, 3.0, 5.0, 9.0, 15.0, 21.0, 20.0, 41.0, 60.0, 93.0, 119.0, 176.0, 260.0, 389.0, 655.0, 957.0, 1403.0, 2189.0, 3328.0, 5140.0, 7864.0, 12088.0, 18230.0, 27885.0, 40917.0, 57034.0, 77661.0, 97934.0, 113154.0, 119761.0, 113445.0, 96991.0, 76660.0, 56112.0, 39474.0, 26696.0, 17744.0, 11677.0, 7745.0, 4934.0, 3317.0, 2115.0, 1426.0, 935.0, 643.0, 405.0, 259.0, 192.0, 119.0, 72.0, 66.0, 48.0, 23.0, 20.0, 12.0, 11.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-4.8515625, -4.6973876953125, -4.543212890625, -4.3890380859375, -4.23486328125, -4.0806884765625, -3.926513671875, -3.7723388671875, -3.6181640625, -3.4639892578125, -3.309814453125, -3.1556396484375, -3.00146484375, -2.8472900390625, -2.693115234375, -2.5389404296875, -2.384765625, -2.2305908203125, -2.076416015625, -1.9222412109375, -1.76806640625, -1.6138916015625, -1.459716796875, -1.3055419921875, -1.1513671875, -0.9971923828125, -0.843017578125, -0.6888427734375, -0.53466796875, -0.3804931640625, -0.226318359375, -0.0721435546875, 0.08203125, 0.2362060546875, 0.390380859375, 0.5445556640625, 0.69873046875, 0.8529052734375, 1.007080078125, 1.1612548828125, 1.3154296875, 1.4696044921875, 1.623779296875, 1.7779541015625, 1.93212890625, 2.0863037109375, 2.240478515625, 2.3946533203125, 2.548828125, 2.7030029296875, 2.857177734375, 3.0113525390625, 3.16552734375, 3.3197021484375, 3.473876953125, 3.6280517578125, 3.7822265625, 3.9364013671875, 4.090576171875, 4.2447509765625, 4.39892578125, 4.5531005859375, 4.707275390625, 4.8614501953125, 5.015625]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 6.0, 7.0, 5.0, 8.0, 14.0, 14.0, 15.0, 14.0, 20.0, 10.0, 16.0, 27.0, 32.0, 20.0, 33.0, 38.0, 32.0, 42.0, 39.0, 43.0, 35.0, 57.0, 35.0, 38.0, 43.0, 38.0, 41.0, 43.0, 39.0, 23.0, 21.0, 27.0, 15.0, 23.0, 10.0, 12.0, 14.0, 8.0, 11.0, 5.0, 4.0, 2.0, 8.0, 3.0, 5.0, 2.0, 4.0, 2.0, 2.0, 4.0], "bins": [-7.28125, -7.07537841796875, -6.8695068359375, -6.66363525390625, -6.457763671875, -6.25189208984375, -6.0460205078125, -5.84014892578125, -5.63427734375, -5.42840576171875, -5.2225341796875, -5.01666259765625, -4.810791015625, -4.60491943359375, -4.3990478515625, -4.19317626953125, -3.9873046875, -3.78143310546875, -3.5755615234375, -3.36968994140625, -3.163818359375, -2.95794677734375, -2.7520751953125, -2.54620361328125, -2.34033203125, -2.13446044921875, -1.9285888671875, -1.72271728515625, -1.516845703125, -1.31097412109375, -1.1051025390625, -0.89923095703125, -0.693359375, -0.48748779296875, -0.2816162109375, -0.07574462890625, 0.130126953125, 0.33599853515625, 0.5418701171875, 0.74774169921875, 0.95361328125, 1.15948486328125, 1.3653564453125, 1.57122802734375, 1.777099609375, 1.98297119140625, 2.1888427734375, 2.39471435546875, 2.6005859375, 2.80645751953125, 3.0123291015625, 3.21820068359375, 3.424072265625, 3.62994384765625, 3.8358154296875, 4.04168701171875, 4.24755859375, 4.45343017578125, 4.6593017578125, 4.86517333984375, 5.071044921875, 5.27691650390625, 5.4827880859375, 5.68865966796875, 5.89453125]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 8.0, 9.0, 13.0, 25.0, 37.0, 49.0, 97.0, 150.0, 238.0, 426.0, 780.0, 1339.0, 2305.0, 4040.0, 7014.0, 11907.0, 20567.0, 34895.0, 56025.0, 84582.0, 117433.0, 141691.0, 149265.0, 132665.0, 102369.0, 70131.0, 45261.0, 27442.0, 16056.0, 9208.0, 5312.0, 2983.0, 1746.0, 1003.0, 574.0, 329.0, 221.0, 140.0, 91.0, 46.0, 28.0, 31.0, 6.0, 10.0, 4.0, 4.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.51953125, -6.32354736328125, -6.1275634765625, -5.93157958984375, -5.735595703125, -5.53961181640625, -5.3436279296875, -5.14764404296875, -4.95166015625, -4.75567626953125, -4.5596923828125, -4.36370849609375, -4.167724609375, -3.97174072265625, -3.7757568359375, -3.57977294921875, -3.3837890625, -3.18780517578125, -2.9918212890625, -2.79583740234375, -2.599853515625, -2.40386962890625, -2.2078857421875, -2.01190185546875, -1.81591796875, -1.61993408203125, -1.4239501953125, -1.22796630859375, -1.031982421875, -0.83599853515625, -0.6400146484375, -0.44403076171875, -0.248046875, -0.05206298828125, 0.1439208984375, 0.33990478515625, 0.535888671875, 0.73187255859375, 0.9278564453125, 1.12384033203125, 1.31982421875, 1.51580810546875, 1.7117919921875, 1.90777587890625, 2.103759765625, 2.29974365234375, 2.4957275390625, 2.69171142578125, 2.8876953125, 3.08367919921875, 3.2796630859375, 3.47564697265625, 3.671630859375, 3.86761474609375, 4.0635986328125, 4.25958251953125, 4.45556640625, 4.65155029296875, 4.8475341796875, 5.04351806640625, 5.239501953125, 5.43548583984375, 5.6314697265625, 5.82745361328125, 6.0234375]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 9.0, 3.0, 11.0, 8.0, 10.0, 13.0, 18.0, 19.0, 20.0, 21.0, 22.0, 40.0, 37.0, 43.0, 48.0, 38.0, 29.0, 46.0, 35.0, 46.0, 51.0, 42.0, 42.0, 46.0, 49.0, 31.0, 27.0, 38.0, 28.0, 19.0, 21.0, 18.0, 14.0, 18.0, 12.0, 11.0, 10.0, 4.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.6328125, -4.499420166015625, -4.36602783203125, -4.232635498046875, -4.0992431640625, -3.965850830078125, -3.83245849609375, -3.699066162109375, -3.565673828125, -3.432281494140625, -3.29888916015625, -3.165496826171875, -3.0321044921875, -2.898712158203125, -2.76531982421875, -2.631927490234375, -2.49853515625, -2.365142822265625, -2.23175048828125, -2.098358154296875, -1.9649658203125, -1.831573486328125, -1.69818115234375, -1.564788818359375, -1.431396484375, -1.298004150390625, -1.16461181640625, -1.031219482421875, -0.8978271484375, -0.764434814453125, -0.63104248046875, -0.497650146484375, -0.3642578125, -0.230865478515625, -0.09747314453125, 0.035919189453125, 0.1693115234375, 0.302703857421875, 0.43609619140625, 0.569488525390625, 0.702880859375, 0.836273193359375, 0.96966552734375, 1.103057861328125, 1.2364501953125, 1.369842529296875, 1.50323486328125, 1.636627197265625, 1.77001953125, 1.903411865234375, 2.03680419921875, 2.170196533203125, 2.3035888671875, 2.436981201171875, 2.57037353515625, 2.703765869140625, 2.837158203125, 2.970550537109375, 3.10394287109375, 3.237335205078125, 3.3707275390625, 3.504119873046875, 3.63751220703125, 3.770904541015625, 3.904296875]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 5.0, 3.0, 24.0, 18.0, 41.0, 50.0, 64.0, 92.0, 163.0, 214.0, 352.0, 619.0, 985.0, 1679.0, 2746.0, 4701.0, 7940.0, 13629.0, 22497.0, 37570.0, 59519.0, 89776.0, 124210.0, 149981.0, 150940.0, 127974.0, 93173.0, 62388.0, 38861.0, 23657.0, 13998.0, 8281.0, 4944.0, 2870.0, 1776.0, 1093.0, 616.0, 348.0, 274.0, 156.0, 117.0, 87.0, 41.0, 28.0, 22.0, 10.0, 10.0, 3.0, 8.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.23828125, -3.140289306640625, -3.04229736328125, -2.944305419921875, -2.8463134765625, -2.748321533203125, -2.65032958984375, -2.552337646484375, -2.454345703125, -2.356353759765625, -2.25836181640625, -2.160369873046875, -2.0623779296875, -1.964385986328125, -1.86639404296875, -1.768402099609375, -1.67041015625, -1.572418212890625, -1.47442626953125, -1.376434326171875, -1.2784423828125, -1.180450439453125, -1.08245849609375, -0.984466552734375, -0.886474609375, -0.788482666015625, -0.69049072265625, -0.592498779296875, -0.4945068359375, -0.396514892578125, -0.29852294921875, -0.200531005859375, -0.1025390625, -0.004547119140625, 0.09344482421875, 0.191436767578125, 0.2894287109375, 0.387420654296875, 0.48541259765625, 0.583404541015625, 0.681396484375, 0.779388427734375, 0.87738037109375, 0.975372314453125, 1.0733642578125, 1.171356201171875, 1.26934814453125, 1.367340087890625, 1.46533203125, 1.563323974609375, 1.66131591796875, 1.759307861328125, 1.8572998046875, 1.955291748046875, 2.05328369140625, 2.151275634765625, 2.249267578125, 2.347259521484375, 2.44525146484375, 2.543243408203125, 2.6412353515625, 2.739227294921875, 2.83721923828125, 2.935211181640625, 3.033203125]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 3.0, 3.0, 7.0, 15.0, 10.0, 17.0, 19.0, 25.0, 33.0, 27.0, 37.0, 36.0, 38.0, 47.0, 57.0, 64.0, 73.0, 55.0, 44.0, 47.0, 42.0, 43.0, 41.0, 36.0, 37.0, 29.0, 21.0, 23.0, 10.0, 11.0, 16.0, 7.0, 6.0, 7.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0003685951232910156, -0.00035870447754859924, -0.00034881383180618286, -0.0003389231860637665, -0.0003290325403213501, -0.0003191418945789337, -0.00030925124883651733, -0.00029936060309410095, -0.00028946995735168457, -0.0002795793116092682, -0.0002696886658668518, -0.0002597980201244354, -0.00024990737438201904, -0.00024001672863960266, -0.00023012608289718628, -0.0002202354371547699, -0.00021034479141235352, -0.00020045414566993713, -0.00019056349992752075, -0.00018067285418510437, -0.000170782208442688, -0.0001608915627002716, -0.00015100091695785522, -0.00014111027121543884, -0.00013121962547302246, -0.00012132897973060608, -0.0001114383339881897, -0.00010154768824577332, -9.165704250335693e-05, -8.176639676094055e-05, -7.187575101852417e-05, -6.198510527610779e-05, -5.2094459533691406e-05, -4.2203813791275024e-05, -3.231316804885864e-05, -2.242252230644226e-05, -1.2531876564025879e-05, -2.641230821609497e-06, 7.249414920806885e-06, 1.7140060663223267e-05, 2.703070640563965e-05, 3.692135214805603e-05, 4.681199789047241e-05, 5.6702643632888794e-05, 6.659328937530518e-05, 7.648393511772156e-05, 8.637458086013794e-05, 9.626522660255432e-05, 0.0001061558723449707, 0.00011604651808738708, 0.00012593716382980347, 0.00013582780957221985, 0.00014571845531463623, 0.0001556091010570526, 0.000165499746799469, 0.00017539039254188538, 0.00018528103828430176, 0.00019517168402671814, 0.00020506232976913452, 0.0002149529755115509, 0.00022484362125396729, 0.00023473426699638367, 0.00024462491273880005, 0.00025451555848121643, 0.0002644062042236328]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 5.0, 4.0, 13.0, 12.0, 14.0, 34.0, 41.0, 75.0, 107.0, 140.0, 249.0, 365.0, 544.0, 822.0, 1328.0, 2106.0, 3392.0, 5178.0, 7998.0, 12713.0, 19686.0, 29960.0, 45639.0, 65781.0, 90497.0, 114293.0, 128860.0, 128271.0, 112805.0, 88071.0, 63971.0, 43961.0, 29100.0, 18805.0, 12288.0, 7579.0, 4861.0, 3264.0, 2013.0, 1318.0, 789.0, 543.0, 347.0, 261.0, 156.0, 119.0, 59.0, 49.0, 26.0, 24.0, 8.0, 6.0, 5.0, 1.0, 1.0, 3.0, 2.0, 3.0], "bins": [-2.76171875, -2.67791748046875, -2.5941162109375, -2.51031494140625, -2.426513671875, -2.34271240234375, -2.2589111328125, -2.17510986328125, -2.09130859375, -2.00750732421875, -1.9237060546875, -1.83990478515625, -1.756103515625, -1.67230224609375, -1.5885009765625, -1.50469970703125, -1.4208984375, -1.33709716796875, -1.2532958984375, -1.16949462890625, -1.085693359375, -1.00189208984375, -0.9180908203125, -0.83428955078125, -0.75048828125, -0.66668701171875, -0.5828857421875, -0.49908447265625, -0.415283203125, -0.33148193359375, -0.2476806640625, -0.16387939453125, -0.080078125, 0.00372314453125, 0.0875244140625, 0.17132568359375, 0.255126953125, 0.33892822265625, 0.4227294921875, 0.50653076171875, 0.59033203125, 0.67413330078125, 0.7579345703125, 0.84173583984375, 0.925537109375, 1.00933837890625, 1.0931396484375, 1.17694091796875, 1.2607421875, 1.34454345703125, 1.4283447265625, 1.51214599609375, 1.595947265625, 1.67974853515625, 1.7635498046875, 1.84735107421875, 1.93115234375, 2.01495361328125, 2.0987548828125, 2.18255615234375, 2.266357421875, 2.35015869140625, 2.4339599609375, 2.51776123046875, 2.6015625]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 6.0, 3.0, 7.0, 3.0, 5.0, 4.0, 10.0, 24.0, 22.0, 23.0, 31.0, 35.0, 49.0, 47.0, 55.0, 60.0, 58.0, 49.0, 54.0, 55.0, 57.0, 48.0, 51.0, 46.0, 42.0, 47.0, 19.0, 21.0, 13.0, 15.0, 13.0, 8.0, 4.0, 2.0, 7.0, 3.0, 2.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.2216796875, -1.1896591186523438, -1.1576385498046875, -1.1256179809570312, -1.093597412109375, -1.0615768432617188, -1.0295562744140625, -0.9975357055664062, -0.96551513671875, -0.9334945678710938, -0.9014739990234375, -0.8694534301757812, -0.837432861328125, -0.8054122924804688, -0.7733917236328125, -0.7413711547851562, -0.7093505859375, -0.6773300170898438, -0.6453094482421875, -0.6132888793945312, -0.581268310546875, -0.5492477416992188, -0.5172271728515625, -0.48520660400390625, -0.45318603515625, -0.42116546630859375, -0.3891448974609375, -0.35712432861328125, -0.325103759765625, -0.29308319091796875, -0.2610626220703125, -0.22904205322265625, -0.197021484375, -0.16500091552734375, -0.1329803466796875, -0.10095977783203125, -0.068939208984375, -0.03691864013671875, -0.0048980712890625, 0.02712249755859375, 0.05914306640625, 0.09116363525390625, 0.1231842041015625, 0.15520477294921875, 0.187225341796875, 0.21924591064453125, 0.2512664794921875, 0.28328704833984375, 0.3153076171875, 0.34732818603515625, 0.3793487548828125, 0.41136932373046875, 0.443389892578125, 0.47541046142578125, 0.5074310302734375, 0.5394515991210938, 0.57147216796875, 0.6034927368164062, 0.6355133056640625, 0.6675338745117188, 0.699554443359375, 0.7315750122070312, 0.7635955810546875, 0.7956161499023438, 0.82763671875]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 5.0, 3.0, 6.0, 6.0, 7.0, 8.0, 17.0, 17.0, 29.0, 34.0, 33.0, 28.0, 48.0, 51.0, 50.0, 57.0, 62.0, 66.0, 56.0, 52.0, 57.0, 41.0, 43.0, 58.0, 30.0, 34.0, 24.0, 14.0, 22.0, 13.0, 7.0, 7.0, 5.0, 7.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.916393280029297, -9.558873176574707, -9.201353073120117, -8.843832015991211, -8.486311912536621, -8.128791809082031, -7.771271705627441, -7.413751602172852, -7.0562310218811035, -6.698710918426514, -6.341190338134766, -5.983670234680176, -5.626150131225586, -5.268629550933838, -4.911109447479248, -4.5535888671875, -4.19606876373291, -3.838548421859741, -3.4810280799865723, -3.1235079765319824, -2.7659876346588135, -2.4084672927856445, -2.0509471893310547, -1.6934268474578857, -1.3359065055847168, -0.9783862233161926, -0.6208659410476685, -0.26334571838378906, 0.09417462348937988, 0.45169496536254883, 0.8092150688171387, 1.1667354106903076, 1.524256706237793, 1.881777048110962, 2.239297389984131, 2.5968174934387207, 2.9543378353118896, 3.3118581771850586, 3.6693782806396484, 4.026898384094238, 4.384418964385986, 4.741939067840576, 5.099459648132324, 5.456979751586914, 5.814499855041504, 6.172020435333252, 6.529540538787842, 6.88706111907959, 7.24458122253418, 7.6021013259887695, 7.959621906280518, 8.317142486572266, 8.674662590026855, 9.032182693481445, 9.389702796936035, 9.747222900390625, 10.104743957519531, 10.462264060974121, 10.819784164428711, 11.177305221557617, 11.534825325012207, 11.892345428466797, 12.249865531921387, 12.607385635375977, 12.964905738830566]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 7.0, 3.0, 8.0, 5.0, 13.0, 10.0, 15.0, 11.0, 14.0, 23.0, 24.0, 19.0, 38.0, 32.0, 34.0, 40.0, 24.0, 40.0, 43.0, 39.0, 32.0, 35.0, 49.0, 38.0, 45.0, 43.0, 39.0, 36.0, 37.0, 26.0, 23.0, 18.0, 28.0, 20.0, 13.0, 17.0, 16.0, 9.0, 5.0, 10.0, 2.0, 6.0, 4.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.790459156036377, -5.6042304039001465, -5.418001651763916, -5.231773376464844, -5.045544624328613, -4.859315872192383, -4.673087120056152, -4.486858367919922, -4.300629615783691, -4.114400863647461, -3.9281723499298096, -3.741943597793579, -3.5557150840759277, -3.3694863319396973, -3.183257579803467, -2.9970288276672363, -2.810800552368164, -2.6245718002319336, -2.4383432865142822, -2.2521145343780518, -2.0658860206604004, -1.87965726852417, -1.6934285163879395, -1.5071998834609985, -1.3209712505340576, -1.1347426176071167, -0.948513925075531, -0.7622852325439453, -0.5760565996170044, -0.3898279666900635, -0.203599214553833, -0.01737058162689209, 0.16885852813720703, 0.35508719086647034, 0.5413158535957336, 0.7275445461273193, 0.9137731790542603, 1.1000018119812012, 1.2862305641174316, 1.4724591970443726, 1.6586878299713135, 1.8449164628982544, 2.0311450958251953, 2.217373847961426, 2.4036026000976562, 2.5898311138153076, 2.776059865951538, 2.9622883796691895, 3.14851713180542, 3.3347458839416504, 3.5209743976593018, 3.7072031497955322, 3.8934316635131836, 4.079660415649414, 4.2658891677856445, 4.452117919921875, 4.6383466720581055, 4.824575424194336, 5.010804176330566, 5.197032928466797, 5.383261203765869, 5.5694899559021, 5.75571870803833, 5.9419474601745605, 6.128175735473633]}, "gradients/decoder.bert.encoder.layer.10.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 14.0, 15.0, 20.0, 35.0, 51.0, 94.0, 110.0, 190.0, 294.0, 434.0, 735.0, 1183.0, 1993.0, 3094.0, 5405.0, 9055.0, 16142.0, 28975.0, 52234.0, 98343.0, 185954.0, 354251.0, 631377.0, 888111.0, 809553.0, 507762.0, 274675.0, 145310.0, 78015.0, 42789.0, 23914.0, 13602.0, 8092.0, 4797.0, 2825.0, 1790.0, 1095.0, 736.0, 427.0, 282.0, 177.0, 103.0, 77.0, 51.0, 29.0, 30.0, 20.0, 11.0, 8.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.5546875, -8.2769775390625, -7.999267578125, -7.7215576171875, -7.44384765625, -7.1661376953125, -6.888427734375, -6.6107177734375, -6.3330078125, -6.0552978515625, -5.777587890625, -5.4998779296875, -5.22216796875, -4.9444580078125, -4.666748046875, -4.3890380859375, -4.111328125, -3.8336181640625, -3.555908203125, -3.2781982421875, -3.00048828125, -2.7227783203125, -2.445068359375, -2.1673583984375, -1.8896484375, -1.6119384765625, -1.334228515625, -1.0565185546875, -0.77880859375, -0.5010986328125, -0.223388671875, 0.0543212890625, 0.33203125, 0.6097412109375, 0.887451171875, 1.1651611328125, 1.44287109375, 1.7205810546875, 1.998291015625, 2.2760009765625, 2.5537109375, 2.8314208984375, 3.109130859375, 3.3868408203125, 3.66455078125, 3.9422607421875, 4.219970703125, 4.4976806640625, 4.775390625, 5.0531005859375, 5.330810546875, 5.6085205078125, 5.88623046875, 6.1639404296875, 6.441650390625, 6.7193603515625, 6.9970703125, 7.2747802734375, 7.552490234375, 7.8302001953125, 8.10791015625, 8.3856201171875, 8.663330078125, 8.9410400390625, 9.21875]}, "gradients/decoder.bert.encoder.layer.10.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 4.0, 5.0, 7.0, 6.0, 9.0, 6.0, 7.0, 9.0, 8.0, 21.0, 19.0, 25.0, 27.0, 30.0, 35.0, 39.0, 39.0, 38.0, 35.0, 51.0, 40.0, 42.0, 46.0, 39.0, 41.0, 39.0, 42.0, 37.0, 26.0, 31.0, 24.0, 25.0, 20.0, 24.0, 19.0, 23.0, 10.0, 15.0, 5.0, 9.0, 8.0, 5.0, 5.0, 2.0, 5.0, 0.0, 1.0, 4.0, 2.0, 0.0, 0.0, 2.0], "bins": [-4.76953125, -4.62872314453125, -4.4879150390625, -4.34710693359375, -4.206298828125, -4.06549072265625, -3.9246826171875, -3.78387451171875, -3.64306640625, -3.50225830078125, -3.3614501953125, -3.22064208984375, -3.079833984375, -2.93902587890625, -2.7982177734375, -2.65740966796875, -2.5166015625, -2.37579345703125, -2.2349853515625, -2.09417724609375, -1.953369140625, -1.81256103515625, -1.6717529296875, -1.53094482421875, -1.39013671875, -1.24932861328125, -1.1085205078125, -0.96771240234375, -0.826904296875, -0.68609619140625, -0.5452880859375, -0.40447998046875, -0.263671875, -0.12286376953125, 0.0179443359375, 0.15875244140625, 0.299560546875, 0.44036865234375, 0.5811767578125, 0.72198486328125, 0.86279296875, 1.00360107421875, 1.1444091796875, 1.28521728515625, 1.426025390625, 1.56683349609375, 1.7076416015625, 1.84844970703125, 1.9892578125, 2.13006591796875, 2.2708740234375, 2.41168212890625, 2.552490234375, 2.69329833984375, 2.8341064453125, 2.97491455078125, 3.11572265625, 3.25653076171875, 3.3973388671875, 3.53814697265625, 3.678955078125, 3.81976318359375, 3.9605712890625, 4.10137939453125, 4.2421875]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 5.0, 4.0, 7.0, 7.0, 14.0, 23.0, 24.0, 49.0, 45.0, 67.0, 147.0, 217.0, 284.0, 405.0, 700.0, 1151.0, 1854.0, 3125.0, 5060.0, 8882.0, 15435.0, 28123.0, 52005.0, 97650.0, 183856.0, 337894.0, 577766.0, 813470.0, 800657.0, 558036.0, 323969.0, 176004.0, 93866.0, 50159.0, 27161.0, 14986.0, 8391.0, 4961.0, 2885.0, 1842.0, 1080.0, 721.0, 400.0, 308.0, 185.0, 133.0, 87.0, 58.0, 36.0, 30.0, 29.0, 14.0, 8.0, 13.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.3515625, -9.049560546875, -8.74755859375, -8.445556640625, -8.1435546875, -7.841552734375, -7.53955078125, -7.237548828125, -6.935546875, -6.633544921875, -6.33154296875, -6.029541015625, -5.7275390625, -5.425537109375, -5.12353515625, -4.821533203125, -4.51953125, -4.217529296875, -3.91552734375, -3.613525390625, -3.3115234375, -3.009521484375, -2.70751953125, -2.405517578125, -2.103515625, -1.801513671875, -1.49951171875, -1.197509765625, -0.8955078125, -0.593505859375, -0.29150390625, 0.010498046875, 0.3125, 0.614501953125, 0.91650390625, 1.218505859375, 1.5205078125, 1.822509765625, 2.12451171875, 2.426513671875, 2.728515625, 3.030517578125, 3.33251953125, 3.634521484375, 3.9365234375, 4.238525390625, 4.54052734375, 4.842529296875, 5.14453125, 5.446533203125, 5.74853515625, 6.050537109375, 6.3525390625, 6.654541015625, 6.95654296875, 7.258544921875, 7.560546875, 7.862548828125, 8.16455078125, 8.466552734375, 8.7685546875, 9.070556640625, 9.37255859375, 9.674560546875, 9.9765625]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 8.0, 8.0, 16.0, 14.0, 21.0, 13.0, 24.0, 34.0, 35.0, 59.0, 61.0, 73.0, 69.0, 104.0, 114.0, 134.0, 133.0, 191.0, 207.0, 191.0, 211.0, 236.0, 211.0, 224.0, 204.0, 209.0, 189.0, 188.0, 146.0, 126.0, 105.0, 97.0, 83.0, 61.0, 52.0, 53.0, 35.0, 34.0, 23.0, 15.0, 20.0, 11.0, 8.0, 5.0, 10.0, 5.0, 2.0, 1.0, 0.0, 1.0, 3.0], "bins": [-2.794921875, -2.715911865234375, -2.63690185546875, -2.557891845703125, -2.4788818359375, -2.399871826171875, -2.32086181640625, -2.241851806640625, -2.162841796875, -2.083831787109375, -2.00482177734375, -1.925811767578125, -1.8468017578125, -1.767791748046875, -1.68878173828125, -1.609771728515625, -1.53076171875, -1.451751708984375, -1.37274169921875, -1.293731689453125, -1.2147216796875, -1.135711669921875, -1.05670166015625, -0.977691650390625, -0.898681640625, -0.819671630859375, -0.74066162109375, -0.661651611328125, -0.5826416015625, -0.503631591796875, -0.42462158203125, -0.345611572265625, -0.2666015625, -0.187591552734375, -0.10858154296875, -0.029571533203125, 0.0494384765625, 0.128448486328125, 0.20745849609375, 0.286468505859375, 0.365478515625, 0.444488525390625, 0.52349853515625, 0.602508544921875, 0.6815185546875, 0.760528564453125, 0.83953857421875, 0.918548583984375, 0.99755859375, 1.076568603515625, 1.15557861328125, 1.234588623046875, 1.3135986328125, 1.392608642578125, 1.47161865234375, 1.550628662109375, 1.629638671875, 1.708648681640625, 1.78765869140625, 1.866668701171875, 1.9456787109375, 2.024688720703125, 2.10369873046875, 2.182708740234375, 2.26171875]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 9.0, 7.0, 7.0, 14.0, 11.0, 15.0, 14.0, 26.0, 35.0, 34.0, 36.0, 47.0, 51.0, 65.0, 50.0, 59.0, 53.0, 58.0, 53.0, 69.0, 52.0, 40.0, 46.0, 24.0, 27.0, 25.0, 13.0, 17.0, 8.0, 7.0, 8.0, 8.0, 4.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.228531837463379, -8.877561569213867, -8.526591300964355, -8.175621032714844, -7.824650287628174, -7.473680019378662, -7.122709274291992, -6.7717390060424805, -6.420768737792969, -6.069798469543457, -5.718828201293945, -5.367857456207275, -5.016887187957764, -4.665916919708252, -4.314946174621582, -3.9639759063720703, -3.6130056381225586, -3.262035369873047, -2.911064863204956, -2.5600943565368652, -2.2091240882873535, -1.8581537008285522, -1.507183313369751, -1.1562128067016602, -0.8052425384521484, -0.45427215099334717, -0.1033017635345459, 0.24766862392425537, 0.5986390113830566, 0.9496093988418579, 1.3005797863006592, 1.65155029296875, 2.0025196075439453, 2.353489875793457, 2.704460382461548, 3.0554308891296387, 3.4064011573791504, 3.757371425628662, 4.108342170715332, 4.459312438964844, 4.8102827072143555, 5.161252975463867, 5.512223243713379, 5.863193988800049, 6.2141642570495605, 6.565134525299072, 6.916105270385742, 7.267075538635254, 7.618045806884766, 7.969016075134277, 8.319986343383789, 8.6709566116333, 9.021926879882812, 9.37289810180664, 9.723868370056152, 10.074838638305664, 10.425808906555176, 10.776779174804688, 11.1277494430542, 11.478719711303711, 11.829690933227539, 12.18066120147705, 12.531631469726562, 12.882601737976074, 13.233572006225586]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 3.0, 6.0, 6.0, 11.0, 9.0, 11.0, 12.0, 21.0, 15.0, 22.0, 22.0, 32.0, 28.0, 25.0, 27.0, 42.0, 38.0, 31.0, 52.0, 48.0, 45.0, 58.0, 46.0, 50.0, 37.0, 33.0, 31.0, 31.0, 27.0, 31.0, 17.0, 20.0, 21.0, 14.0, 9.0, 12.0, 13.0, 13.0, 10.0, 8.0, 6.0, 5.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-6.594196796417236, -6.414300441741943, -6.23440408706665, -6.054508209228516, -5.874611854553223, -5.69471549987793, -5.514819145202637, -5.334922790527344, -5.155026435852051, -4.975130081176758, -4.795233726501465, -4.615337371826172, -4.435441493988037, -4.255545139312744, -4.075648784637451, -3.895752429962158, -3.7158565521240234, -3.5359601974487305, -3.3560640811920166, -3.1761677265167236, -2.9962716102600098, -2.816375255584717, -2.636478900909424, -2.456582546234131, -2.276686429977417, -2.096790075302124, -1.9168939590454102, -1.7369976043701172, -1.5571013689041138, -1.3772051334381104, -1.1973087787628174, -1.017412543296814, -0.8375167846679688, -0.6576205492019653, -0.47772425413131714, -0.29782795906066895, -0.11793172359466553, 0.06196451187133789, 0.24186086654663086, 0.4217571020126343, 0.6016533374786377, 0.7815495729446411, 0.9614458680152893, 1.1413421630859375, 1.321238398551941, 1.5011346340179443, 1.6810309886932373, 1.8609272241592407, 2.040823459625244, 2.220719814300537, 2.400615930557251, 2.580512285232544, 2.760408401489258, 2.940304756164551, 3.1202011108398438, 3.3000974655151367, 3.4799935817718506, 3.6598899364471436, 3.8397860527038574, 4.01968240737915, 4.199578762054443, 4.379474639892578, 4.559370994567871, 4.739267349243164, 4.919163703918457]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 6.0, 2.0, 6.0, 17.0, 12.0, 17.0, 29.0, 38.0, 80.0, 103.0, 139.0, 216.0, 311.0, 526.0, 701.0, 1048.0, 1525.0, 2467.0, 3715.0, 5386.0, 8173.0, 12117.0, 17979.0, 26500.0, 38953.0, 55395.0, 74758.0, 96711.0, 115215.0, 121922.0, 114950.0, 97666.0, 75450.0, 55261.0, 39251.0, 26870.0, 18143.0, 12232.0, 8260.0, 5393.0, 3635.0, 2424.0, 1635.0, 1129.0, 727.0, 497.0, 323.0, 225.0, 136.0, 81.0, 74.0, 46.0, 30.0, 27.0, 13.0, 7.0, 7.0, 4.0, 3.0, 1.0, 2.0], "bins": [-2.560546875, -2.481781005859375, -2.40301513671875, -2.324249267578125, -2.2454833984375, -2.166717529296875, -2.08795166015625, -2.009185791015625, -1.930419921875, -1.851654052734375, -1.77288818359375, -1.694122314453125, -1.6153564453125, -1.536590576171875, -1.45782470703125, -1.379058837890625, -1.30029296875, -1.221527099609375, -1.14276123046875, -1.063995361328125, -0.9852294921875, -0.906463623046875, -0.82769775390625, -0.748931884765625, -0.670166015625, -0.591400146484375, -0.51263427734375, -0.433868408203125, -0.3551025390625, -0.276336669921875, -0.19757080078125, -0.118804931640625, -0.0400390625, 0.038726806640625, 0.11749267578125, 0.196258544921875, 0.2750244140625, 0.353790283203125, 0.43255615234375, 0.511322021484375, 0.590087890625, 0.668853759765625, 0.74761962890625, 0.826385498046875, 0.9051513671875, 0.983917236328125, 1.06268310546875, 1.141448974609375, 1.22021484375, 1.298980712890625, 1.37774658203125, 1.456512451171875, 1.5352783203125, 1.614044189453125, 1.69281005859375, 1.771575927734375, 1.850341796875, 1.929107666015625, 2.00787353515625, 2.086639404296875, 2.1654052734375, 2.244171142578125, 2.32293701171875, 2.401702880859375, 2.48046875]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 9.0, 4.0, 3.0, 7.0, 9.0, 14.0, 7.0, 5.0, 18.0, 18.0, 24.0, 29.0, 29.0, 25.0, 33.0, 29.0, 31.0, 22.0, 36.0, 37.0, 40.0, 49.0, 45.0, 37.0, 57.0, 33.0, 37.0, 18.0, 30.0, 26.0, 40.0, 24.0, 24.0, 18.0, 25.0, 27.0, 14.0, 12.0, 8.0, 8.0, 7.0, 7.0, 8.0, 11.0, 7.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.50390625, -6.3167724609375, -6.129638671875, -5.9425048828125, -5.75537109375, -5.5682373046875, -5.381103515625, -5.1939697265625, -5.0068359375, -4.8197021484375, -4.632568359375, -4.4454345703125, -4.25830078125, -4.0711669921875, -3.884033203125, -3.6968994140625, -3.509765625, -3.3226318359375, -3.135498046875, -2.9483642578125, -2.76123046875, -2.5740966796875, -2.386962890625, -2.1998291015625, -2.0126953125, -1.8255615234375, -1.638427734375, -1.4512939453125, -1.26416015625, -1.0770263671875, -0.889892578125, -0.7027587890625, -0.515625, -0.3284912109375, -0.141357421875, 0.0457763671875, 0.23291015625, 0.4200439453125, 0.607177734375, 0.7943115234375, 0.9814453125, 1.1685791015625, 1.355712890625, 1.5428466796875, 1.72998046875, 1.9171142578125, 2.104248046875, 2.2913818359375, 2.478515625, 2.6656494140625, 2.852783203125, 3.0399169921875, 3.22705078125, 3.4141845703125, 3.601318359375, 3.7884521484375, 3.9755859375, 4.1627197265625, 4.349853515625, 4.5369873046875, 4.72412109375, 4.9112548828125, 5.098388671875, 5.2855224609375, 5.47265625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.weight": {"_type": "histogram", "values": [5.0, 0.0, 5.0, 4.0, 1.0, 10.0, 13.0, 17.0, 31.0, 37.0, 59.0, 73.0, 128.0, 176.0, 228.0, 389.0, 596.0, 876.0, 1350.0, 1987.0, 3093.0, 5124.0, 8035.0, 12932.0, 20882.0, 33696.0, 54788.0, 86905.0, 129487.0, 166781.0, 166775.0, 128031.0, 85087.0, 53427.0, 33197.0, 20293.0, 12395.0, 7822.0, 4911.0, 3069.0, 1994.0, 1251.0, 879.0, 534.0, 364.0, 275.0, 190.0, 118.0, 85.0, 43.0, 42.0, 31.0, 17.0, 11.0, 10.0, 5.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.57421875, -3.45501708984375, -3.3358154296875, -3.21661376953125, -3.097412109375, -2.97821044921875, -2.8590087890625, -2.73980712890625, -2.62060546875, -2.50140380859375, -2.3822021484375, -2.26300048828125, -2.143798828125, -2.02459716796875, -1.9053955078125, -1.78619384765625, -1.6669921875, -1.54779052734375, -1.4285888671875, -1.30938720703125, -1.190185546875, -1.07098388671875, -0.9517822265625, -0.83258056640625, -0.71337890625, -0.59417724609375, -0.4749755859375, -0.35577392578125, -0.236572265625, -0.11737060546875, 0.0018310546875, 0.12103271484375, 0.240234375, 0.35943603515625, 0.4786376953125, 0.59783935546875, 0.717041015625, 0.83624267578125, 0.9554443359375, 1.07464599609375, 1.19384765625, 1.31304931640625, 1.4322509765625, 1.55145263671875, 1.670654296875, 1.78985595703125, 1.9090576171875, 2.02825927734375, 2.1474609375, 2.26666259765625, 2.3858642578125, 2.50506591796875, 2.624267578125, 2.74346923828125, 2.8626708984375, 2.98187255859375, 3.10107421875, 3.22027587890625, 3.3394775390625, 3.45867919921875, 3.577880859375, 3.69708251953125, 3.8162841796875, 3.93548583984375, 4.0546875]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 2.0, 4.0, 7.0, 5.0, 5.0, 8.0, 12.0, 18.0, 13.0, 9.0, 26.0, 32.0, 30.0, 35.0, 22.0, 27.0, 20.0, 26.0, 37.0, 36.0, 29.0, 41.0, 43.0, 43.0, 40.0, 32.0, 37.0, 50.0, 29.0, 33.0, 33.0, 29.0, 26.0, 30.0, 21.0, 19.0, 19.0, 9.0, 9.0, 11.0, 12.0, 5.0, 10.0, 4.0, 4.0, 7.0, 3.0, 4.0, 0.0, 0.0, 1.0], "bins": [-4.046875, -3.93170166015625, -3.8165283203125, -3.70135498046875, -3.586181640625, -3.47100830078125, -3.3558349609375, -3.24066162109375, -3.12548828125, -3.01031494140625, -2.8951416015625, -2.77996826171875, -2.664794921875, -2.54962158203125, -2.4344482421875, -2.31927490234375, -2.2041015625, -2.08892822265625, -1.9737548828125, -1.85858154296875, -1.743408203125, -1.62823486328125, -1.5130615234375, -1.39788818359375, -1.28271484375, -1.16754150390625, -1.0523681640625, -0.93719482421875, -0.822021484375, -0.70684814453125, -0.5916748046875, -0.47650146484375, -0.361328125, -0.24615478515625, -0.1309814453125, -0.01580810546875, 0.099365234375, 0.21453857421875, 0.3297119140625, 0.44488525390625, 0.56005859375, 0.67523193359375, 0.7904052734375, 0.90557861328125, 1.020751953125, 1.13592529296875, 1.2510986328125, 1.36627197265625, 1.4814453125, 1.59661865234375, 1.7117919921875, 1.82696533203125, 1.942138671875, 2.05731201171875, 2.1724853515625, 2.28765869140625, 2.40283203125, 2.51800537109375, 2.6331787109375, 2.74835205078125, 2.863525390625, 2.97869873046875, 3.0938720703125, 3.20904541015625, 3.32421875]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 6.0, 7.0, 10.0, 12.0, 11.0, 16.0, 35.0, 36.0, 55.0, 92.0, 118.0, 179.0, 270.0, 404.0, 541.0, 883.0, 1282.0, 1996.0, 2932.0, 4522.0, 7213.0, 11484.0, 18963.0, 30266.0, 50516.0, 83080.0, 130342.0, 179015.0, 179816.0, 129497.0, 82750.0, 50538.0, 30752.0, 18814.0, 11506.0, 7175.0, 4571.0, 2982.0, 1893.0, 1271.0, 845.0, 575.0, 374.0, 287.0, 188.0, 136.0, 94.0, 77.0, 35.0, 23.0, 23.0, 17.0, 11.0, 14.0, 6.0, 0.0, 6.0, 3.0, 2.0, 3.0], "bins": [-1.857421875, -1.79937744140625, -1.7413330078125, -1.68328857421875, -1.625244140625, -1.56719970703125, -1.5091552734375, -1.45111083984375, -1.39306640625, -1.33502197265625, -1.2769775390625, -1.21893310546875, -1.160888671875, -1.10284423828125, -1.0447998046875, -0.98675537109375, -0.9287109375, -0.87066650390625, -0.8126220703125, -0.75457763671875, -0.696533203125, -0.63848876953125, -0.5804443359375, -0.52239990234375, -0.46435546875, -0.40631103515625, -0.3482666015625, -0.29022216796875, -0.232177734375, -0.17413330078125, -0.1160888671875, -0.05804443359375, 0.0, 0.05804443359375, 0.1160888671875, 0.17413330078125, 0.232177734375, 0.29022216796875, 0.3482666015625, 0.40631103515625, 0.46435546875, 0.52239990234375, 0.5804443359375, 0.63848876953125, 0.696533203125, 0.75457763671875, 0.8126220703125, 0.87066650390625, 0.9287109375, 0.98675537109375, 1.0447998046875, 1.10284423828125, 1.160888671875, 1.21893310546875, 1.2769775390625, 1.33502197265625, 1.39306640625, 1.45111083984375, 1.5091552734375, 1.56719970703125, 1.625244140625, 1.68328857421875, 1.7413330078125, 1.79937744140625, 1.857421875]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 8.0, 5.0, 3.0, 4.0, 5.0, 4.0, 6.0, 10.0, 6.0, 11.0, 13.0, 15.0, 12.0, 19.0, 21.0, 24.0, 33.0, 29.0, 48.0, 34.0, 41.0, 61.0, 55.0, 56.0, 43.0, 42.0, 49.0, 44.0, 38.0, 46.0, 35.0, 33.0, 23.0, 24.0, 21.0, 20.0, 14.0, 9.0, 11.0, 4.0, 3.0, 6.0, 6.0, 5.0, 3.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.000301361083984e-05, -8.718203753232956e-05, -8.436106145381927e-05, -8.154008537530899e-05, -7.87191092967987e-05, -7.589813321828842e-05, -7.307715713977814e-05, -7.025618106126785e-05, -6.743520498275757e-05, -6.461422890424728e-05, -6.1793252825737e-05, -5.8972276747226715e-05, -5.615130066871643e-05, -5.3330324590206146e-05, -5.050934851169586e-05, -4.768837243318558e-05, -4.486739635467529e-05, -4.204642027616501e-05, -3.9225444197654724e-05, -3.640446811914444e-05, -3.3583492040634155e-05, -3.076251596212387e-05, -2.7941539883613586e-05, -2.5120563805103302e-05, -2.2299587726593018e-05, -1.9478611648082733e-05, -1.665763556957245e-05, -1.3836659491062164e-05, -1.101568341255188e-05, -8.194707334041595e-06, -5.373731255531311e-06, -2.5527551770210266e-06, 2.682209014892578e-07, 3.0891969799995422e-06, 5.910173058509827e-06, 8.731149137020111e-06, 1.1552125215530396e-05, 1.437310129404068e-05, 1.7194077372550964e-05, 2.001505345106125e-05, 2.2836029529571533e-05, 2.5657005608081818e-05, 2.8477981686592102e-05, 3.1298957765102386e-05, 3.411993384361267e-05, 3.6940909922122955e-05, 3.976188600063324e-05, 4.2582862079143524e-05, 4.540383815765381e-05, 4.822481423616409e-05, 5.104579031467438e-05, 5.386676639318466e-05, 5.6687742471694946e-05, 5.950871855020523e-05, 6.232969462871552e-05, 6.51506707072258e-05, 6.797164678573608e-05, 7.079262286424637e-05, 7.361359894275665e-05, 7.643457502126694e-05, 7.925555109977722e-05, 8.20765271782875e-05, 8.489750325679779e-05, 8.771847933530807e-05, 9.053945541381836e-05]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 9.0, 10.0, 7.0, 11.0, 14.0, 26.0, 39.0, 52.0, 86.0, 119.0, 174.0, 268.0, 412.0, 632.0, 1064.0, 1645.0, 2604.0, 4260.0, 6964.0, 11041.0, 17600.0, 27882.0, 44416.0, 66551.0, 95234.0, 124045.0, 142241.0, 137995.0, 115581.0, 85859.0, 58592.0, 38545.0, 24348.0, 14903.0, 9497.0, 5900.0, 3599.0, 2324.0, 1452.0, 902.0, 580.0, 353.0, 260.0, 158.0, 89.0, 71.0, 48.0, 38.0, 19.0, 15.0, 10.0, 6.0, 8.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.505859375, -1.45703125, -1.408203125, -1.359375, -1.310546875, -1.26171875, -1.212890625, -1.1640625, -1.115234375, -1.06640625, -1.017578125, -0.96875, -0.919921875, -0.87109375, -0.822265625, -0.7734375, -0.724609375, -0.67578125, -0.626953125, -0.578125, -0.529296875, -0.48046875, -0.431640625, -0.3828125, -0.333984375, -0.28515625, -0.236328125, -0.1875, -0.138671875, -0.08984375, -0.041015625, 0.0078125, 0.056640625, 0.10546875, 0.154296875, 0.203125, 0.251953125, 0.30078125, 0.349609375, 0.3984375, 0.447265625, 0.49609375, 0.544921875, 0.59375, 0.642578125, 0.69140625, 0.740234375, 0.7890625, 0.837890625, 0.88671875, 0.935546875, 0.984375, 1.033203125, 1.08203125, 1.130859375, 1.1796875, 1.228515625, 1.27734375, 1.326171875, 1.375, 1.423828125, 1.47265625, 1.521484375, 1.5703125, 1.619140625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 6.0, 7.0, 7.0, 7.0, 20.0, 15.0, 15.0, 16.0, 23.0, 20.0, 22.0, 26.0, 48.0, 37.0, 51.0, 33.0, 35.0, 35.0, 55.0, 55.0, 52.0, 45.0, 41.0, 49.0, 37.0, 31.0, 26.0, 28.0, 35.0, 18.0, 13.0, 13.0, 14.0, 7.0, 20.0, 4.0, 4.0, 10.0, 2.0, 9.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.42333984375, -0.4093818664550781, -0.39542388916015625, -0.3814659118652344, -0.3675079345703125, -0.3535499572753906, -0.33959197998046875, -0.3256340026855469, -0.311676025390625, -0.2977180480957031, -0.28376007080078125, -0.2698020935058594, -0.2558441162109375, -0.24188613891601562, -0.22792816162109375, -0.21397018432617188, -0.20001220703125, -0.18605422973632812, -0.17209625244140625, -0.15813827514648438, -0.1441802978515625, -0.13022232055664062, -0.11626434326171875, -0.10230636596679688, -0.088348388671875, -0.07439041137695312, -0.06043243408203125, -0.046474456787109375, -0.0325164794921875, -0.018558502197265625, -0.00460052490234375, 0.009357452392578125, 0.0233154296875, 0.037273406982421875, 0.05123138427734375, 0.06518936157226562, 0.0791473388671875, 0.09310531616210938, 0.10706329345703125, 0.12102127075195312, 0.134979248046875, 0.14893722534179688, 0.16289520263671875, 0.17685317993164062, 0.1908111572265625, 0.20476913452148438, 0.21872711181640625, 0.23268508911132812, 0.24664306640625, 0.2606010437011719, 0.27455902099609375, 0.2885169982910156, 0.3024749755859375, 0.3164329528808594, 0.33039093017578125, 0.3443489074707031, 0.358306884765625, 0.3722648620605469, 0.38622283935546875, 0.4001808166503906, 0.4141387939453125, 0.4280967712402344, 0.44205474853515625, 0.4560127258300781, 0.469970703125]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 7.0, 8.0, 6.0, 14.0, 11.0, 15.0, 17.0, 27.0, 32.0, 38.0, 35.0, 44.0, 58.0, 57.0, 56.0, 57.0, 60.0, 57.0, 63.0, 52.0, 50.0, 47.0, 42.0, 24.0, 23.0, 21.0, 20.0, 8.0, 13.0, 8.0, 9.0, 7.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.432392120361328, -9.08504867553711, -8.73770523071289, -8.390361785888672, -8.04301929473877, -7.695675849914551, -7.348332405090332, -7.000988960266113, -6.653645992279053, -6.306302547454834, -5.958959579467773, -5.611616134643555, -5.264272689819336, -4.916929721832275, -4.569586277008057, -4.222243309020996, -3.8748998641967773, -3.5275566577911377, -3.180213451385498, -2.8328700065612793, -2.4855268001556396, -2.13818359375, -1.7908401489257812, -1.4434969425201416, -1.096153736114502, -0.7488104701042175, -0.4014672040939331, -0.054123878479003906, 0.29321932792663574, 0.6405625343322754, 0.9879059791564941, 1.3352491855621338, 1.682591438293457, 2.0299346446990967, 2.3772778511047363, 2.724621295928955, 3.0719645023345947, 3.4193077087402344, 3.766651153564453, 4.113994598388672, 4.461337566375732, 4.808681011199951, 5.156023979187012, 5.5033674240112305, 5.850710868835449, 6.19805383682251, 6.5453972816467285, 6.892740249633789, 7.240083694458008, 7.587427139282227, 7.934770107269287, 8.282114028930664, 8.629456520080566, 8.976799964904785, 9.324143409729004, 9.671486854553223, 10.018829345703125, 10.366172790527344, 10.713516235351562, 11.060859680175781, 11.408202171325684, 11.755545616149902, 12.102889060974121, 12.45023250579834, 12.797575950622559]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 7.0, 2.0, 6.0, 5.0, 4.0, 11.0, 8.0, 12.0, 16.0, 16.0, 19.0, 17.0, 24.0, 27.0, 32.0, 27.0, 25.0, 35.0, 42.0, 40.0, 38.0, 51.0, 38.0, 61.0, 50.0, 42.0, 41.0, 31.0, 36.0, 31.0, 30.0, 24.0, 27.0, 17.0, 18.0, 15.0, 14.0, 11.0, 14.0, 9.0, 11.0, 9.0, 7.0, 6.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-6.471033573150635, -6.295192241668701, -6.119350910186768, -5.943509101867676, -5.767667770385742, -5.591826438903809, -5.415985107421875, -5.240143775939941, -5.064302444458008, -4.888461112976074, -4.712619781494141, -4.536778450012207, -4.360936641693115, -4.185095310211182, -4.009253978729248, -3.8334126472473145, -3.6575710773468018, -3.481729745864868, -3.3058881759643555, -3.130046844482422, -2.9542055130004883, -2.7783641815185547, -2.602522611618042, -2.4266812801361084, -2.2508397102355957, -2.074998378753662, -1.899156928062439, -1.7233154773712158, -1.5474741458892822, -1.371632695198059, -1.195791244506836, -1.0199499130249023, -0.8441085815429688, -0.6682671904563904, -0.4924257695674896, -0.31658434867858887, -0.1407429575920105, 0.03509843349456787, 0.21093988418579102, 0.3867812156677246, 0.5626226663589478, 0.7384640574455261, 0.9143054485321045, 1.0901468992233276, 1.2659883499145508, 1.4418296813964844, 1.6176711320877075, 1.7935124635696411, 1.9693539142608643, 2.145195245742798, 2.3210368156433105, 2.496878147125244, 2.6727194786071777, 2.8485608100891113, 3.024402379989624, 3.2002437114715576, 3.3760852813720703, 3.551926612854004, 3.7277681827545166, 3.90360951423645, 4.079451084136963, 4.2552924156188965, 4.43113374710083, 4.606975078582764, 4.782816410064697]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 7.0, 9.0, 11.0, 20.0, 26.0, 37.0, 61.0, 75.0, 128.0, 183.0, 325.0, 514.0, 845.0, 1522.0, 2568.0, 4825.0, 8588.0, 16034.0, 29407.0, 52696.0, 88984.0, 135907.0, 172869.0, 174273.0, 140369.0, 93407.0, 55522.0, 31245.0, 17058.0, 9206.0, 5012.0, 2725.0, 1665.0, 960.0, 557.0, 327.0, 231.0, 126.0, 79.0, 50.0, 32.0, 22.0, 20.0, 15.0, 9.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.51171875, -7.27734375, -7.04296875, -6.80859375, -6.57421875, -6.33984375, -6.10546875, -5.87109375, -5.63671875, -5.40234375, -5.16796875, -4.93359375, -4.69921875, -4.46484375, -4.23046875, -3.99609375, -3.76171875, -3.52734375, -3.29296875, -3.05859375, -2.82421875, -2.58984375, -2.35546875, -2.12109375, -1.88671875, -1.65234375, -1.41796875, -1.18359375, -0.94921875, -0.71484375, -0.48046875, -0.24609375, -0.01171875, 0.22265625, 0.45703125, 0.69140625, 0.92578125, 1.16015625, 1.39453125, 1.62890625, 1.86328125, 2.09765625, 2.33203125, 2.56640625, 2.80078125, 3.03515625, 3.26953125, 3.50390625, 3.73828125, 3.97265625, 4.20703125, 4.44140625, 4.67578125, 4.91015625, 5.14453125, 5.37890625, 5.61328125, 5.84765625, 6.08203125, 6.31640625, 6.55078125, 6.78515625, 7.01953125, 7.25390625, 7.48828125]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 8.0, 7.0, 3.0, 10.0, 11.0, 14.0, 16.0, 19.0, 22.0, 18.0, 25.0, 27.0, 25.0, 27.0, 28.0, 35.0, 42.0, 47.0, 42.0, 36.0, 48.0, 46.0, 51.0, 43.0, 36.0, 35.0, 35.0, 36.0, 38.0, 28.0, 16.0, 25.0, 16.0, 18.0, 9.0, 11.0, 7.0, 7.0, 8.0, 4.0, 12.0, 6.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.38671875, -6.18341064453125, -5.9801025390625, -5.77679443359375, -5.573486328125, -5.37017822265625, -5.1668701171875, -4.96356201171875, -4.76025390625, -4.55694580078125, -4.3536376953125, -4.15032958984375, -3.947021484375, -3.74371337890625, -3.5404052734375, -3.33709716796875, -3.1337890625, -2.93048095703125, -2.7271728515625, -2.52386474609375, -2.320556640625, -2.11724853515625, -1.9139404296875, -1.71063232421875, -1.50732421875, -1.30401611328125, -1.1007080078125, -0.89739990234375, -0.694091796875, -0.49078369140625, -0.2874755859375, -0.08416748046875, 0.119140625, 0.32244873046875, 0.5257568359375, 0.72906494140625, 0.932373046875, 1.13568115234375, 1.3389892578125, 1.54229736328125, 1.74560546875, 1.94891357421875, 2.1522216796875, 2.35552978515625, 2.558837890625, 2.76214599609375, 2.9654541015625, 3.16876220703125, 3.3720703125, 3.57537841796875, 3.7786865234375, 3.98199462890625, 4.185302734375, 4.38861083984375, 4.5919189453125, 4.79522705078125, 4.99853515625, 5.20184326171875, 5.4051513671875, 5.60845947265625, 5.811767578125, 6.01507568359375, 6.2183837890625, 6.42169189453125, 6.625]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 4.0, 12.0, 13.0, 15.0, 23.0, 39.0, 52.0, 74.0, 132.0, 177.0, 316.0, 574.0, 950.0, 1521.0, 2604.0, 4510.0, 7555.0, 13227.0, 22864.0, 38510.0, 62392.0, 95261.0, 129432.0, 152477.0, 151396.0, 125310.0, 91386.0, 59440.0, 36324.0, 21802.0, 12523.0, 7219.0, 4290.0, 2481.0, 1412.0, 889.0, 507.0, 324.0, 193.0, 127.0, 75.0, 37.0, 35.0, 22.0, 8.0, 11.0, 4.0, 8.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.93359375, -6.72314453125, -6.5126953125, -6.30224609375, -6.091796875, -5.88134765625, -5.6708984375, -5.46044921875, -5.25, -5.03955078125, -4.8291015625, -4.61865234375, -4.408203125, -4.19775390625, -3.9873046875, -3.77685546875, -3.56640625, -3.35595703125, -3.1455078125, -2.93505859375, -2.724609375, -2.51416015625, -2.3037109375, -2.09326171875, -1.8828125, -1.67236328125, -1.4619140625, -1.25146484375, -1.041015625, -0.83056640625, -0.6201171875, -0.40966796875, -0.19921875, 0.01123046875, 0.2216796875, 0.43212890625, 0.642578125, 0.85302734375, 1.0634765625, 1.27392578125, 1.484375, 1.69482421875, 1.9052734375, 2.11572265625, 2.326171875, 2.53662109375, 2.7470703125, 2.95751953125, 3.16796875, 3.37841796875, 3.5888671875, 3.79931640625, 4.009765625, 4.22021484375, 4.4306640625, 4.64111328125, 4.8515625, 5.06201171875, 5.2724609375, 5.48291015625, 5.693359375, 5.90380859375, 6.1142578125, 6.32470703125, 6.53515625]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 3.0, 6.0, 12.0, 10.0, 13.0, 14.0, 12.0, 18.0, 26.0, 18.0, 26.0, 30.0, 31.0, 27.0, 26.0, 37.0, 36.0, 49.0, 41.0, 34.0, 46.0, 40.0, 43.0, 40.0, 39.0, 43.0, 32.0, 26.0, 29.0, 33.0, 25.0, 22.0, 16.0, 19.0, 15.0, 10.0, 12.0, 6.0, 10.0, 5.0, 5.0, 3.0, 6.0, 7.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.23046875, -3.114501953125, -2.99853515625, -2.882568359375, -2.7666015625, -2.650634765625, -2.53466796875, -2.418701171875, -2.302734375, -2.186767578125, -2.07080078125, -1.954833984375, -1.8388671875, -1.722900390625, -1.60693359375, -1.490966796875, -1.375, -1.259033203125, -1.14306640625, -1.027099609375, -0.9111328125, -0.795166015625, -0.67919921875, -0.563232421875, -0.447265625, -0.331298828125, -0.21533203125, -0.099365234375, 0.0166015625, 0.132568359375, 0.24853515625, 0.364501953125, 0.48046875, 0.596435546875, 0.71240234375, 0.828369140625, 0.9443359375, 1.060302734375, 1.17626953125, 1.292236328125, 1.408203125, 1.524169921875, 1.64013671875, 1.756103515625, 1.8720703125, 1.988037109375, 2.10400390625, 2.219970703125, 2.3359375, 2.451904296875, 2.56787109375, 2.683837890625, 2.7998046875, 2.915771484375, 3.03173828125, 3.147705078125, 3.263671875, 3.379638671875, 3.49560546875, 3.611572265625, 3.7275390625, 3.843505859375, 3.95947265625, 4.075439453125, 4.19140625]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 3.0, 7.0, 15.0, 15.0, 24.0, 45.0, 78.0, 102.0, 150.0, 253.0, 392.0, 636.0, 965.0, 1535.0, 2411.0, 3826.0, 6145.0, 9688.0, 15651.0, 24505.0, 38775.0, 58643.0, 86368.0, 116283.0, 139468.0, 143080.0, 123502.0, 93838.0, 64981.0, 42771.0, 27508.0, 17310.0, 10983.0, 6780.0, 4345.0, 2700.0, 1721.0, 1086.0, 732.0, 451.0, 277.0, 184.0, 120.0, 73.0, 59.0, 37.0, 15.0, 7.0, 9.0, 5.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-3.111328125, -3.01739501953125, -2.9234619140625, -2.82952880859375, -2.735595703125, -2.64166259765625, -2.5477294921875, -2.45379638671875, -2.35986328125, -2.26593017578125, -2.1719970703125, -2.07806396484375, -1.984130859375, -1.89019775390625, -1.7962646484375, -1.70233154296875, -1.6083984375, -1.51446533203125, -1.4205322265625, -1.32659912109375, -1.232666015625, -1.13873291015625, -1.0447998046875, -0.95086669921875, -0.85693359375, -0.76300048828125, -0.6690673828125, -0.57513427734375, -0.481201171875, -0.38726806640625, -0.2933349609375, -0.19940185546875, -0.10546875, -0.01153564453125, 0.0823974609375, 0.17633056640625, 0.270263671875, 0.36419677734375, 0.4581298828125, 0.55206298828125, 0.64599609375, 0.73992919921875, 0.8338623046875, 0.92779541015625, 1.021728515625, 1.11566162109375, 1.2095947265625, 1.30352783203125, 1.3974609375, 1.49139404296875, 1.5853271484375, 1.67926025390625, 1.773193359375, 1.86712646484375, 1.9610595703125, 2.05499267578125, 2.14892578125, 2.24285888671875, 2.3367919921875, 2.43072509765625, 2.524658203125, 2.61859130859375, 2.7125244140625, 2.80645751953125, 2.900390625]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 3.0, 3.0, 3.0, 4.0, 10.0, 12.0, 5.0, 12.0, 22.0, 26.0, 30.0, 38.0, 47.0, 50.0, 41.0, 69.0, 58.0, 72.0, 80.0, 70.0, 66.0, 58.0, 34.0, 45.0, 23.0, 28.0, 21.0, 8.0, 19.0, 16.0, 7.0, 5.0, 7.0, 7.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00037026405334472656, -0.00035690516233444214, -0.0003435462713241577, -0.0003301873803138733, -0.00031682848930358887, -0.00030346959829330444, -0.00029011070728302, -0.0002767518162727356, -0.00026339292526245117, -0.00025003403425216675, -0.00023667514324188232, -0.0002233162522315979, -0.00020995736122131348, -0.00019659847021102905, -0.00018323957920074463, -0.0001698806881904602, -0.00015652179718017578, -0.00014316290616989136, -0.00012980401515960693, -0.00011644512414932251, -0.00010308623313903809, -8.972734212875366e-05, -7.636845111846924e-05, -6.300956010818481e-05, -4.965066909790039e-05, -3.629177808761597e-05, -2.2932887077331543e-05, -9.573996067047119e-06, 3.7848949432373047e-06, 1.714378595352173e-05, 3.0502676963806152e-05, 4.3861567974090576e-05, 5.7220458984375e-05, 7.057934999465942e-05, 8.393824100494385e-05, 9.729713201522827e-05, 0.0001106560230255127, 0.00012401491403579712, 0.00013737380504608154, 0.00015073269605636597, 0.0001640915870666504, 0.00017745047807693481, 0.00019080936908721924, 0.00020416826009750366, 0.00021752715110778809, 0.0002308860421180725, 0.00024424493312835693, 0.00025760382413864136, 0.0002709627151489258, 0.0002843216061592102, 0.00029768049716949463, 0.00031103938817977905, 0.0003243982791900635, 0.0003377571702003479, 0.0003511160612106323, 0.00036447495222091675, 0.00037783384323120117, 0.0003911927342414856, 0.00040455162525177, 0.00041791051626205444, 0.00043126940727233887, 0.0004446282982826233, 0.0004579871892929077, 0.00047134608030319214, 0.00048470497131347656]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 5.0, 5.0, 9.0, 10.0, 13.0, 14.0, 25.0, 34.0, 57.0, 82.0, 113.0, 196.0, 307.0, 536.0, 867.0, 1503.0, 2627.0, 4919.0, 9492.0, 18472.0, 36544.0, 69872.0, 124469.0, 185334.0, 205696.0, 166246.0, 103754.0, 56913.0, 29007.0, 14674.0, 7504.0, 3892.0, 2168.0, 1249.0, 764.0, 420.0, 275.0, 169.0, 120.0, 60.0, 51.0, 35.0, 24.0, 11.0, 11.0, 7.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.11328125, -3.98199462890625, -3.8507080078125, -3.71942138671875, -3.588134765625, -3.45684814453125, -3.3255615234375, -3.19427490234375, -3.06298828125, -2.93170166015625, -2.8004150390625, -2.66912841796875, -2.537841796875, -2.40655517578125, -2.2752685546875, -2.14398193359375, -2.0126953125, -1.88140869140625, -1.7501220703125, -1.61883544921875, -1.487548828125, -1.35626220703125, -1.2249755859375, -1.09368896484375, -0.96240234375, -0.83111572265625, -0.6998291015625, -0.56854248046875, -0.437255859375, -0.30596923828125, -0.1746826171875, -0.04339599609375, 0.087890625, 0.21917724609375, 0.3504638671875, 0.48175048828125, 0.613037109375, 0.74432373046875, 0.8756103515625, 1.00689697265625, 1.13818359375, 1.26947021484375, 1.4007568359375, 1.53204345703125, 1.663330078125, 1.79461669921875, 1.9259033203125, 2.05718994140625, 2.1884765625, 2.31976318359375, 2.4510498046875, 2.58233642578125, 2.713623046875, 2.84490966796875, 2.9761962890625, 3.10748291015625, 3.23876953125, 3.37005615234375, 3.5013427734375, 3.63262939453125, 3.763916015625, 3.89520263671875, 4.0264892578125, 4.15777587890625, 4.2890625]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 3.0, 5.0, 5.0, 3.0, 3.0, 8.0, 11.0, 9.0, 20.0, 13.0, 18.0, 21.0, 28.0, 51.0, 42.0, 44.0, 42.0, 58.0, 57.0, 63.0, 54.0, 46.0, 63.0, 43.0, 56.0, 40.0, 29.0, 32.0, 29.0, 18.0, 16.0, 18.0, 9.0, 10.0, 10.0, 6.0, 10.0, 2.0, 4.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.029296875, -0.997283935546875, -0.96527099609375, -0.933258056640625, -0.9012451171875, -0.869232177734375, -0.83721923828125, -0.805206298828125, -0.773193359375, -0.741180419921875, -0.70916748046875, -0.677154541015625, -0.6451416015625, -0.613128662109375, -0.58111572265625, -0.549102783203125, -0.51708984375, -0.485076904296875, -0.45306396484375, -0.421051025390625, -0.3890380859375, -0.357025146484375, -0.32501220703125, -0.292999267578125, -0.260986328125, -0.228973388671875, -0.19696044921875, -0.164947509765625, -0.1329345703125, -0.100921630859375, -0.06890869140625, -0.036895751953125, -0.0048828125, 0.027130126953125, 0.05914306640625, 0.091156005859375, 0.1231689453125, 0.155181884765625, 0.18719482421875, 0.219207763671875, 0.251220703125, 0.283233642578125, 0.31524658203125, 0.347259521484375, 0.3792724609375, 0.411285400390625, 0.44329833984375, 0.475311279296875, 0.50732421875, 0.539337158203125, 0.57135009765625, 0.603363037109375, 0.6353759765625, 0.667388916015625, 0.69940185546875, 0.731414794921875, 0.763427734375, 0.795440673828125, 0.82745361328125, 0.859466552734375, 0.8914794921875, 0.923492431640625, 0.95550537109375, 0.987518310546875, 1.01953125]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 4.0, 3.0, 6.0, 8.0, 13.0, 13.0, 12.0, 23.0, 21.0, 27.0, 33.0, 41.0, 48.0, 53.0, 59.0, 60.0, 70.0, 53.0, 66.0, 52.0, 58.0, 44.0, 55.0, 32.0, 33.0, 26.0, 20.0, 22.0, 12.0, 12.0, 6.0, 6.0, 7.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.757859230041504, -10.388653755187988, -10.019449234008789, -9.650243759155273, -9.281038284301758, -8.911833763122559, -8.542628288269043, -8.173423767089844, -7.804218292236328, -7.435013294219971, -7.065808296203613, -6.696602821350098, -6.32739782333374, -5.958192825317383, -5.588987350463867, -5.21978235244751, -4.850577354431152, -4.481372356414795, -4.1121673583984375, -3.742961883544922, -3.3737568855285645, -3.004551887512207, -2.6353466510772705, -2.266141414642334, -1.8969364166259766, -1.5277312994003296, -1.1585261821746826, -0.7893210649490356, -0.42011594772338867, -0.0509108304977417, 0.3182942867279053, 0.6874995231628418, 1.0567035675048828, 1.4259086847305298, 1.7951138019561768, 2.1643190383911133, 2.5335240364074707, 2.902729034423828, 3.2719342708587646, 3.641139507293701, 4.010344505310059, 4.379549503326416, 4.748754501342773, 5.117959976196289, 5.4871649742126465, 5.856369972229004, 6.2255754470825195, 6.594780445098877, 6.963985443115234, 7.333190441131592, 7.702395439147949, 8.071600914001465, 8.440805435180664, 8.81001091003418, 9.179216384887695, 9.548421859741211, 9.91762638092041, 10.286831855773926, 10.656036376953125, 11.02524185180664, 11.394447326660156, 11.763651847839355, 12.132857322692871, 12.50206184387207, 12.871267318725586]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 7.0, 1.0, 8.0, 5.0, 5.0, 9.0, 17.0, 14.0, 16.0, 19.0, 26.0, 18.0, 20.0, 30.0, 30.0, 46.0, 36.0, 39.0, 31.0, 48.0, 40.0, 52.0, 41.0, 37.0, 52.0, 46.0, 39.0, 30.0, 34.0, 38.0, 23.0, 32.0, 15.0, 21.0, 21.0, 16.0, 15.0, 9.0, 10.0, 8.0, 5.0, 4.0, 4.0, 2.0, 2.0], "bins": [-8.137473106384277, -7.937674522399902, -7.737875938415527, -7.538077354431152, -7.338278770446777, -7.138480186462402, -6.938681602478027, -6.738883018493652, -6.539084434509277, -6.339285850524902, -6.139487266540527, -5.939688682556152, -5.739890098571777, -5.540091514587402, -5.340292930603027, -5.140494346618652, -4.9406962394714355, -4.7408976554870605, -4.5410990715026855, -4.3413004875183105, -4.1415019035339355, -3.9417033195495605, -3.7419049739837646, -3.5421063899993896, -3.3423078060150146, -3.1425092220306396, -2.9427106380462646, -2.7429122924804688, -2.5431137084960938, -2.3433151245117188, -2.1435165405273438, -1.9437179565429688, -1.7439188957214355, -1.5441203117370605, -1.3443217277526855, -1.1445232629776, -0.9447246789932251, -0.7449260950088501, -0.5451276302337646, -0.34532904624938965, -0.14553046226501465, 0.054268091917037964, 0.2540666460990906, 0.4538651704788208, 0.6536637544631958, 0.8534623384475708, 1.0532608032226562, 1.2530593872070312, 1.4528579711914062, 1.6526565551757812, 1.8524551391601562, 2.0522537231445312, 2.2520523071289062, 2.4518508911132812, 2.651649236679077, 2.851447820663452, 3.051246404647827, 3.251044988632202, 3.450843572616577, 3.650641918182373, 3.850440502166748, 4.050239086151123, 4.250037670135498, 4.449836254119873, 4.649634838104248]}, "gradients/decoder.bert.encoder.layer.9.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 11.0, 7.0, 15.0, 32.0, 28.0, 54.0, 100.0, 121.0, 209.0, 315.0, 467.0, 814.0, 1365.0, 2380.0, 4318.0, 7955.0, 15365.0, 30366.0, 62018.0, 133168.0, 291832.0, 616505.0, 1028158.0, 970733.0, 542875.0, 253949.0, 116699.0, 55161.0, 27206.0, 13891.0, 7432.0, 4339.0, 2429.0, 1475.0, 870.0, 540.0, 385.0, 213.0, 165.0, 98.0, 79.0, 57.0, 35.0, 16.0, 19.0, 5.0, 7.0, 4.0, 0.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.5625, -10.2208251953125, -9.879150390625, -9.5374755859375, -9.19580078125, -8.8541259765625, -8.512451171875, -8.1707763671875, -7.8291015625, -7.4874267578125, -7.145751953125, -6.8040771484375, -6.46240234375, -6.1207275390625, -5.779052734375, -5.4373779296875, -5.095703125, -4.7540283203125, -4.412353515625, -4.0706787109375, -3.72900390625, -3.3873291015625, -3.045654296875, -2.7039794921875, -2.3623046875, -2.0206298828125, -1.678955078125, -1.3372802734375, -0.99560546875, -0.6539306640625, -0.312255859375, 0.0294189453125, 0.37109375, 0.7127685546875, 1.054443359375, 1.3961181640625, 1.73779296875, 2.0794677734375, 2.421142578125, 2.7628173828125, 3.1044921875, 3.4461669921875, 3.787841796875, 4.1295166015625, 4.47119140625, 4.8128662109375, 5.154541015625, 5.4962158203125, 5.837890625, 6.1795654296875, 6.521240234375, 6.8629150390625, 7.20458984375, 7.5462646484375, 7.887939453125, 8.2296142578125, 8.5712890625, 8.9129638671875, 9.254638671875, 9.5963134765625, 9.93798828125, 10.2796630859375, 10.621337890625, 10.9630126953125, 11.3046875]}, "gradients/decoder.bert.encoder.layer.9.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 7.0, 4.0, 6.0, 5.0, 10.0, 16.0, 16.0, 8.0, 19.0, 15.0, 27.0, 24.0, 21.0, 36.0, 32.0, 27.0, 36.0, 33.0, 46.0, 36.0, 37.0, 51.0, 46.0, 35.0, 35.0, 46.0, 48.0, 29.0, 32.0, 22.0, 29.0, 21.0, 29.0, 19.0, 14.0, 14.0, 13.0, 16.0, 8.0, 9.0, 7.0, 5.0, 2.0, 5.0, 7.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.73828125, -4.597900390625, -4.45751953125, -4.317138671875, -4.1767578125, -4.036376953125, -3.89599609375, -3.755615234375, -3.615234375, -3.474853515625, -3.33447265625, -3.194091796875, -3.0537109375, -2.913330078125, -2.77294921875, -2.632568359375, -2.4921875, -2.351806640625, -2.21142578125, -2.071044921875, -1.9306640625, -1.790283203125, -1.64990234375, -1.509521484375, -1.369140625, -1.228759765625, -1.08837890625, -0.947998046875, -0.8076171875, -0.667236328125, -0.52685546875, -0.386474609375, -0.24609375, -0.105712890625, 0.03466796875, 0.175048828125, 0.3154296875, 0.455810546875, 0.59619140625, 0.736572265625, 0.876953125, 1.017333984375, 1.15771484375, 1.298095703125, 1.4384765625, 1.578857421875, 1.71923828125, 1.859619140625, 2.0, 2.140380859375, 2.28076171875, 2.421142578125, 2.5615234375, 2.701904296875, 2.84228515625, 2.982666015625, 3.123046875, 3.263427734375, 3.40380859375, 3.544189453125, 3.6845703125, 3.824951171875, 3.96533203125, 4.105712890625, 4.24609375]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 4.0, 7.0, 7.0, 7.0, 9.0, 13.0, 17.0, 37.0, 45.0, 69.0, 83.0, 122.0, 223.0, 332.0, 456.0, 748.0, 1179.0, 1933.0, 3189.0, 5319.0, 9330.0, 16870.0, 31252.0, 58474.0, 111418.0, 212145.0, 392667.0, 655658.0, 859110.0, 759627.0, 489672.0, 273815.0, 144706.0, 75199.0, 40020.0, 21564.0, 11827.0, 6810.0, 3996.0, 2365.0, 1440.0, 865.0, 588.0, 372.0, 232.0, 160.0, 96.0, 72.0, 41.0, 37.0, 24.0, 14.0, 12.0, 8.0, 2.0, 4.0, 0.0, 3.0, 2.0, 2.0], "bins": [-10.5859375, -10.26220703125, -9.9384765625, -9.61474609375, -9.291015625, -8.96728515625, -8.6435546875, -8.31982421875, -7.99609375, -7.67236328125, -7.3486328125, -7.02490234375, -6.701171875, -6.37744140625, -6.0537109375, -5.72998046875, -5.40625, -5.08251953125, -4.7587890625, -4.43505859375, -4.111328125, -3.78759765625, -3.4638671875, -3.14013671875, -2.81640625, -2.49267578125, -2.1689453125, -1.84521484375, -1.521484375, -1.19775390625, -0.8740234375, -0.55029296875, -0.2265625, 0.09716796875, 0.4208984375, 0.74462890625, 1.068359375, 1.39208984375, 1.7158203125, 2.03955078125, 2.36328125, 2.68701171875, 3.0107421875, 3.33447265625, 3.658203125, 3.98193359375, 4.3056640625, 4.62939453125, 4.953125, 5.27685546875, 5.6005859375, 5.92431640625, 6.248046875, 6.57177734375, 6.8955078125, 7.21923828125, 7.54296875, 7.86669921875, 8.1904296875, 8.51416015625, 8.837890625, 9.16162109375, 9.4853515625, 9.80908203125, 10.1328125]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 2.0, 2.0, 8.0, 3.0, 8.0, 13.0, 18.0, 21.0, 17.0, 28.0, 31.0, 41.0, 54.0, 69.0, 61.0, 101.0, 111.0, 115.0, 135.0, 118.0, 166.0, 192.0, 213.0, 228.0, 219.0, 216.0, 242.0, 224.0, 190.0, 184.0, 157.0, 139.0, 141.0, 92.0, 107.0, 86.0, 84.0, 53.0, 39.0, 32.0, 28.0, 20.0, 23.0, 10.0, 9.0, 6.0, 7.0, 6.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0], "bins": [-2.80078125, -2.719085693359375, -2.63739013671875, -2.555694580078125, -2.4739990234375, -2.392303466796875, -2.31060791015625, -2.228912353515625, -2.147216796875, -2.065521240234375, -1.98382568359375, -1.902130126953125, -1.8204345703125, -1.738739013671875, -1.65704345703125, -1.575347900390625, -1.49365234375, -1.411956787109375, -1.33026123046875, -1.248565673828125, -1.1668701171875, -1.085174560546875, -1.00347900390625, -0.921783447265625, -0.840087890625, -0.758392333984375, -0.67669677734375, -0.595001220703125, -0.5133056640625, -0.431610107421875, -0.34991455078125, -0.268218994140625, -0.1865234375, -0.104827880859375, -0.02313232421875, 0.058563232421875, 0.1402587890625, 0.221954345703125, 0.30364990234375, 0.385345458984375, 0.467041015625, 0.548736572265625, 0.63043212890625, 0.712127685546875, 0.7938232421875, 0.875518798828125, 0.95721435546875, 1.038909912109375, 1.12060546875, 1.202301025390625, 1.28399658203125, 1.365692138671875, 1.4473876953125, 1.529083251953125, 1.61077880859375, 1.692474365234375, 1.774169921875, 1.855865478515625, 1.93756103515625, 2.019256591796875, 2.1009521484375, 2.182647705078125, 2.26434326171875, 2.346038818359375, 2.427734375]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 9.0, 5.0, 9.0, 16.0, 12.0, 22.0, 25.0, 32.0, 35.0, 51.0, 48.0, 55.0, 58.0, 77.0, 69.0, 81.0, 85.0, 47.0, 53.0, 44.0, 38.0, 33.0, 23.0, 17.0, 11.0, 15.0, 11.0, 5.0, 5.0, 3.0, 2.0, 1.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.32799243927002, -11.923131942749023, -11.518272399902344, -11.113411903381348, -10.708551406860352, -10.303691864013672, -9.898831367492676, -9.49397087097168, -9.089111328125, -8.684250831604004, -8.279391288757324, -7.874530792236328, -7.469670295715332, -7.064810276031494, -6.659950256347656, -6.25508975982666, -5.850229263305664, -5.445369243621826, -5.04050874710083, -4.635648727416992, -4.230788230895996, -3.825928211212158, -3.4210681915283203, -3.0162079334259033, -2.6113476753234863, -2.2064874172210693, -1.801627278327942, -1.3967671394348145, -0.9919068813323975, -0.5870466232299805, -0.18218660354614258, 0.22267365455627441, 0.6275348663330078, 1.0323951244354248, 1.4372552633285522, 1.8421154022216797, 2.2469756603240967, 2.6518359184265137, 3.0566959381103516, 3.4615561962127686, 3.8664164543151855, 4.271276473999023, 4.6761369705200195, 5.080996990203857, 5.485857009887695, 5.890717506408691, 6.295577526092529, 6.700437545776367, 7.105298042297363, 7.510158061981201, 7.915018558502197, 8.319878578186035, 8.724739074707031, 9.129598617553711, 9.534459114074707, 9.939319610595703, 10.344179153442383, 10.749039649963379, 11.153899192810059, 11.558759689331055, 11.96362018585205, 12.368480682373047, 12.773340225219727, 13.178200721740723, 13.583061218261719]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 2.0, 2.0, 8.0, 11.0, 8.0, 13.0, 10.0, 20.0, 18.0, 18.0, 23.0, 32.0, 32.0, 33.0, 23.0, 37.0, 32.0, 39.0, 32.0, 37.0, 41.0, 41.0, 47.0, 40.0, 37.0, 42.0, 30.0, 41.0, 37.0, 27.0, 26.0, 23.0, 23.0, 17.0, 13.0, 14.0, 10.0, 15.0, 10.0, 10.0, 12.0, 5.0, 7.0, 3.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.965183734893799, -5.783688068389893, -5.602191925048828, -5.420696258544922, -5.239200592041016, -5.057704925537109, -4.876209259033203, -4.694713115692139, -4.513217449188232, -4.331721782684326, -4.150225639343262, -3.9687299728393555, -3.787234306335449, -3.605738639831543, -3.4242427349090576, -3.2427468299865723, -3.061251163482666, -2.8797554969787598, -2.6982595920562744, -2.516763687133789, -2.335268020629883, -2.1537723541259766, -1.9722764492034912, -1.7907806634902954, -1.6092848777770996, -1.4277890920639038, -1.246293306350708, -1.0647975206375122, -0.8833017349243164, -0.7018059492111206, -0.5203101634979248, -0.338814377784729, -0.157318115234375, 0.0241776704788208, 0.2056734561920166, 0.3871692419052124, 0.5686650276184082, 0.750160813331604, 0.9316565990447998, 1.1131523847579956, 1.2946481704711914, 1.4761439561843872, 1.657639741897583, 1.8391355276107788, 2.0206313133239746, 2.202126979827881, 2.383622884750366, 2.5651187896728516, 2.746614456176758, 2.928110122680664, 3.1096060276031494, 3.2911019325256348, 3.472597599029541, 3.6540932655334473, 3.8355891704559326, 4.017085075378418, 4.198580741882324, 4.3800764083862305, 4.561572074890137, 4.743068218231201, 4.924563884735107, 5.106059551239014, 5.287555694580078, 5.469051361083984, 5.650547027587891]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 6.0, 2.0, 2.0, 9.0, 21.0, 15.0, 20.0, 31.0, 50.0, 50.0, 97.0, 111.0, 166.0, 207.0, 311.0, 398.0, 600.0, 844.0, 1265.0, 2010.0, 3509.0, 7713.0, 20809.0, 68340.0, 216903.0, 381435.0, 229774.0, 73630.0, 22168.0, 7985.0, 3621.0, 2100.0, 1352.0, 878.0, 586.0, 420.0, 338.0, 238.0, 152.0, 92.0, 82.0, 65.0, 47.0, 23.0, 26.0, 21.0, 5.0, 10.0, 8.0, 7.0, 4.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.7578125, -8.470947265625, -8.18408203125, -7.897216796875, -7.6103515625, -7.323486328125, -7.03662109375, -6.749755859375, -6.462890625, -6.176025390625, -5.88916015625, -5.602294921875, -5.3154296875, -5.028564453125, -4.74169921875, -4.454833984375, -4.16796875, -3.881103515625, -3.59423828125, -3.307373046875, -3.0205078125, -2.733642578125, -2.44677734375, -2.159912109375, -1.873046875, -1.586181640625, -1.29931640625, -1.012451171875, -0.7255859375, -0.438720703125, -0.15185546875, 0.135009765625, 0.421875, 0.708740234375, 0.99560546875, 1.282470703125, 1.5693359375, 1.856201171875, 2.14306640625, 2.429931640625, 2.716796875, 3.003662109375, 3.29052734375, 3.577392578125, 3.8642578125, 4.151123046875, 4.43798828125, 4.724853515625, 5.01171875, 5.298583984375, 5.58544921875, 5.872314453125, 6.1591796875, 6.446044921875, 6.73291015625, 7.019775390625, 7.306640625, 7.593505859375, 7.88037109375, 8.167236328125, 8.4541015625, 8.740966796875, 9.02783203125, 9.314697265625, 9.6015625]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 2.0, 4.0, 7.0, 7.0, 8.0, 12.0, 9.0, 16.0, 23.0, 27.0, 25.0, 19.0, 35.0, 31.0, 39.0, 29.0, 41.0, 41.0, 50.0, 41.0, 45.0, 41.0, 36.0, 49.0, 31.0, 36.0, 26.0, 31.0, 22.0, 24.0, 22.0, 21.0, 31.0, 25.0, 20.0, 13.0, 18.0, 12.0, 5.0, 5.0, 7.0, 6.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.5546875, -6.337158203125, -6.11962890625, -5.902099609375, -5.6845703125, -5.467041015625, -5.24951171875, -5.031982421875, -4.814453125, -4.596923828125, -4.37939453125, -4.161865234375, -3.9443359375, -3.726806640625, -3.50927734375, -3.291748046875, -3.07421875, -2.856689453125, -2.63916015625, -2.421630859375, -2.2041015625, -1.986572265625, -1.76904296875, -1.551513671875, -1.333984375, -1.116455078125, -0.89892578125, -0.681396484375, -0.4638671875, -0.246337890625, -0.02880859375, 0.188720703125, 0.40625, 0.623779296875, 0.84130859375, 1.058837890625, 1.2763671875, 1.493896484375, 1.71142578125, 1.928955078125, 2.146484375, 2.364013671875, 2.58154296875, 2.799072265625, 3.0166015625, 3.234130859375, 3.45166015625, 3.669189453125, 3.88671875, 4.104248046875, 4.32177734375, 4.539306640625, 4.7568359375, 4.974365234375, 5.19189453125, 5.409423828125, 5.626953125, 5.844482421875, 6.06201171875, 6.279541015625, 6.4970703125, 6.714599609375, 6.93212890625, 7.149658203125, 7.3671875]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 8.0, 2.0, 8.0, 6.0, 8.0, 15.0, 23.0, 16.0, 26.0, 34.0, 60.0, 79.0, 121.0, 182.0, 250.0, 399.0, 601.0, 1032.0, 1786.0, 3919.0, 13066.0, 78548.0, 536945.0, 351894.0, 43712.0, 8773.0, 3084.0, 1516.0, 860.0, 501.0, 333.0, 230.0, 154.0, 94.0, 88.0, 41.0, 36.0, 30.0, 27.0, 14.0, 14.0, 7.0, 2.0, 2.0, 1.0, 5.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-20.40625, -19.82080078125, -19.2353515625, -18.64990234375, -18.064453125, -17.47900390625, -16.8935546875, -16.30810546875, -15.72265625, -15.13720703125, -14.5517578125, -13.96630859375, -13.380859375, -12.79541015625, -12.2099609375, -11.62451171875, -11.0390625, -10.45361328125, -9.8681640625, -9.28271484375, -8.697265625, -8.11181640625, -7.5263671875, -6.94091796875, -6.35546875, -5.77001953125, -5.1845703125, -4.59912109375, -4.013671875, -3.42822265625, -2.8427734375, -2.25732421875, -1.671875, -1.08642578125, -0.5009765625, 0.08447265625, 0.669921875, 1.25537109375, 1.8408203125, 2.42626953125, 3.01171875, 3.59716796875, 4.1826171875, 4.76806640625, 5.353515625, 5.93896484375, 6.5244140625, 7.10986328125, 7.6953125, 8.28076171875, 8.8662109375, 9.45166015625, 10.037109375, 10.62255859375, 11.2080078125, 11.79345703125, 12.37890625, 12.96435546875, 13.5498046875, 14.13525390625, 14.720703125, 15.30615234375, 15.8916015625, 16.47705078125, 17.0625]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 5.0, 9.0, 5.0, 12.0, 8.0, 10.0, 15.0, 19.0, 17.0, 18.0, 21.0, 25.0, 29.0, 31.0, 32.0, 24.0, 39.0, 33.0, 41.0, 39.0, 35.0, 38.0, 42.0, 35.0, 42.0, 30.0, 33.0, 24.0, 35.0, 40.0, 30.0, 20.0, 21.0, 18.0, 23.0, 20.0, 17.0, 12.0, 13.0, 10.0, 10.0, 9.0, 5.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.830078125, -3.714141845703125, -3.59820556640625, -3.482269287109375, -3.3663330078125, -3.250396728515625, -3.13446044921875, -3.018524169921875, -2.902587890625, -2.786651611328125, -2.67071533203125, -2.554779052734375, -2.4388427734375, -2.322906494140625, -2.20697021484375, -2.091033935546875, -1.97509765625, -1.859161376953125, -1.74322509765625, -1.627288818359375, -1.5113525390625, -1.395416259765625, -1.27947998046875, -1.163543701171875, -1.047607421875, -0.931671142578125, -0.81573486328125, -0.699798583984375, -0.5838623046875, -0.467926025390625, -0.35198974609375, -0.236053466796875, -0.1201171875, -0.004180908203125, 0.11175537109375, 0.227691650390625, 0.3436279296875, 0.459564208984375, 0.57550048828125, 0.691436767578125, 0.807373046875, 0.923309326171875, 1.03924560546875, 1.155181884765625, 1.2711181640625, 1.387054443359375, 1.50299072265625, 1.618927001953125, 1.73486328125, 1.850799560546875, 1.96673583984375, 2.082672119140625, 2.1986083984375, 2.314544677734375, 2.43048095703125, 2.546417236328125, 2.662353515625, 2.778289794921875, 2.89422607421875, 3.010162353515625, 3.1260986328125, 3.242034912109375, 3.35797119140625, 3.473907470703125, 3.58984375]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 1.0, 2.0, 6.0, 6.0, 15.0, 21.0, 28.0, 43.0, 61.0, 96.0, 96.0, 177.0, 205.0, 307.0, 512.0, 747.0, 1090.0, 1708.0, 2773.0, 5181.0, 10333.0, 23549.0, 60812.0, 166307.0, 352065.0, 256591.0, 97685.0, 36268.0, 14787.0, 7135.0, 3562.0, 2161.0, 1356.0, 843.0, 640.0, 429.0, 291.0, 204.0, 135.0, 96.0, 76.0, 48.0, 34.0, 24.0, 15.0, 11.0, 11.0, 10.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.17578125, -4.0482177734375, -3.920654296875, -3.7930908203125, -3.66552734375, -3.5379638671875, -3.410400390625, -3.2828369140625, -3.1552734375, -3.0277099609375, -2.900146484375, -2.7725830078125, -2.64501953125, -2.5174560546875, -2.389892578125, -2.2623291015625, -2.134765625, -2.0072021484375, -1.879638671875, -1.7520751953125, -1.62451171875, -1.4969482421875, -1.369384765625, -1.2418212890625, -1.1142578125, -0.9866943359375, -0.859130859375, -0.7315673828125, -0.60400390625, -0.4764404296875, -0.348876953125, -0.2213134765625, -0.09375, 0.0338134765625, 0.161376953125, 0.2889404296875, 0.41650390625, 0.5440673828125, 0.671630859375, 0.7991943359375, 0.9267578125, 1.0543212890625, 1.181884765625, 1.3094482421875, 1.43701171875, 1.5645751953125, 1.692138671875, 1.8197021484375, 1.947265625, 2.0748291015625, 2.202392578125, 2.3299560546875, 2.45751953125, 2.5850830078125, 2.712646484375, 2.8402099609375, 2.9677734375, 3.0953369140625, 3.222900390625, 3.3504638671875, 3.47802734375, 3.6055908203125, 3.733154296875, 3.8607177734375, 3.98828125]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 6.0, 15.0, 31.0, 66.0, 115.0, 165.0, 190.0, 169.0, 102.0, 61.0, 31.0, 19.0, 4.0, 6.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000377655029296875, -0.0003660470247268677, -0.00035443902015686035, -0.00034283101558685303, -0.0003312230110168457, -0.0003196150064468384, -0.00030800700187683105, -0.00029639899730682373, -0.0002847909927368164, -0.0002731829881668091, -0.00026157498359680176, -0.00024996697902679443, -0.0002383589744567871, -0.00022675096988677979, -0.00021514296531677246, -0.00020353496074676514, -0.0001919269561767578, -0.0001803189516067505, -0.00016871094703674316, -0.00015710294246673584, -0.00014549493789672852, -0.0001338869333267212, -0.00012227892875671387, -0.00011067092418670654, -9.906291961669922e-05, -8.74549150466919e-05, -7.584691047668457e-05, -6.423890590667725e-05, -5.263090133666992e-05, -4.10228967666626e-05, -2.9414892196655273e-05, -1.780688762664795e-05, -6.198883056640625e-06, 5.409121513366699e-06, 1.7017126083374023e-05, 2.8625130653381348e-05, 4.023313522338867e-05, 5.1841139793395996e-05, 6.344914436340332e-05, 7.505714893341064e-05, 8.666515350341797e-05, 9.827315807342529e-05, 0.00010988116264343262, 0.00012148916721343994, 0.00013309717178344727, 0.0001447051763534546, 0.00015631318092346191, 0.00016792118549346924, 0.00017952919006347656, 0.0001911371946334839, 0.0002027451992034912, 0.00021435320377349854, 0.00022596120834350586, 0.00023756921291351318, 0.0002491772174835205, 0.00026078522205352783, 0.00027239322662353516, 0.0002840012311935425, 0.0002956092357635498, 0.00030721724033355713, 0.00031882524490356445, 0.0003304332494735718, 0.0003420412540435791, 0.0003536492586135864, 0.00036525726318359375]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 8.0, 8.0, 12.0, 16.0, 17.0, 29.0, 56.0, 76.0, 174.0, 245.0, 470.0, 736.0, 1422.0, 2330.0, 4549.0, 11065.0, 41361.0, 189052.0, 460351.0, 252914.0, 57977.0, 14196.0, 5303.0, 2601.0, 1475.0, 863.0, 514.0, 296.0, 152.0, 109.0, 76.0, 41.0, 20.0, 19.0, 14.0, 6.0, 2.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.75, -4.56451416015625, -4.3790283203125, -4.19354248046875, -4.008056640625, -3.82257080078125, -3.6370849609375, -3.45159912109375, -3.26611328125, -3.08062744140625, -2.8951416015625, -2.70965576171875, -2.524169921875, -2.33868408203125, -2.1531982421875, -1.96771240234375, -1.7822265625, -1.59674072265625, -1.4112548828125, -1.22576904296875, -1.040283203125, -0.85479736328125, -0.6693115234375, -0.48382568359375, -0.29833984375, -0.11285400390625, 0.0726318359375, 0.25811767578125, 0.443603515625, 0.62908935546875, 0.8145751953125, 1.00006103515625, 1.185546875, 1.37103271484375, 1.5565185546875, 1.74200439453125, 1.927490234375, 2.11297607421875, 2.2984619140625, 2.48394775390625, 2.66943359375, 2.85491943359375, 3.0404052734375, 3.22589111328125, 3.411376953125, 3.59686279296875, 3.7823486328125, 3.96783447265625, 4.1533203125, 4.33880615234375, 4.5242919921875, 4.70977783203125, 4.895263671875, 5.08074951171875, 5.2662353515625, 5.45172119140625, 5.63720703125, 5.82269287109375, 6.0081787109375, 6.19366455078125, 6.379150390625, 6.56463623046875, 6.7501220703125, 6.93560791015625, 7.12109375]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 5.0, 4.0, 6.0, 4.0, 5.0, 9.0, 11.0, 16.0, 23.0, 31.0, 34.0, 45.0, 29.0, 46.0, 60.0, 60.0, 83.0, 76.0, 67.0, 76.0, 66.0, 55.0, 34.0, 35.0, 28.0, 19.0, 14.0, 10.0, 11.0, 9.0, 8.0, 8.0, 3.0, 5.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.7607421875, -0.7370223999023438, -0.7133026123046875, -0.6895828247070312, -0.665863037109375, -0.6421432495117188, -0.6184234619140625, -0.5947036743164062, -0.57098388671875, -0.5472640991210938, -0.5235443115234375, -0.49982452392578125, -0.476104736328125, -0.45238494873046875, -0.4286651611328125, -0.40494537353515625, -0.3812255859375, -0.35750579833984375, -0.3337860107421875, -0.31006622314453125, -0.286346435546875, -0.26262664794921875, -0.2389068603515625, -0.21518707275390625, -0.19146728515625, -0.16774749755859375, -0.1440277099609375, -0.12030792236328125, -0.096588134765625, -0.07286834716796875, -0.0491485595703125, -0.02542877197265625, -0.001708984375, 0.02201080322265625, 0.0457305908203125, 0.06945037841796875, 0.093170166015625, 0.11688995361328125, 0.1406097412109375, 0.16432952880859375, 0.18804931640625, 0.21176910400390625, 0.2354888916015625, 0.25920867919921875, 0.282928466796875, 0.30664825439453125, 0.3303680419921875, 0.35408782958984375, 0.3778076171875, 0.40152740478515625, 0.4252471923828125, 0.44896697998046875, 0.472686767578125, 0.49640655517578125, 0.5201263427734375, 0.5438461303710938, 0.56756591796875, 0.5912857055664062, 0.6150054931640625, 0.6387252807617188, 0.662445068359375, 0.6861648559570312, 0.7098846435546875, 0.7336044311523438, 0.75732421875]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 0.0, 1.0, 4.0, 5.0, 7.0, 9.0, 12.0, 14.0, 16.0, 32.0, 24.0, 33.0, 43.0, 63.0, 63.0, 66.0, 69.0, 98.0, 83.0, 68.0, 55.0, 57.0, 42.0, 33.0, 26.0, 20.0, 23.0, 8.0, 13.0, 8.0, 7.0, 0.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.16039752960205, -12.72585678100586, -12.291315078735352, -11.85677433013916, -11.422233581542969, -10.987691879272461, -10.55315113067627, -10.118610382080078, -9.68406867980957, -9.249527931213379, -8.814986228942871, -8.38044548034668, -7.945904731750488, -7.511363506317139, -7.076822280883789, -6.642281532287598, -6.207740783691406, -5.773199558258057, -5.338658809661865, -4.904117584228516, -4.469576835632324, -4.035035610198975, -3.600494384765625, -3.1659533977508545, -2.731412410736084, -2.2968714237213135, -1.8623303174972534, -1.4277892112731934, -0.9932482242584229, -0.5587072372436523, -0.12416601181030273, 0.3103749752044678, 0.7449169158935547, 1.1794579029083252, 1.6139990091323853, 2.0485401153564453, 2.483081102371216, 2.9176220893859863, 3.352163314819336, 3.7867043018341064, 4.221245288848877, 4.655786514282227, 5.090327262878418, 5.524868488311768, 5.959409713745117, 6.393950462341309, 6.828491687774658, 7.263032913208008, 7.697573661804199, 8.13211441040039, 8.566656112670898, 9.00119686126709, 9.435737609863281, 9.870279312133789, 10.30482006072998, 10.739360809326172, 11.17390251159668, 11.608443260192871, 12.042984962463379, 12.47752571105957, 12.912066459655762, 13.346607208251953, 13.781148910522461, 14.215689659118652, 14.650230407714844]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 2.0, 3.0, 8.0, 7.0, 7.0, 16.0, 7.0, 23.0, 18.0, 15.0, 22.0, 28.0, 35.0, 31.0, 27.0, 33.0, 38.0, 34.0, 28.0, 34.0, 42.0, 47.0, 34.0, 55.0, 34.0, 44.0, 32.0, 39.0, 46.0, 16.0, 29.0, 26.0, 21.0, 21.0, 14.0, 14.0, 10.0, 13.0, 11.0, 13.0, 7.0, 10.0, 8.0, 2.0, 1.0, 1.0, 0.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.930757999420166, -5.750031471252441, -5.569304466247559, -5.388577938079834, -5.207851409912109, -5.027124404907227, -4.846397876739502, -4.665671348571777, -4.4849443435668945, -4.30421781539917, -4.123490810394287, -3.9427642822265625, -3.762037754058838, -3.581310987472534, -3.4005842208862305, -3.219857692718506, -3.0391311645507812, -2.8584043979644775, -2.677677869796753, -2.496951103210449, -2.3162245750427246, -2.135497808456421, -1.9547710418701172, -1.774044394493103, -1.5933177471160889, -1.4125910997390747, -1.2318644523620605, -1.0511376857757568, -0.8704110383987427, -0.6896843910217285, -0.5089576244354248, -0.32823097705841064, -0.14750432968139648, 0.033222347497940063, 0.2139490246772766, 0.39467573165893555, 0.5754023790359497, 0.7561290264129639, 0.9368557929992676, 1.1175824403762817, 1.298309087753296, 1.47903573513031, 1.6597623825073242, 1.840489149093628, 2.0212159156799316, 2.2019424438476562, 2.38266921043396, 2.5633959770202637, 2.7441225051879883, 2.924849271774292, 3.1055757999420166, 3.2863025665283203, 3.467029094696045, 3.6477558612823486, 3.8284826278686523, 4.009209156036377, 4.189935684204102, 4.370662212371826, 4.551389217376709, 4.732115745544434, 4.912842273712158, 5.093568801879883, 5.274295806884766, 5.45502233505249, 5.635749340057373]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 7.0, 5.0, 9.0, 10.0, 12.0, 20.0, 56.0, 57.0, 101.0, 149.0, 228.0, 367.0, 593.0, 985.0, 1574.0, 2441.0, 4323.0, 7400.0, 12768.0, 21368.0, 35909.0, 57970.0, 88014.0, 121902.0, 147962.0, 151381.0, 129902.0, 97672.0, 64812.0, 40347.0, 24763.0, 14452.0, 8526.0, 4901.0, 2866.0, 1729.0, 1098.0, 700.0, 406.0, 279.0, 165.0, 129.0, 66.0, 52.0, 28.0, 22.0, 13.0, 9.0, 9.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-7.921875, -7.68975830078125, -7.4576416015625, -7.22552490234375, -6.993408203125, -6.76129150390625, -6.5291748046875, -6.29705810546875, -6.06494140625, -5.83282470703125, -5.6007080078125, -5.36859130859375, -5.136474609375, -4.90435791015625, -4.6722412109375, -4.44012451171875, -4.2080078125, -3.97589111328125, -3.7437744140625, -3.51165771484375, -3.279541015625, -3.04742431640625, -2.8153076171875, -2.58319091796875, -2.35107421875, -2.11895751953125, -1.8868408203125, -1.65472412109375, -1.422607421875, -1.19049072265625, -0.9583740234375, -0.72625732421875, -0.494140625, -0.26202392578125, -0.0299072265625, 0.20220947265625, 0.434326171875, 0.66644287109375, 0.8985595703125, 1.13067626953125, 1.36279296875, 1.59490966796875, 1.8270263671875, 2.05914306640625, 2.291259765625, 2.52337646484375, 2.7554931640625, 2.98760986328125, 3.2197265625, 3.45184326171875, 3.6839599609375, 3.91607666015625, 4.148193359375, 4.38031005859375, 4.6124267578125, 4.84454345703125, 5.07666015625, 5.30877685546875, 5.5408935546875, 5.77301025390625, 6.005126953125, 6.23724365234375, 6.4693603515625, 6.70147705078125, 6.93359375]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.bias": {"_type": "histogram", "values": [4.0, 2.0, 0.0, 2.0, 2.0, 4.0, 2.0, 3.0, 3.0, 6.0, 8.0, 5.0, 5.0, 14.0, 13.0, 24.0, 27.0, 26.0, 21.0, 21.0, 30.0, 25.0, 28.0, 30.0, 23.0, 28.0, 31.0, 38.0, 43.0, 38.0, 44.0, 30.0, 37.0, 36.0, 32.0, 32.0, 31.0, 24.0, 28.0, 32.0, 15.0, 22.0, 23.0, 11.0, 21.0, 15.0, 14.0, 17.0, 11.0, 11.0, 10.0, 6.0, 3.0, 5.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.57421875, -5.38995361328125, -5.2056884765625, -5.02142333984375, -4.837158203125, -4.65289306640625, -4.4686279296875, -4.28436279296875, -4.10009765625, -3.91583251953125, -3.7315673828125, -3.54730224609375, -3.363037109375, -3.17877197265625, -2.9945068359375, -2.81024169921875, -2.6259765625, -2.44171142578125, -2.2574462890625, -2.07318115234375, -1.888916015625, -1.70465087890625, -1.5203857421875, -1.33612060546875, -1.15185546875, -0.96759033203125, -0.7833251953125, -0.59906005859375, -0.414794921875, -0.23052978515625, -0.0462646484375, 0.13800048828125, 0.322265625, 0.50653076171875, 0.6907958984375, 0.87506103515625, 1.059326171875, 1.24359130859375, 1.4278564453125, 1.61212158203125, 1.79638671875, 1.98065185546875, 2.1649169921875, 2.34918212890625, 2.533447265625, 2.71771240234375, 2.9019775390625, 3.08624267578125, 3.2705078125, 3.45477294921875, 3.6390380859375, 3.82330322265625, 4.007568359375, 4.19183349609375, 4.3760986328125, 4.56036376953125, 4.74462890625, 4.92889404296875, 5.1131591796875, 5.29742431640625, 5.481689453125, 5.66595458984375, 5.8502197265625, 6.03448486328125, 6.21875]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 6.0, 9.0, 19.0, 21.0, 16.0, 32.0, 55.0, 85.0, 113.0, 225.0, 415.0, 812.0, 1710.0, 3750.0, 9205.0, 23390.0, 59928.0, 139341.0, 245963.0, 264387.0, 169594.0, 77601.0, 30790.0, 11981.0, 4818.0, 2016.0, 1038.0, 500.0, 272.0, 169.0, 91.0, 68.0, 31.0, 29.0, 22.0, 15.0, 7.0, 10.0, 7.0, 1.0, 6.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-14.9453125, -14.507568359375, -14.06982421875, -13.632080078125, -13.1943359375, -12.756591796875, -12.31884765625, -11.881103515625, -11.443359375, -11.005615234375, -10.56787109375, -10.130126953125, -9.6923828125, -9.254638671875, -8.81689453125, -8.379150390625, -7.94140625, -7.503662109375, -7.06591796875, -6.628173828125, -6.1904296875, -5.752685546875, -5.31494140625, -4.877197265625, -4.439453125, -4.001708984375, -3.56396484375, -3.126220703125, -2.6884765625, -2.250732421875, -1.81298828125, -1.375244140625, -0.9375, -0.499755859375, -0.06201171875, 0.375732421875, 0.8134765625, 1.251220703125, 1.68896484375, 2.126708984375, 2.564453125, 3.002197265625, 3.43994140625, 3.877685546875, 4.3154296875, 4.753173828125, 5.19091796875, 5.628662109375, 6.06640625, 6.504150390625, 6.94189453125, 7.379638671875, 7.8173828125, 8.255126953125, 8.69287109375, 9.130615234375, 9.568359375, 10.006103515625, 10.44384765625, 10.881591796875, 11.3193359375, 11.757080078125, 12.19482421875, 12.632568359375, 13.0703125]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 3.0, 1.0, 3.0, 6.0, 5.0, 5.0, 11.0, 6.0, 11.0, 13.0, 17.0, 20.0, 24.0, 31.0, 24.0, 27.0, 33.0, 23.0, 30.0, 43.0, 41.0, 34.0, 37.0, 56.0, 38.0, 41.0, 50.0, 35.0, 38.0, 36.0, 35.0, 28.0, 25.0, 26.0, 19.0, 20.0, 18.0, 16.0, 13.0, 17.0, 12.0, 10.0, 5.0, 7.0, 5.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.599609375, -3.479095458984375, -3.35858154296875, -3.238067626953125, -3.1175537109375, -2.997039794921875, -2.87652587890625, -2.756011962890625, -2.635498046875, -2.514984130859375, -2.39447021484375, -2.273956298828125, -2.1534423828125, -2.032928466796875, -1.91241455078125, -1.791900634765625, -1.67138671875, -1.550872802734375, -1.43035888671875, -1.309844970703125, -1.1893310546875, -1.068817138671875, -0.94830322265625, -0.827789306640625, -0.707275390625, -0.586761474609375, -0.46624755859375, -0.345733642578125, -0.2252197265625, -0.104705810546875, 0.01580810546875, 0.136322021484375, 0.2568359375, 0.377349853515625, 0.49786376953125, 0.618377685546875, 0.7388916015625, 0.859405517578125, 0.97991943359375, 1.100433349609375, 1.220947265625, 1.341461181640625, 1.46197509765625, 1.582489013671875, 1.7030029296875, 1.823516845703125, 1.94403076171875, 2.064544677734375, 2.18505859375, 2.305572509765625, 2.42608642578125, 2.546600341796875, 2.6671142578125, 2.787628173828125, 2.90814208984375, 3.028656005859375, 3.149169921875, 3.269683837890625, 3.39019775390625, 3.510711669921875, 3.6312255859375, 3.751739501953125, 3.87225341796875, 3.992767333984375, 4.11328125]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 2.0, 7.0, 1.0, 9.0, 8.0, 8.0, 15.0, 20.0, 32.0, 49.0, 56.0, 112.0, 146.0, 205.0, 298.0, 457.0, 723.0, 984.0, 1524.0, 2497.0, 4286.0, 8248.0, 18632.0, 50624.0, 149381.0, 319953.0, 292623.0, 122420.0, 41919.0, 15769.0, 7139.0, 3860.0, 2248.0, 1385.0, 917.0, 608.0, 396.0, 277.0, 217.0, 152.0, 97.0, 76.0, 50.0, 38.0, 24.0, 26.0, 12.0, 11.0, 8.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 4.0], "bins": [-9.515625, -9.2349853515625, -8.954345703125, -8.6737060546875, -8.39306640625, -8.1124267578125, -7.831787109375, -7.5511474609375, -7.2705078125, -6.9898681640625, -6.709228515625, -6.4285888671875, -6.14794921875, -5.8673095703125, -5.586669921875, -5.3060302734375, -5.025390625, -4.7447509765625, -4.464111328125, -4.1834716796875, -3.90283203125, -3.6221923828125, -3.341552734375, -3.0609130859375, -2.7802734375, -2.4996337890625, -2.218994140625, -1.9383544921875, -1.65771484375, -1.3770751953125, -1.096435546875, -0.8157958984375, -0.53515625, -0.2545166015625, 0.026123046875, 0.3067626953125, 0.58740234375, 0.8680419921875, 1.148681640625, 1.4293212890625, 1.7099609375, 1.9906005859375, 2.271240234375, 2.5518798828125, 2.83251953125, 3.1131591796875, 3.393798828125, 3.6744384765625, 3.955078125, 4.2357177734375, 4.516357421875, 4.7969970703125, 5.07763671875, 5.3582763671875, 5.638916015625, 5.9195556640625, 6.2001953125, 6.4808349609375, 6.761474609375, 7.0421142578125, 7.32275390625, 7.6033935546875, 7.884033203125, 8.1646728515625, 8.4453125]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 6.0, 10.0, 12.0, 22.0, 19.0, 63.0, 76.0, 106.0, 127.0, 118.0, 139.0, 103.0, 71.0, 42.0, 20.0, 27.0, 13.0, 14.0, 1.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009899139404296875, -0.0009573698043823242, -0.0009248256683349609, -0.0008922815322875977, -0.0008597373962402344, -0.0008271932601928711, -0.0007946491241455078, -0.0007621049880981445, -0.0007295608520507812, -0.000697016716003418, -0.0006644725799560547, -0.0006319284439086914, -0.0005993843078613281, -0.0005668401718139648, -0.0005342960357666016, -0.0005017518997192383, -0.000469207763671875, -0.0004366636276245117, -0.00040411949157714844, -0.00037157535552978516, -0.0003390312194824219, -0.0003064870834350586, -0.0002739429473876953, -0.00024139881134033203, -0.00020885467529296875, -0.00017631053924560547, -0.0001437664031982422, -0.0001112222671508789, -7.867813110351562e-05, -4.6133995056152344e-05, -1.3589859008789062e-05, 1.895427703857422e-05, 5.14984130859375e-05, 8.404254913330078e-05, 0.00011658668518066406, 0.00014913082122802734, 0.00018167495727539062, 0.0002142190933227539, 0.0002467632293701172, 0.00027930736541748047, 0.00031185150146484375, 0.00034439563751220703, 0.0003769397735595703, 0.0004094839096069336, 0.0004420280456542969, 0.00047457218170166016, 0.0005071163177490234, 0.0005396604537963867, 0.00057220458984375, 0.0006047487258911133, 0.0006372928619384766, 0.0006698369979858398, 0.0007023811340332031, 0.0007349252700805664, 0.0007674694061279297, 0.000800013542175293, 0.0008325576782226562, 0.0008651018142700195, 0.0008976459503173828, 0.0009301900863647461, 0.0009627342224121094, 0.0009952783584594727, 0.001027822494506836, 0.0010603666305541992, 0.0010929107666015625]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 7.0, 1.0, 7.0, 9.0, 19.0, 13.0, 23.0, 49.0, 52.0, 77.0, 105.0, 183.0, 273.0, 412.0, 679.0, 1027.0, 1842.0, 3345.0, 6842.0, 17649.0, 59788.0, 209653.0, 405240.0, 236306.0, 68923.0, 20049.0, 7438.0, 3590.0, 1891.0, 1123.0, 651.0, 454.0, 270.0, 168.0, 132.0, 83.0, 57.0, 37.0, 21.0, 21.0, 18.0, 8.0, 10.0, 4.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.234375, -9.9100341796875, -9.585693359375, -9.2613525390625, -8.93701171875, -8.6126708984375, -8.288330078125, -7.9639892578125, -7.6396484375, -7.3153076171875, -6.990966796875, -6.6666259765625, -6.34228515625, -6.0179443359375, -5.693603515625, -5.3692626953125, -5.044921875, -4.7205810546875, -4.396240234375, -4.0718994140625, -3.74755859375, -3.4232177734375, -3.098876953125, -2.7745361328125, -2.4501953125, -2.1258544921875, -1.801513671875, -1.4771728515625, -1.15283203125, -0.8284912109375, -0.504150390625, -0.1798095703125, 0.14453125, 0.4688720703125, 0.793212890625, 1.1175537109375, 1.44189453125, 1.7662353515625, 2.090576171875, 2.4149169921875, 2.7392578125, 3.0635986328125, 3.387939453125, 3.7122802734375, 4.03662109375, 4.3609619140625, 4.685302734375, 5.0096435546875, 5.333984375, 5.6583251953125, 5.982666015625, 6.3070068359375, 6.63134765625, 6.9556884765625, 7.280029296875, 7.6043701171875, 7.9287109375, 8.2530517578125, 8.577392578125, 8.9017333984375, 9.22607421875, 9.5504150390625, 9.874755859375, 10.1990966796875, 10.5234375]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 7.0, 6.0, 9.0, 14.0, 20.0, 30.0, 53.0, 55.0, 77.0, 118.0, 113.0, 102.0, 103.0, 92.0, 50.0, 52.0, 25.0, 26.0, 17.0, 7.0, 5.0, 3.0, 4.0, 1.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0], "bins": [-2.58203125, -2.5064697265625, -2.430908203125, -2.3553466796875, -2.27978515625, -2.2042236328125, -2.128662109375, -2.0531005859375, -1.9775390625, -1.9019775390625, -1.826416015625, -1.7508544921875, -1.67529296875, -1.5997314453125, -1.524169921875, -1.4486083984375, -1.373046875, -1.2974853515625, -1.221923828125, -1.1463623046875, -1.07080078125, -0.9952392578125, -0.919677734375, -0.8441162109375, -0.7685546875, -0.6929931640625, -0.617431640625, -0.5418701171875, -0.46630859375, -0.3907470703125, -0.315185546875, -0.2396240234375, -0.1640625, -0.0885009765625, -0.012939453125, 0.0626220703125, 0.13818359375, 0.2137451171875, 0.289306640625, 0.3648681640625, 0.4404296875, 0.5159912109375, 0.591552734375, 0.6671142578125, 0.74267578125, 0.8182373046875, 0.893798828125, 0.9693603515625, 1.044921875, 1.1204833984375, 1.196044921875, 1.2716064453125, 1.34716796875, 1.4227294921875, 1.498291015625, 1.5738525390625, 1.6494140625, 1.7249755859375, 1.800537109375, 1.8760986328125, 1.95166015625, 2.0272216796875, 2.102783203125, 2.1783447265625, 2.25390625]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 5.0, 4.0, 8.0, 6.0, 17.0, 18.0, 24.0, 29.0, 38.0, 51.0, 62.0, 61.0, 68.0, 79.0, 92.0, 84.0, 78.0, 62.0, 47.0, 50.0, 27.0, 19.0, 18.0, 17.0, 10.0, 10.0, 9.0, 5.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.419083595275879, -11.964229583740234, -11.509374618530273, -11.054520606994629, -10.599666595458984, -10.144811630249023, -9.689957618713379, -9.235103607177734, -8.780248641967773, -8.325394630432129, -7.870539665222168, -7.415685653686523, -6.960831165313721, -6.505976676940918, -6.051122665405273, -5.596268177032471, -5.141413688659668, -4.686559200286865, -4.2317047119140625, -3.776850700378418, -3.3219962120056152, -2.8671417236328125, -2.412287473678589, -1.9574332237243652, -1.5025787353515625, -1.0477243661880493, -0.5928699970245361, -0.13801562786102295, 0.31683874130249023, 0.771693229675293, 1.2265474796295166, 1.6814017295837402, 2.1362552642822266, 2.5911097526550293, 3.045964002609253, 3.5008182525634766, 3.9556727409362793, 4.410527229309082, 4.865381240844727, 5.320235729217529, 5.775090217590332, 6.229944705963135, 6.6847991943359375, 7.139653205871582, 7.594507694244385, 8.049362182617188, 8.504216194152832, 8.959070205688477, 9.413925170898438, 9.868779182434082, 10.323634147644043, 10.778488159179688, 11.233343124389648, 11.688197135925293, 12.143051147460938, 12.597906112670898, 13.052760124206543, 13.507614135742188, 13.962469100952148, 14.417323112487793, 14.872177124023438, 15.327032089233398, 15.781886100769043, 16.236740112304688, 16.69159507751465]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 8.0, 5.0, 10.0, 7.0, 7.0, 8.0, 13.0, 24.0, 12.0, 24.0, 26.0, 25.0, 29.0, 31.0, 26.0, 32.0, 25.0, 42.0, 39.0, 37.0, 48.0, 46.0, 38.0, 40.0, 39.0, 35.0, 40.0, 33.0, 31.0, 27.0, 27.0, 19.0, 34.0, 22.0, 18.0, 19.0, 10.0, 11.0, 8.0, 4.0, 8.0, 3.0, 4.0, 5.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.938849449157715, -5.748709201812744, -5.558568954467773, -5.3684282302856445, -5.178287982940674, -4.988147735595703, -4.798007488250732, -4.607867240905762, -4.417726516723633, -4.227586269378662, -4.037446022033691, -3.8473055362701416, -3.657165050506592, -3.467024803161621, -3.2768845558166504, -3.0867443084716797, -2.896604061126709, -2.7064638137817383, -2.5163233280181885, -2.3261830806732178, -2.136042594909668, -1.9459023475646973, -1.7557621002197266, -1.5656217336654663, -1.375481367111206, -1.1853410005569458, -0.9952006936073303, -0.8050603866577148, -0.6149200201034546, -0.42477965354919434, -0.23463940620422363, -0.04449903964996338, 0.14564132690429688, 0.33578166365623474, 0.5259220004081726, 0.7160623073577881, 0.9062026739120483, 1.0963430404663086, 1.2864832878112793, 1.4766236543655396, 1.6667640209197998, 1.85690438747406, 2.0470447540283203, 2.237185001373291, 2.4273252487182617, 2.6174657344818115, 2.8076059818267822, 2.997746467590332, 3.1878867149353027, 3.3780269622802734, 3.5681674480438232, 3.758307695388794, 3.9484481811523438, 4.1385884284973145, 4.328728675842285, 4.518868923187256, 4.709009170532227, 4.899149417877197, 5.089289665222168, 5.279430389404297, 5.469570636749268, 5.659710884094238, 5.849851131439209, 6.03999137878418, 6.230132102966309]}, "gradients/decoder.bert.encoder.layer.8.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 2.0, 5.0, 10.0, 3.0, 15.0, 18.0, 38.0, 48.0, 87.0, 176.0, 242.0, 453.0, 765.0, 1349.0, 2379.0, 4760.0, 9531.0, 20520.0, 46299.0, 112563.0, 284694.0, 712826.0, 1277581.0, 994255.0, 429399.0, 168422.0, 68967.0, 29964.0, 14056.0, 6963.0, 3530.0, 1899.0, 1075.0, 555.0, 329.0, 193.0, 121.0, 72.0, 40.0, 37.0, 18.0, 14.0, 6.0, 3.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.4453125, -14.00390625, -13.5625, -13.12109375, -12.6796875, -12.23828125, -11.796875, -11.35546875, -10.9140625, -10.47265625, -10.03125, -9.58984375, -9.1484375, -8.70703125, -8.265625, -7.82421875, -7.3828125, -6.94140625, -6.5, -6.05859375, -5.6171875, -5.17578125, -4.734375, -4.29296875, -3.8515625, -3.41015625, -2.96875, -2.52734375, -2.0859375, -1.64453125, -1.203125, -0.76171875, -0.3203125, 0.12109375, 0.5625, 1.00390625, 1.4453125, 1.88671875, 2.328125, 2.76953125, 3.2109375, 3.65234375, 4.09375, 4.53515625, 4.9765625, 5.41796875, 5.859375, 6.30078125, 6.7421875, 7.18359375, 7.625, 8.06640625, 8.5078125, 8.94921875, 9.390625, 9.83203125, 10.2734375, 10.71484375, 11.15625, 11.59765625, 12.0390625, 12.48046875, 12.921875, 13.36328125, 13.8046875]}, "gradients/decoder.bert.encoder.layer.8.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 2.0, 1.0, 5.0, 9.0, 5.0, 7.0, 13.0, 11.0, 14.0, 21.0, 16.0, 25.0, 38.0, 39.0, 35.0, 38.0, 40.0, 27.0, 34.0, 39.0, 44.0, 44.0, 44.0, 52.0, 50.0, 43.0, 33.0, 44.0, 28.0, 36.0, 24.0, 18.0, 20.0, 15.0, 15.0, 15.0, 14.0, 17.0, 13.0, 3.0, 4.0, 7.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.83984375, -4.6767578125, -4.513671875, -4.3505859375, -4.1875, -4.0244140625, -3.861328125, -3.6982421875, -3.53515625, -3.3720703125, -3.208984375, -3.0458984375, -2.8828125, -2.7197265625, -2.556640625, -2.3935546875, -2.23046875, -2.0673828125, -1.904296875, -1.7412109375, -1.578125, -1.4150390625, -1.251953125, -1.0888671875, -0.92578125, -0.7626953125, -0.599609375, -0.4365234375, -0.2734375, -0.1103515625, 0.052734375, 0.2158203125, 0.37890625, 0.5419921875, 0.705078125, 0.8681640625, 1.03125, 1.1943359375, 1.357421875, 1.5205078125, 1.68359375, 1.8466796875, 2.009765625, 2.1728515625, 2.3359375, 2.4990234375, 2.662109375, 2.8251953125, 2.98828125, 3.1513671875, 3.314453125, 3.4775390625, 3.640625, 3.8037109375, 3.966796875, 4.1298828125, 4.29296875, 4.4560546875, 4.619140625, 4.7822265625, 4.9453125, 5.1083984375, 5.271484375, 5.4345703125, 5.59765625]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 3.0, 6.0, 7.0, 9.0, 11.0, 19.0, 31.0, 49.0, 73.0, 131.0, 204.0, 325.0, 471.0, 933.0, 1488.0, 2769.0, 5363.0, 10720.0, 22080.0, 47677.0, 106739.0, 242236.0, 523736.0, 941145.0, 1045972.0, 661964.0, 318847.0, 141813.0, 63072.0, 28399.0, 13463.0, 6548.0, 3510.0, 1904.0, 979.0, 601.0, 390.0, 210.0, 151.0, 93.0, 53.0, 29.0, 26.0, 10.0, 9.0, 9.0, 4.0, 5.0, 6.0, 1.0, 1.0, 0.0, 1.0], "bins": [-14.9921875, -14.56591796875, -14.1396484375, -13.71337890625, -13.287109375, -12.86083984375, -12.4345703125, -12.00830078125, -11.58203125, -11.15576171875, -10.7294921875, -10.30322265625, -9.876953125, -9.45068359375, -9.0244140625, -8.59814453125, -8.171875, -7.74560546875, -7.3193359375, -6.89306640625, -6.466796875, -6.04052734375, -5.6142578125, -5.18798828125, -4.76171875, -4.33544921875, -3.9091796875, -3.48291015625, -3.056640625, -2.63037109375, -2.2041015625, -1.77783203125, -1.3515625, -0.92529296875, -0.4990234375, -0.07275390625, 0.353515625, 0.77978515625, 1.2060546875, 1.63232421875, 2.05859375, 2.48486328125, 2.9111328125, 3.33740234375, 3.763671875, 4.18994140625, 4.6162109375, 5.04248046875, 5.46875, 5.89501953125, 6.3212890625, 6.74755859375, 7.173828125, 7.60009765625, 8.0263671875, 8.45263671875, 8.87890625, 9.30517578125, 9.7314453125, 10.15771484375, 10.583984375, 11.01025390625, 11.4365234375, 11.86279296875, 12.2890625]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 7.0, 6.0, 8.0, 11.0, 13.0, 22.0, 18.0, 19.0, 33.0, 30.0, 38.0, 44.0, 73.0, 77.0, 108.0, 105.0, 132.0, 136.0, 163.0, 212.0, 216.0, 235.0, 258.0, 258.0, 231.0, 218.0, 237.0, 204.0, 169.0, 154.0, 132.0, 108.0, 93.0, 67.0, 59.0, 51.0, 34.0, 23.0, 19.0, 20.0, 5.0, 8.0, 6.0, 3.0, 6.0, 6.0, 3.0, 2.0, 1.0, 3.0], "bins": [-3.490234375, -3.396209716796875, -3.30218505859375, -3.208160400390625, -3.1141357421875, -3.020111083984375, -2.92608642578125, -2.832061767578125, -2.738037109375, -2.644012451171875, -2.54998779296875, -2.455963134765625, -2.3619384765625, -2.267913818359375, -2.17388916015625, -2.079864501953125, -1.98583984375, -1.891815185546875, -1.79779052734375, -1.703765869140625, -1.6097412109375, -1.515716552734375, -1.42169189453125, -1.327667236328125, -1.233642578125, -1.139617919921875, -1.04559326171875, -0.951568603515625, -0.8575439453125, -0.763519287109375, -0.66949462890625, -0.575469970703125, -0.4814453125, -0.387420654296875, -0.29339599609375, -0.199371337890625, -0.1053466796875, -0.011322021484375, 0.08270263671875, 0.176727294921875, 0.270751953125, 0.364776611328125, 0.45880126953125, 0.552825927734375, 0.6468505859375, 0.740875244140625, 0.83489990234375, 0.928924560546875, 1.02294921875, 1.116973876953125, 1.21099853515625, 1.305023193359375, 1.3990478515625, 1.493072509765625, 1.58709716796875, 1.681121826171875, 1.775146484375, 1.869171142578125, 1.96319580078125, 2.057220458984375, 2.1512451171875, 2.245269775390625, 2.33929443359375, 2.433319091796875, 2.52734375]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 9.0, 14.0, 9.0, 29.0, 33.0, 27.0, 50.0, 58.0, 60.0, 69.0, 82.0, 78.0, 80.0, 68.0, 72.0, 62.0, 58.0, 36.0, 23.0, 19.0, 18.0, 15.0, 8.0, 10.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.267213821411133, -16.784475326538086, -16.301738739013672, -15.819000244140625, -15.336261749267578, -14.853523254394531, -14.3707857131958, -13.88804817199707, -13.405309677124023, -12.922571182250977, -12.439833641052246, -11.957096099853516, -11.474357604980469, -10.991619110107422, -10.508881568908691, -10.026144027709961, -9.543405532836914, -9.060667037963867, -8.577929496765137, -8.095191955566406, -7.612453460693359, -7.129715442657471, -6.646977424621582, -6.164239406585693, -5.681501388549805, -5.198763370513916, -4.716025352478027, -4.233287334442139, -3.75054931640625, -3.2678112983703613, -2.7850732803344727, -2.302335262298584, -1.8195981979370117, -1.336860179901123, -0.8541221618652344, -0.3713841438293457, 0.11135387420654297, 0.5940918922424316, 1.0768299102783203, 1.559567928314209, 2.0423059463500977, 2.5250439643859863, 3.007781982421875, 3.4905200004577637, 3.9732580184936523, 4.455996036529541, 4.93873405456543, 5.421472072601318, 5.904210090637207, 6.386948108673096, 6.869686126708984, 7.352424144744873, 7.835162162780762, 8.317899703979492, 8.800638198852539, 9.283376693725586, 9.766114234924316, 10.248851776123047, 10.731590270996094, 11.21432876586914, 11.697066307067871, 12.179803848266602, 12.662542343139648, 13.145280838012695, 13.628018379211426]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 9.0, 2.0, 4.0, 10.0, 10.0, 8.0, 7.0, 10.0, 11.0, 14.0, 12.0, 18.0, 26.0, 19.0, 18.0, 19.0, 40.0, 35.0, 32.0, 25.0, 30.0, 35.0, 36.0, 44.0, 42.0, 42.0, 41.0, 34.0, 46.0, 28.0, 27.0, 26.0, 35.0, 27.0, 22.0, 29.0, 22.0, 12.0, 10.0, 9.0, 15.0, 18.0, 9.0, 8.0, 9.0, 9.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.441751956939697, -5.2632670402526855, -5.084782123565674, -4.90629768371582, -4.727812767028809, -4.549327850341797, -4.370842933654785, -4.192358016967773, -4.013873100280762, -3.83538818359375, -3.6569035053253174, -3.4784185886383057, -3.299933910369873, -3.1214489936828613, -2.9429640769958496, -2.764479160308838, -2.5859947204589844, -2.4075098037719727, -2.22902512550354, -2.0505402088165283, -1.8720554113388062, -1.693570613861084, -1.5150856971740723, -1.33660089969635, -1.158116102218628, -0.9796313047409058, -0.8011464476585388, -0.6226615905761719, -0.4441767930984497, -0.26569199562072754, -0.08720707893371582, 0.09127771854400635, 0.2697625160217285, 0.44824734330177307, 0.6267321705818176, 0.8052170276641846, 0.9837018251419067, 1.162186622619629, 1.3406715393066406, 1.5191563367843628, 1.697641134262085, 1.8761259317398071, 2.0546107292175293, 2.233095645904541, 2.4115805625915527, 2.5900652408599854, 2.768550157546997, 2.9470348358154297, 3.1255197525024414, 3.304004669189453, 3.4824893474578857, 3.6609742641448975, 3.83945894241333, 4.017943859100342, 4.1964287757873535, 4.374913692474365, 4.553398132324219, 4.7318830490112305, 4.910367965698242, 5.088852882385254, 5.267337322235107, 5.445822238922119, 5.624307155609131, 5.802792072296143, 5.981276988983154]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 2.0, 4.0, 11.0, 7.0, 10.0, 25.0, 31.0, 35.0, 57.0, 86.0, 142.0, 222.0, 332.0, 559.0, 888.0, 1515.0, 2650.0, 4942.0, 9452.0, 19133.0, 38928.0, 79865.0, 151004.0, 224742.0, 219829.0, 143322.0, 75631.0, 36950.0, 18050.0, 9110.0, 4677.0, 2578.0, 1439.0, 862.0, 503.0, 318.0, 211.0, 153.0, 89.0, 60.0, 47.0, 31.0, 22.0, 16.0, 9.0, 5.0, 3.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.91015625, -5.7308349609375, -5.551513671875, -5.3721923828125, -5.19287109375, -5.0135498046875, -4.834228515625, -4.6549072265625, -4.4755859375, -4.2962646484375, -4.116943359375, -3.9376220703125, -3.75830078125, -3.5789794921875, -3.399658203125, -3.2203369140625, -3.041015625, -2.8616943359375, -2.682373046875, -2.5030517578125, -2.32373046875, -2.1444091796875, -1.965087890625, -1.7857666015625, -1.6064453125, -1.4271240234375, -1.247802734375, -1.0684814453125, -0.88916015625, -0.7098388671875, -0.530517578125, -0.3511962890625, -0.171875, 0.0074462890625, 0.186767578125, 0.3660888671875, 0.54541015625, 0.7247314453125, 0.904052734375, 1.0833740234375, 1.2626953125, 1.4420166015625, 1.621337890625, 1.8006591796875, 1.97998046875, 2.1593017578125, 2.338623046875, 2.5179443359375, 2.697265625, 2.8765869140625, 3.055908203125, 3.2352294921875, 3.41455078125, 3.5938720703125, 3.773193359375, 3.9525146484375, 4.1318359375, 4.3111572265625, 4.490478515625, 4.6697998046875, 4.84912109375, 5.0284423828125, 5.207763671875, 5.3870849609375, 5.56640625]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 4.0, 10.0, 7.0, 10.0, 16.0, 7.0, 14.0, 15.0, 19.0, 29.0, 28.0, 28.0, 28.0, 41.0, 37.0, 40.0, 42.0, 54.0, 48.0, 54.0, 52.0, 55.0, 33.0, 37.0, 44.0, 37.0, 33.0, 26.0, 28.0, 27.0, 18.0, 21.0, 14.0, 10.0, 10.0, 9.0, 6.0, 3.0, 3.0, 6.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.1640625, -8.8956298828125, -8.627197265625, -8.3587646484375, -8.09033203125, -7.8218994140625, -7.553466796875, -7.2850341796875, -7.0166015625, -6.7481689453125, -6.479736328125, -6.2113037109375, -5.94287109375, -5.6744384765625, -5.406005859375, -5.1375732421875, -4.869140625, -4.6007080078125, -4.332275390625, -4.0638427734375, -3.79541015625, -3.5269775390625, -3.258544921875, -2.9901123046875, -2.7216796875, -2.4532470703125, -2.184814453125, -1.9163818359375, -1.64794921875, -1.3795166015625, -1.111083984375, -0.8426513671875, -0.57421875, -0.3057861328125, -0.037353515625, 0.2310791015625, 0.49951171875, 0.7679443359375, 1.036376953125, 1.3048095703125, 1.5732421875, 1.8416748046875, 2.110107421875, 2.3785400390625, 2.64697265625, 2.9154052734375, 3.183837890625, 3.4522705078125, 3.720703125, 3.9891357421875, 4.257568359375, 4.5260009765625, 4.79443359375, 5.0628662109375, 5.331298828125, 5.5997314453125, 5.8681640625, 6.1365966796875, 6.405029296875, 6.6734619140625, 6.94189453125, 7.2103271484375, 7.478759765625, 7.7471923828125, 8.015625]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 8.0, 13.0, 16.0, 18.0, 18.0, 23.0, 42.0, 66.0, 91.0, 144.0, 246.0, 451.0, 830.0, 1659.0, 3790.0, 8812.0, 23211.0, 70388.0, 216958.0, 399322.0, 213742.0, 69283.0, 23432.0, 8753.0, 3554.0, 1651.0, 861.0, 474.0, 262.0, 142.0, 93.0, 69.0, 45.0, 33.0, 15.0, 17.0, 6.0, 1.0, 6.0, 2.0, 3.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.0703125, -9.7288818359375, -9.387451171875, -9.0460205078125, -8.70458984375, -8.3631591796875, -8.021728515625, -7.6802978515625, -7.3388671875, -6.9974365234375, -6.656005859375, -6.3145751953125, -5.97314453125, -5.6317138671875, -5.290283203125, -4.9488525390625, -4.607421875, -4.2659912109375, -3.924560546875, -3.5831298828125, -3.24169921875, -2.9002685546875, -2.558837890625, -2.2174072265625, -1.8759765625, -1.5345458984375, -1.193115234375, -0.8516845703125, -0.51025390625, -0.1688232421875, 0.172607421875, 0.5140380859375, 0.85546875, 1.1968994140625, 1.538330078125, 1.8797607421875, 2.22119140625, 2.5626220703125, 2.904052734375, 3.2454833984375, 3.5869140625, 3.9283447265625, 4.269775390625, 4.6112060546875, 4.95263671875, 5.2940673828125, 5.635498046875, 5.9769287109375, 6.318359375, 6.6597900390625, 7.001220703125, 7.3426513671875, 7.68408203125, 8.0255126953125, 8.366943359375, 8.7083740234375, 9.0498046875, 9.3912353515625, 9.732666015625, 10.0740966796875, 10.41552734375, 10.7569580078125, 11.098388671875, 11.4398193359375, 11.78125]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 2.0, 4.0, 3.0, 8.0, 11.0, 13.0, 12.0, 7.0, 11.0, 22.0, 19.0, 19.0, 20.0, 21.0, 26.0, 26.0, 29.0, 30.0, 39.0, 24.0, 35.0, 43.0, 45.0, 52.0, 32.0, 32.0, 41.0, 25.0, 44.0, 33.0, 37.0, 42.0, 20.0, 23.0, 21.0, 18.0, 17.0, 18.0, 15.0, 13.0, 11.0, 3.0, 12.0, 7.0, 9.0, 4.0, 2.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-4.15234375, -4.02191162109375, -3.8914794921875, -3.76104736328125, -3.630615234375, -3.50018310546875, -3.3697509765625, -3.23931884765625, -3.10888671875, -2.97845458984375, -2.8480224609375, -2.71759033203125, -2.587158203125, -2.45672607421875, -2.3262939453125, -2.19586181640625, -2.0654296875, -1.93499755859375, -1.8045654296875, -1.67413330078125, -1.543701171875, -1.41326904296875, -1.2828369140625, -1.15240478515625, -1.02197265625, -0.89154052734375, -0.7611083984375, -0.63067626953125, -0.500244140625, -0.36981201171875, -0.2393798828125, -0.10894775390625, 0.021484375, 0.15191650390625, 0.2823486328125, 0.41278076171875, 0.543212890625, 0.67364501953125, 0.8040771484375, 0.93450927734375, 1.06494140625, 1.19537353515625, 1.3258056640625, 1.45623779296875, 1.586669921875, 1.71710205078125, 1.8475341796875, 1.97796630859375, 2.1083984375, 2.23883056640625, 2.3692626953125, 2.49969482421875, 2.630126953125, 2.76055908203125, 2.8909912109375, 3.02142333984375, 3.15185546875, 3.28228759765625, 3.4127197265625, 3.54315185546875, 3.673583984375, 3.80401611328125, 3.9344482421875, 4.06488037109375, 4.1953125]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 4.0, 2.0, 3.0, 10.0, 12.0, 16.0, 28.0, 31.0, 47.0, 71.0, 95.0, 166.0, 220.0, 371.0, 576.0, 796.0, 1259.0, 1959.0, 3216.0, 5347.0, 9168.0, 16309.0, 29832.0, 56410.0, 105849.0, 184617.0, 237757.0, 176857.0, 99577.0, 52818.0, 27902.0, 15057.0, 8767.0, 4998.0, 3064.0, 1885.0, 1129.0, 749.0, 518.0, 321.0, 214.0, 170.0, 120.0, 74.0, 44.0, 50.0, 20.0, 21.0, 12.0, 14.0, 3.0, 2.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.611328125, -2.52557373046875, -2.4398193359375, -2.35406494140625, -2.268310546875, -2.18255615234375, -2.0968017578125, -2.01104736328125, -1.92529296875, -1.83953857421875, -1.7537841796875, -1.66802978515625, -1.582275390625, -1.49652099609375, -1.4107666015625, -1.32501220703125, -1.2392578125, -1.15350341796875, -1.0677490234375, -0.98199462890625, -0.896240234375, -0.81048583984375, -0.7247314453125, -0.63897705078125, -0.55322265625, -0.46746826171875, -0.3817138671875, -0.29595947265625, -0.210205078125, -0.12445068359375, -0.0386962890625, 0.04705810546875, 0.1328125, 0.21856689453125, 0.3043212890625, 0.39007568359375, 0.475830078125, 0.56158447265625, 0.6473388671875, 0.73309326171875, 0.81884765625, 0.90460205078125, 0.9903564453125, 1.07611083984375, 1.161865234375, 1.24761962890625, 1.3333740234375, 1.41912841796875, 1.5048828125, 1.59063720703125, 1.6763916015625, 1.76214599609375, 1.847900390625, 1.93365478515625, 2.0194091796875, 2.10516357421875, 2.19091796875, 2.27667236328125, 2.3624267578125, 2.44818115234375, 2.533935546875, 2.61968994140625, 2.7054443359375, 2.79119873046875, 2.876953125]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 4.0, 0.0, 3.0, 3.0, 3.0, 6.0, 11.0, 5.0, 7.0, 9.0, 15.0, 18.0, 17.0, 27.0, 28.0, 28.0, 44.0, 39.0, 53.0, 66.0, 59.0, 65.0, 60.0, 64.0, 67.0, 60.0, 42.0, 40.0, 34.0, 22.0, 16.0, 18.0, 15.0, 15.0, 12.0, 11.0, 2.0, 3.0, 3.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00014448165893554688, -0.00014055147767066956, -0.00013662129640579224, -0.00013269111514091492, -0.0001287609338760376, -0.00012483075261116028, -0.00012090057134628296, -0.00011697039008140564, -0.00011304020881652832, -0.000109110027551651, -0.00010517984628677368, -0.00010124966502189636, -9.731948375701904e-05, -9.338930249214172e-05, -8.94591212272644e-05, -8.552893996238708e-05, -8.159875869750977e-05, -7.766857743263245e-05, -7.373839616775513e-05, -6.980821490287781e-05, -6.587803363800049e-05, -6.194785237312317e-05, -5.801767110824585e-05, -5.408748984336853e-05, -5.015730857849121e-05, -4.622712731361389e-05, -4.229694604873657e-05, -3.836676478385925e-05, -3.4436583518981934e-05, -3.0506402254104614e-05, -2.6576220989227295e-05, -2.2646039724349976e-05, -1.8715858459472656e-05, -1.4785677194595337e-05, -1.0855495929718018e-05, -6.925314664840698e-06, -2.995133399963379e-06, 9.350478649139404e-07, 4.86522912979126e-06, 8.795410394668579e-06, 1.2725591659545898e-05, 1.6655772924423218e-05, 2.0585954189300537e-05, 2.4516135454177856e-05, 2.8446316719055176e-05, 3.2376497983932495e-05, 3.6306679248809814e-05, 4.0236860513687134e-05, 4.416704177856445e-05, 4.809722304344177e-05, 5.202740430831909e-05, 5.595758557319641e-05, 5.988776683807373e-05, 6.381794810295105e-05, 6.774812936782837e-05, 7.167831063270569e-05, 7.560849189758301e-05, 7.953867316246033e-05, 8.346885442733765e-05, 8.739903569221497e-05, 9.132921695709229e-05, 9.52593982219696e-05, 9.918957948684692e-05, 0.00010311976075172424, 0.00010704994201660156]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 8.0, 8.0, 13.0, 18.0, 27.0, 42.0, 65.0, 106.0, 154.0, 249.0, 424.0, 666.0, 1090.0, 1862.0, 3124.0, 5668.0, 9994.0, 18007.0, 32222.0, 59002.0, 103952.0, 160066.0, 195674.0, 176242.0, 120362.0, 70589.0, 39291.0, 21727.0, 11955.0, 6656.0, 3779.0, 2140.0, 1397.0, 756.0, 441.0, 300.0, 179.0, 116.0, 61.0, 45.0, 30.0, 21.0, 13.0, 8.0, 6.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.482421875, -2.406402587890625, -2.33038330078125, -2.254364013671875, -2.1783447265625, -2.102325439453125, -2.02630615234375, -1.950286865234375, -1.874267578125, -1.798248291015625, -1.72222900390625, -1.646209716796875, -1.5701904296875, -1.494171142578125, -1.41815185546875, -1.342132568359375, -1.26611328125, -1.190093994140625, -1.11407470703125, -1.038055419921875, -0.9620361328125, -0.886016845703125, -0.80999755859375, -0.733978271484375, -0.657958984375, -0.581939697265625, -0.50592041015625, -0.429901123046875, -0.3538818359375, -0.277862548828125, -0.20184326171875, -0.125823974609375, -0.0498046875, 0.026214599609375, 0.10223388671875, 0.178253173828125, 0.2542724609375, 0.330291748046875, 0.40631103515625, 0.482330322265625, 0.558349609375, 0.634368896484375, 0.71038818359375, 0.786407470703125, 0.8624267578125, 0.938446044921875, 1.01446533203125, 1.090484619140625, 1.16650390625, 1.242523193359375, 1.31854248046875, 1.394561767578125, 1.4705810546875, 1.546600341796875, 1.62261962890625, 1.698638916015625, 1.774658203125, 1.850677490234375, 1.92669677734375, 2.002716064453125, 2.0787353515625, 2.154754638671875, 2.23077392578125, 2.306793212890625, 2.3828125]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 4.0, 7.0, 5.0, 8.0, 10.0, 11.0, 25.0, 22.0, 33.0, 34.0, 41.0, 46.0, 48.0, 45.0, 53.0, 52.0, 61.0, 56.0, 50.0, 52.0, 47.0, 44.0, 39.0, 39.0, 24.0, 25.0, 20.0, 17.0, 20.0, 19.0, 13.0, 9.0, 6.0, 3.0, 4.0, 5.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.71875, -0.6975326538085938, -0.6763153076171875, -0.6550979614257812, -0.633880615234375, -0.6126632690429688, -0.5914459228515625, -0.5702285766601562, -0.54901123046875, -0.5277938842773438, -0.5065765380859375, -0.48535919189453125, -0.464141845703125, -0.44292449951171875, -0.4217071533203125, -0.40048980712890625, -0.3792724609375, -0.35805511474609375, -0.3368377685546875, -0.31562042236328125, -0.294403076171875, -0.27318572998046875, -0.2519683837890625, -0.23075103759765625, -0.20953369140625, -0.18831634521484375, -0.1670989990234375, -0.14588165283203125, -0.124664306640625, -0.10344696044921875, -0.0822296142578125, -0.06101226806640625, -0.039794921875, -0.01857757568359375, 0.0026397705078125, 0.02385711669921875, 0.045074462890625, 0.06629180908203125, 0.0875091552734375, 0.10872650146484375, 0.12994384765625, 0.15116119384765625, 0.1723785400390625, 0.19359588623046875, 0.214813232421875, 0.23603057861328125, 0.2572479248046875, 0.27846527099609375, 0.2996826171875, 0.32089996337890625, 0.3421173095703125, 0.36333465576171875, 0.384552001953125, 0.40576934814453125, 0.4269866943359375, 0.44820404052734375, 0.46942138671875, 0.49063873291015625, 0.5118560791015625, 0.5330734252929688, 0.554290771484375, 0.5755081176757812, 0.5967254638671875, 0.6179428100585938, 0.63916015625]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 4.0, 13.0, 14.0, 17.0, 23.0, 38.0, 29.0, 52.0, 66.0, 54.0, 73.0, 67.0, 70.0, 82.0, 67.0, 76.0, 59.0, 47.0, 37.0, 25.0, 23.0, 15.0, 14.0, 8.0, 13.0, 7.0, 1.0, 4.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.546504020690918, -15.08419418334961, -14.621885299682617, -14.159575462341309, -13.697265625, -13.234956741333008, -12.7726469039917, -12.31033706665039, -11.848028182983398, -11.38571834564209, -10.923409461975098, -10.461099624633789, -9.99878978729248, -9.536479949951172, -9.07417106628418, -8.611861228942871, -8.149551391601562, -7.687242031097412, -7.2249321937561035, -6.762622833251953, -6.3003129959106445, -5.838003635406494, -5.375694274902344, -4.913384437561035, -4.451075077056885, -3.9887654781341553, -3.526455879211426, -3.0641465187072754, -2.601836919784546, -2.1395273208618164, -1.677217960357666, -1.2149083614349365, -0.752598762512207, -0.2902892231941223, 0.1720203161239624, 0.6343297958374023, 1.0966393947601318, 1.5589489936828613, 2.0212583541870117, 2.483567953109741, 2.9458775520324707, 3.4081871509552, 3.8704967498779297, 4.33280611038208, 4.7951154708862305, 5.257425308227539, 5.7197346687316895, 6.18204402923584, 6.644353866577148, 7.106663227081299, 7.568973064422607, 8.031282424926758, 8.493592262268066, 8.955902099609375, 9.418210983276367, 9.880520820617676, 10.342830657958984, 10.805140495300293, 11.267449378967285, 11.729759216308594, 12.192069053649902, 12.654378890991211, 13.116687774658203, 13.578997611999512, 14.041306495666504]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 6.0, 7.0, 6.0, 9.0, 6.0, 8.0, 4.0, 12.0, 11.0, 15.0, 8.0, 16.0, 23.0, 20.0, 21.0, 20.0, 34.0, 34.0, 33.0, 26.0, 30.0, 35.0, 36.0, 41.0, 38.0, 39.0, 43.0, 36.0, 40.0, 39.0, 26.0, 32.0, 28.0, 28.0, 31.0, 24.0, 26.0, 16.0, 9.0, 7.0, 19.0, 16.0, 5.0, 10.0, 12.0, 8.0, 6.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.41213321685791, -5.237030029296875, -5.061926364898682, -4.8868231773376465, -4.711719512939453, -4.536616325378418, -4.361513137817383, -4.186409950256348, -4.011306285858154, -3.83620285987854, -3.661099433898926, -3.4859962463378906, -3.3108928203582764, -3.135789394378662, -2.960686206817627, -2.7855827808380127, -2.6104793548583984, -2.435375928878784, -2.26027250289917, -2.0851693153381348, -1.9100658893585205, -1.7349624633789062, -1.5598591566085815, -1.3847558498382568, -1.2096524238586426, -1.0345489978790283, -0.8594456911087036, -0.6843423247337341, -0.5092389583587646, -0.33413559198379517, -0.15903222560882568, 0.016071081161499023, 0.19117498397827148, 0.36627835035324097, 0.5413817167282104, 0.7164850831031799, 0.8915884494781494, 1.0666918754577637, 1.2417951822280884, 1.416898488998413, 1.5920019149780273, 1.7671053409576416, 1.9422086477279663, 2.117311954498291, 2.2924153804779053, 2.4675188064575195, 2.6426219940185547, 2.817725419998169, 2.992828845977783, 3.1679322719573975, 3.3430356979370117, 3.518138885498047, 3.693242311477661, 3.8683457374572754, 4.0434489250183105, 4.218552589416504, 4.393655776977539, 4.568758964538574, 4.743862628936768, 4.918965816497803, 5.094069480895996, 5.269172668457031, 5.444275856018066, 5.619379043579102, 5.794482707977295]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 5.0, 6.0, 16.0, 17.0, 30.0, 47.0, 72.0, 92.0, 132.0, 255.0, 458.0, 679.0, 1130.0, 1881.0, 3214.0, 5126.0, 8816.0, 14841.0, 24948.0, 41814.0, 66290.0, 99934.0, 134438.0, 154988.0, 148555.0, 119720.0, 84494.0, 54600.0, 32836.0, 19868.0, 11717.0, 7015.0, 4139.0, 2504.0, 1470.0, 917.0, 543.0, 339.0, 210.0, 148.0, 99.0, 65.0, 25.0, 27.0, 17.0, 6.0, 5.0, 8.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-9.3984375, -9.128173828125, -8.85791015625, -8.587646484375, -8.3173828125, -8.047119140625, -7.77685546875, -7.506591796875, -7.236328125, -6.966064453125, -6.69580078125, -6.425537109375, -6.1552734375, -5.885009765625, -5.61474609375, -5.344482421875, -5.07421875, -4.803955078125, -4.53369140625, -4.263427734375, -3.9931640625, -3.722900390625, -3.45263671875, -3.182373046875, -2.912109375, -2.641845703125, -2.37158203125, -2.101318359375, -1.8310546875, -1.560791015625, -1.29052734375, -1.020263671875, -0.75, -0.479736328125, -0.20947265625, 0.060791015625, 0.3310546875, 0.601318359375, 0.87158203125, 1.141845703125, 1.412109375, 1.682373046875, 1.95263671875, 2.222900390625, 2.4931640625, 2.763427734375, 3.03369140625, 3.303955078125, 3.57421875, 3.844482421875, 4.11474609375, 4.385009765625, 4.6552734375, 4.925537109375, 5.19580078125, 5.466064453125, 5.736328125, 6.006591796875, 6.27685546875, 6.547119140625, 6.8173828125, 7.087646484375, 7.35791015625, 7.628173828125, 7.8984375]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 3.0, 7.0, 6.0, 6.0, 11.0, 13.0, 10.0, 17.0, 17.0, 18.0, 24.0, 24.0, 26.0, 31.0, 31.0, 41.0, 33.0, 44.0, 35.0, 38.0, 45.0, 38.0, 34.0, 44.0, 47.0, 36.0, 42.0, 33.0, 37.0, 31.0, 30.0, 26.0, 18.0, 17.0, 17.0, 15.0, 9.0, 15.0, 2.0, 4.0, 7.0, 6.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.22265625, -7.00372314453125, -6.7847900390625, -6.56585693359375, -6.346923828125, -6.12799072265625, -5.9090576171875, -5.69012451171875, -5.47119140625, -5.25225830078125, -5.0333251953125, -4.81439208984375, -4.595458984375, -4.37652587890625, -4.1575927734375, -3.93865966796875, -3.7197265625, -3.50079345703125, -3.2818603515625, -3.06292724609375, -2.843994140625, -2.62506103515625, -2.4061279296875, -2.18719482421875, -1.96826171875, -1.74932861328125, -1.5303955078125, -1.31146240234375, -1.092529296875, -0.87359619140625, -0.6546630859375, -0.43572998046875, -0.216796875, 0.00213623046875, 0.2210693359375, 0.44000244140625, 0.658935546875, 0.87786865234375, 1.0968017578125, 1.31573486328125, 1.53466796875, 1.75360107421875, 1.9725341796875, 2.19146728515625, 2.410400390625, 2.62933349609375, 2.8482666015625, 3.06719970703125, 3.2861328125, 3.50506591796875, 3.7239990234375, 3.94293212890625, 4.161865234375, 4.38079833984375, 4.5997314453125, 4.81866455078125, 5.03759765625, 5.25653076171875, 5.4754638671875, 5.69439697265625, 5.913330078125, 6.13226318359375, 6.3511962890625, 6.57012939453125, 6.7890625]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 8.0, 9.0, 10.0, 8.0, 19.0, 33.0, 46.0, 79.0, 134.0, 190.0, 293.0, 508.0, 943.0, 1667.0, 2889.0, 5391.0, 10238.0, 19240.0, 36388.0, 65910.0, 109123.0, 156901.0, 183074.0, 166432.0, 122009.0, 75440.0, 42586.0, 22978.0, 11843.0, 6390.0, 3374.0, 1802.0, 1046.0, 606.0, 313.0, 232.0, 142.0, 91.0, 54.0, 32.0, 22.0, 24.0, 15.0, 9.0, 9.0, 3.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.9453125, -9.609619140625, -9.27392578125, -8.938232421875, -8.6025390625, -8.266845703125, -7.93115234375, -7.595458984375, -7.259765625, -6.924072265625, -6.58837890625, -6.252685546875, -5.9169921875, -5.581298828125, -5.24560546875, -4.909912109375, -4.57421875, -4.238525390625, -3.90283203125, -3.567138671875, -3.2314453125, -2.895751953125, -2.56005859375, -2.224365234375, -1.888671875, -1.552978515625, -1.21728515625, -0.881591796875, -0.5458984375, -0.210205078125, 0.12548828125, 0.461181640625, 0.796875, 1.132568359375, 1.46826171875, 1.803955078125, 2.1396484375, 2.475341796875, 2.81103515625, 3.146728515625, 3.482421875, 3.818115234375, 4.15380859375, 4.489501953125, 4.8251953125, 5.160888671875, 5.49658203125, 5.832275390625, 6.16796875, 6.503662109375, 6.83935546875, 7.175048828125, 7.5107421875, 7.846435546875, 8.18212890625, 8.517822265625, 8.853515625, 9.189208984375, 9.52490234375, 9.860595703125, 10.1962890625, 10.531982421875, 10.86767578125, 11.203369140625, 11.5390625]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 5.0, 6.0, 4.0, 6.0, 12.0, 12.0, 13.0, 29.0, 22.0, 23.0, 25.0, 32.0, 43.0, 30.0, 42.0, 42.0, 46.0, 37.0, 44.0, 46.0, 59.0, 41.0, 42.0, 47.0, 32.0, 37.0, 35.0, 30.0, 30.0, 31.0, 17.0, 15.0, 15.0, 17.0, 10.0, 11.0, 1.0, 3.0, 3.0, 0.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.71484375, -4.561767578125, -4.40869140625, -4.255615234375, -4.1025390625, -3.949462890625, -3.79638671875, -3.643310546875, -3.490234375, -3.337158203125, -3.18408203125, -3.031005859375, -2.8779296875, -2.724853515625, -2.57177734375, -2.418701171875, -2.265625, -2.112548828125, -1.95947265625, -1.806396484375, -1.6533203125, -1.500244140625, -1.34716796875, -1.194091796875, -1.041015625, -0.887939453125, -0.73486328125, -0.581787109375, -0.4287109375, -0.275634765625, -0.12255859375, 0.030517578125, 0.18359375, 0.336669921875, 0.48974609375, 0.642822265625, 0.7958984375, 0.948974609375, 1.10205078125, 1.255126953125, 1.408203125, 1.561279296875, 1.71435546875, 1.867431640625, 2.0205078125, 2.173583984375, 2.32666015625, 2.479736328125, 2.6328125, 2.785888671875, 2.93896484375, 3.092041015625, 3.2451171875, 3.398193359375, 3.55126953125, 3.704345703125, 3.857421875, 4.010498046875, 4.16357421875, 4.316650390625, 4.4697265625, 4.622802734375, 4.77587890625, 4.928955078125, 5.08203125]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 6.0, 12.0, 13.0, 14.0, 15.0, 33.0, 55.0, 58.0, 79.0, 99.0, 140.0, 200.0, 221.0, 372.0, 484.0, 689.0, 1078.0, 1740.0, 3064.0, 5797.0, 12662.0, 33536.0, 98195.0, 261577.0, 345637.0, 179858.0, 61455.0, 21495.0, 8746.0, 4286.0, 2405.0, 1359.0, 985.0, 653.0, 427.0, 283.0, 214.0, 162.0, 119.0, 84.0, 63.0, 60.0, 29.0, 31.0, 16.0, 17.0, 12.0, 8.0, 6.0, 2.0, 3.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-12.296875, -11.90380859375, -11.5107421875, -11.11767578125, -10.724609375, -10.33154296875, -9.9384765625, -9.54541015625, -9.15234375, -8.75927734375, -8.3662109375, -7.97314453125, -7.580078125, -7.18701171875, -6.7939453125, -6.40087890625, -6.0078125, -5.61474609375, -5.2216796875, -4.82861328125, -4.435546875, -4.04248046875, -3.6494140625, -3.25634765625, -2.86328125, -2.47021484375, -2.0771484375, -1.68408203125, -1.291015625, -0.89794921875, -0.5048828125, -0.11181640625, 0.28125, 0.67431640625, 1.0673828125, 1.46044921875, 1.853515625, 2.24658203125, 2.6396484375, 3.03271484375, 3.42578125, 3.81884765625, 4.2119140625, 4.60498046875, 4.998046875, 5.39111328125, 5.7841796875, 6.17724609375, 6.5703125, 6.96337890625, 7.3564453125, 7.74951171875, 8.142578125, 8.53564453125, 8.9287109375, 9.32177734375, 9.71484375, 10.10791015625, 10.5009765625, 10.89404296875, 11.287109375, 11.68017578125, 12.0732421875, 12.46630859375, 12.859375]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 4.0, 3.0, 3.0, 10.0, 17.0, 24.0, 19.0, 36.0, 43.0, 54.0, 69.0, 96.0, 91.0, 99.0, 97.0, 67.0, 63.0, 38.0, 31.0, 24.0, 31.0, 24.0, 15.0, 9.0, 9.0, 4.0, 4.0, 3.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0009479522705078125, -0.0009127259254455566, -0.0008774995803833008, -0.0008422732353210449, -0.0008070468902587891, -0.0007718205451965332, -0.0007365942001342773, -0.0007013678550720215, -0.0006661415100097656, -0.0006309151649475098, -0.0005956888198852539, -0.000560462474822998, -0.0005252361297607422, -0.0004900097846984863, -0.00045478343963623047, -0.0004195570945739746, -0.00038433074951171875, -0.0003491044044494629, -0.00031387805938720703, -0.00027865171432495117, -0.0002434253692626953, -0.00020819902420043945, -0.0001729726791381836, -0.00013774633407592773, -0.00010251998901367188, -6.729364395141602e-05, -3.2067298889160156e-05, 3.159046173095703e-06, 3.838539123535156e-05, 7.361173629760742e-05, 0.00010883808135986328, 0.00014406442642211914, 0.000179290771484375, 0.00021451711654663086, 0.0002497434616088867, 0.0002849698066711426, 0.00032019615173339844, 0.0003554224967956543, 0.00039064884185791016, 0.000425875186920166, 0.0004611015319824219, 0.0004963278770446777, 0.0005315542221069336, 0.0005667805671691895, 0.0006020069122314453, 0.0006372332572937012, 0.000672459602355957, 0.0007076859474182129, 0.0007429122924804688, 0.0007781386375427246, 0.0008133649826049805, 0.0008485913276672363, 0.0008838176727294922, 0.000919044017791748, 0.0009542703628540039, 0.0009894967079162598, 0.0010247230529785156, 0.0010599493980407715, 0.0010951757431030273, 0.0011304020881652832, 0.001165628433227539, 0.001200854778289795, 0.0012360811233520508, 0.0012713074684143066, 0.0013065338134765625]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 2.0, 7.0, 4.0, 3.0, 8.0, 15.0, 17.0, 27.0, 35.0, 46.0, 57.0, 81.0, 93.0, 134.0, 227.0, 261.0, 387.0, 581.0, 824.0, 1224.0, 1911.0, 3050.0, 4952.0, 9269.0, 18186.0, 40123.0, 92331.0, 193945.0, 273592.0, 212020.0, 103944.0, 45274.0, 20567.0, 10138.0, 5611.0, 3336.0, 2101.0, 1245.0, 852.0, 615.0, 404.0, 283.0, 229.0, 162.0, 80.0, 85.0, 56.0, 40.0, 38.0, 27.0, 21.0, 15.0, 17.0, 5.0, 6.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-8.734375, -8.457763671875, -8.18115234375, -7.904541015625, -7.6279296875, -7.351318359375, -7.07470703125, -6.798095703125, -6.521484375, -6.244873046875, -5.96826171875, -5.691650390625, -5.4150390625, -5.138427734375, -4.86181640625, -4.585205078125, -4.30859375, -4.031982421875, -3.75537109375, -3.478759765625, -3.2021484375, -2.925537109375, -2.64892578125, -2.372314453125, -2.095703125, -1.819091796875, -1.54248046875, -1.265869140625, -0.9892578125, -0.712646484375, -0.43603515625, -0.159423828125, 0.1171875, 0.393798828125, 0.67041015625, 0.947021484375, 1.2236328125, 1.500244140625, 1.77685546875, 2.053466796875, 2.330078125, 2.606689453125, 2.88330078125, 3.159912109375, 3.4365234375, 3.713134765625, 3.98974609375, 4.266357421875, 4.54296875, 4.819580078125, 5.09619140625, 5.372802734375, 5.6494140625, 5.926025390625, 6.20263671875, 6.479248046875, 6.755859375, 7.032470703125, 7.30908203125, 7.585693359375, 7.8623046875, 8.138916015625, 8.41552734375, 8.692138671875, 8.96875]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 6.0, 3.0, 2.0, 2.0, 4.0, 6.0, 9.0, 6.0, 12.0, 24.0, 36.0, 41.0, 56.0, 57.0, 73.0, 85.0, 80.0, 88.0, 77.0, 63.0, 62.0, 56.0, 31.0, 28.0, 29.0, 18.0, 16.0, 9.0, 6.0, 4.0, 6.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.349609375, -2.265716552734375, -2.18182373046875, -2.097930908203125, -2.0140380859375, -1.930145263671875, -1.84625244140625, -1.762359619140625, -1.678466796875, -1.594573974609375, -1.51068115234375, -1.426788330078125, -1.3428955078125, -1.259002685546875, -1.17510986328125, -1.091217041015625, -1.00732421875, -0.923431396484375, -0.83953857421875, -0.755645751953125, -0.6717529296875, -0.587860107421875, -0.50396728515625, -0.420074462890625, -0.336181640625, -0.252288818359375, -0.16839599609375, -0.084503173828125, -0.0006103515625, 0.083282470703125, 0.16717529296875, 0.251068115234375, 0.3349609375, 0.418853759765625, 0.50274658203125, 0.586639404296875, 0.6705322265625, 0.754425048828125, 0.83831787109375, 0.922210693359375, 1.006103515625, 1.089996337890625, 1.17388916015625, 1.257781982421875, 1.3416748046875, 1.425567626953125, 1.50946044921875, 1.593353271484375, 1.67724609375, 1.761138916015625, 1.84503173828125, 1.928924560546875, 2.0128173828125, 2.096710205078125, 2.18060302734375, 2.264495849609375, 2.348388671875, 2.432281494140625, 2.51617431640625, 2.600067138671875, 2.6839599609375, 2.767852783203125, 2.85174560546875, 2.935638427734375, 3.01953125]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 9.0, 10.0, 12.0, 17.0, 13.0, 19.0, 30.0, 39.0, 47.0, 59.0, 63.0, 61.0, 73.0, 71.0, 56.0, 66.0, 61.0, 45.0, 53.0, 42.0, 35.0, 16.0, 22.0, 21.0, 17.0, 15.0, 11.0, 4.0, 4.0, 5.0, 4.0, 2.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.549323081970215, -15.116962432861328, -14.684601783752441, -14.252241134643555, -13.819879531860352, -13.387519836425781, -12.955158233642578, -12.522797584533691, -12.090436935424805, -11.658076286315918, -11.225715637207031, -10.793354988098145, -10.360994338989258, -9.928632736206055, -9.496272087097168, -9.063911437988281, -8.631550788879395, -8.199190139770508, -7.766829490661621, -7.334468364715576, -6.9021077156066895, -6.469747066497803, -6.037385940551758, -5.605025291442871, -5.172664642333984, -4.740303993225098, -4.307943344116211, -3.875582218170166, -3.4432215690612793, -3.0108609199523926, -2.5785000324249268, -2.146139144897461, -1.7137775421142578, -1.2814167737960815, -0.8490560054779053, -0.416695237159729, 0.015665531158447266, 0.448026180267334, 0.8803870677947998, 1.3127479553222656, 1.7451086044311523, 2.177469253540039, 2.609830141067505, 3.0421910285949707, 3.4745516777038574, 3.906912326812744, 4.339273452758789, 4.771634101867676, 5.2039947509765625, 5.636355400085449, 6.068716049194336, 6.501077175140381, 6.933437824249268, 7.365798473358154, 7.798159599304199, 8.230520248413086, 8.662880897521973, 9.09524154663086, 9.527602195739746, 9.959962844848633, 10.392324447631836, 10.824684143066406, 11.25704574584961, 11.689406394958496, 12.121767044067383]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 6.0, 10.0, 8.0, 10.0, 12.0, 7.0, 11.0, 15.0, 18.0, 23.0, 33.0, 42.0, 34.0, 31.0, 28.0, 43.0, 42.0, 40.0, 49.0, 43.0, 44.0, 46.0, 45.0, 42.0, 33.0, 42.0, 30.0, 36.0, 30.0, 16.0, 20.0, 26.0, 15.0, 12.0, 10.0, 12.0, 11.0, 12.0, 6.0, 3.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.618297100067139, -6.390865802764893, -6.1634345054626465, -5.936003684997559, -5.7085723876953125, -5.481141090393066, -5.25370979309082, -5.026278495788574, -4.798847198486328, -4.571415901184082, -4.343984603881836, -4.11655330657959, -3.889122486114502, -3.661691188812256, -3.4342598915100098, -3.2068285942077637, -2.979397773742676, -2.7519664764404297, -2.5245354175567627, -2.2971041202545166, -2.0696730613708496, -1.8422417640686035, -1.6148104667663574, -1.3873792886734009, -1.1599481105804443, -0.9325169324874878, -0.7050856947898865, -0.47765445709228516, -0.2502232789993286, -0.02279210090637207, 0.20463919639587402, 0.43207037448883057, 0.6595010757446289, 0.8869322538375854, 1.114363431930542, 1.341794729232788, 1.5692259073257446, 1.7966570854187012, 2.0240883827209473, 2.2515196800231934, 2.4789507389068604, 2.7063820362091064, 2.9338130950927734, 3.1612443923950195, 3.3886756896972656, 3.6161067485809326, 3.8435380458831787, 4.070969104766846, 4.298400402069092, 4.525831699371338, 4.753262996673584, 4.980693817138672, 5.208125114440918, 5.435556411743164, 5.66298770904541, 5.890419006347656, 6.117850303649902, 6.345281600952148, 6.5727128982543945, 6.800144195556641, 7.0275750160217285, 7.255006313323975, 7.482437610626221, 7.709868907928467, 7.937299728393555]}, "gradients/decoder.bert.encoder.layer.7.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 5.0, 10.0, 13.0, 27.0, 32.0, 38.0, 78.0, 113.0, 167.0, 215.0, 317.0, 513.0, 819.0, 1286.0, 1997.0, 3184.0, 5237.0, 9207.0, 15759.0, 28984.0, 55581.0, 110695.0, 230526.0, 481656.0, 881089.0, 1026037.0, 674715.0, 333537.0, 159437.0, 78577.0, 40669.0, 22286.0, 12702.0, 7248.0, 4377.0, 2668.0, 1547.0, 1012.0, 639.0, 448.0, 266.0, 196.0, 131.0, 72.0, 62.0, 42.0, 26.0, 19.0, 8.0, 7.0, 4.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-11.4140625, -11.048828125, -10.68359375, -10.318359375, -9.953125, -9.587890625, -9.22265625, -8.857421875, -8.4921875, -8.126953125, -7.76171875, -7.396484375, -7.03125, -6.666015625, -6.30078125, -5.935546875, -5.5703125, -5.205078125, -4.83984375, -4.474609375, -4.109375, -3.744140625, -3.37890625, -3.013671875, -2.6484375, -2.283203125, -1.91796875, -1.552734375, -1.1875, -0.822265625, -0.45703125, -0.091796875, 0.2734375, 0.638671875, 1.00390625, 1.369140625, 1.734375, 2.099609375, 2.46484375, 2.830078125, 3.1953125, 3.560546875, 3.92578125, 4.291015625, 4.65625, 5.021484375, 5.38671875, 5.751953125, 6.1171875, 6.482421875, 6.84765625, 7.212890625, 7.578125, 7.943359375, 8.30859375, 8.673828125, 9.0390625, 9.404296875, 9.76953125, 10.134765625, 10.5, 10.865234375, 11.23046875, 11.595703125, 11.9609375]}, "gradients/decoder.bert.encoder.layer.7.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 4.0, 6.0, 3.0, 3.0, 9.0, 6.0, 9.0, 9.0, 15.0, 23.0, 15.0, 19.0, 29.0, 33.0, 39.0, 35.0, 40.0, 37.0, 37.0, 49.0, 41.0, 41.0, 55.0, 50.0, 35.0, 44.0, 30.0, 38.0, 40.0, 36.0, 35.0, 29.0, 15.0, 15.0, 16.0, 10.0, 13.0, 12.0, 11.0, 9.0, 10.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.84765625, -4.66009521484375, -4.4725341796875, -4.28497314453125, -4.097412109375, -3.90985107421875, -3.7222900390625, -3.53472900390625, -3.34716796875, -3.15960693359375, -2.9720458984375, -2.78448486328125, -2.596923828125, -2.40936279296875, -2.2218017578125, -2.03424072265625, -1.8466796875, -1.65911865234375, -1.4715576171875, -1.28399658203125, -1.096435546875, -0.90887451171875, -0.7213134765625, -0.53375244140625, -0.34619140625, -0.15863037109375, 0.0289306640625, 0.21649169921875, 0.404052734375, 0.59161376953125, 0.7791748046875, 0.96673583984375, 1.154296875, 1.34185791015625, 1.5294189453125, 1.71697998046875, 1.904541015625, 2.09210205078125, 2.2796630859375, 2.46722412109375, 2.65478515625, 2.84234619140625, 3.0299072265625, 3.21746826171875, 3.405029296875, 3.59259033203125, 3.7801513671875, 3.96771240234375, 4.1552734375, 4.34283447265625, 4.5303955078125, 4.71795654296875, 4.905517578125, 5.09307861328125, 5.2806396484375, 5.46820068359375, 5.65576171875, 5.84332275390625, 6.0308837890625, 6.21844482421875, 6.406005859375, 6.59356689453125, 6.7811279296875, 6.96868896484375, 7.15625]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 2.0, 8.0, 13.0, 14.0, 13.0, 34.0, 57.0, 72.0, 128.0, 186.0, 261.0, 380.0, 635.0, 991.0, 1600.0, 2810.0, 4697.0, 8170.0, 14975.0, 27343.0, 52796.0, 101186.0, 198180.0, 378772.0, 668852.0, 912423.0, 792833.0, 485605.0, 259267.0, 133942.0, 68433.0, 35589.0, 18818.0, 10396.0, 5921.0, 3431.0, 2025.0, 1231.0, 768.0, 487.0, 325.0, 205.0, 136.0, 100.0, 52.0, 41.0, 29.0, 18.0, 15.0, 7.0, 3.0, 8.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-12.1171875, -11.7349853515625, -11.352783203125, -10.9705810546875, -10.58837890625, -10.2061767578125, -9.823974609375, -9.4417724609375, -9.0595703125, -8.6773681640625, -8.295166015625, -7.9129638671875, -7.53076171875, -7.1485595703125, -6.766357421875, -6.3841552734375, -6.001953125, -5.6197509765625, -5.237548828125, -4.8553466796875, -4.47314453125, -4.0909423828125, -3.708740234375, -3.3265380859375, -2.9443359375, -2.5621337890625, -2.179931640625, -1.7977294921875, -1.41552734375, -1.0333251953125, -0.651123046875, -0.2689208984375, 0.11328125, 0.4954833984375, 0.877685546875, 1.2598876953125, 1.64208984375, 2.0242919921875, 2.406494140625, 2.7886962890625, 3.1708984375, 3.5531005859375, 3.935302734375, 4.3175048828125, 4.69970703125, 5.0819091796875, 5.464111328125, 5.8463134765625, 6.228515625, 6.6107177734375, 6.992919921875, 7.3751220703125, 7.75732421875, 8.1395263671875, 8.521728515625, 8.9039306640625, 9.2861328125, 9.6683349609375, 10.050537109375, 10.4327392578125, 10.81494140625, 11.1971435546875, 11.579345703125, 11.9615478515625, 12.34375]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 7.0, 4.0, 4.0, 10.0, 11.0, 16.0, 17.0, 17.0, 24.0, 38.0, 41.0, 63.0, 96.0, 96.0, 101.0, 126.0, 166.0, 196.0, 227.0, 251.0, 252.0, 316.0, 295.0, 262.0, 244.0, 215.0, 162.0, 161.0, 158.0, 107.0, 85.0, 87.0, 56.0, 49.0, 29.0, 24.0, 18.0, 12.0, 13.0, 11.0, 5.0, 4.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-3.76953125, -3.654510498046875, -3.53948974609375, -3.424468994140625, -3.3094482421875, -3.194427490234375, -3.07940673828125, -2.964385986328125, -2.849365234375, -2.734344482421875, -2.61932373046875, -2.504302978515625, -2.3892822265625, -2.274261474609375, -2.15924072265625, -2.044219970703125, -1.92919921875, -1.814178466796875, -1.69915771484375, -1.584136962890625, -1.4691162109375, -1.354095458984375, -1.23907470703125, -1.124053955078125, -1.009033203125, -0.894012451171875, -0.77899169921875, -0.663970947265625, -0.5489501953125, -0.433929443359375, -0.31890869140625, -0.203887939453125, -0.0888671875, 0.026153564453125, 0.14117431640625, 0.256195068359375, 0.3712158203125, 0.486236572265625, 0.60125732421875, 0.716278076171875, 0.831298828125, 0.946319580078125, 1.06134033203125, 1.176361083984375, 1.2913818359375, 1.406402587890625, 1.52142333984375, 1.636444091796875, 1.75146484375, 1.866485595703125, 1.98150634765625, 2.096527099609375, 2.2115478515625, 2.326568603515625, 2.44158935546875, 2.556610107421875, 2.671630859375, 2.786651611328125, 2.90167236328125, 3.016693115234375, 3.1317138671875, 3.246734619140625, 3.36175537109375, 3.476776123046875, 3.591796875]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 6.0, 2.0, 5.0, 10.0, 13.0, 12.0, 13.0, 19.0, 18.0, 30.0, 25.0, 38.0, 41.0, 27.0, 34.0, 56.0, 63.0, 66.0, 54.0, 49.0, 40.0, 52.0, 47.0, 49.0, 32.0, 29.0, 28.0, 25.0, 23.0, 18.0, 19.0, 7.0, 14.0, 9.0, 6.0, 3.0, 8.0, 2.0, 6.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-12.261503219604492, -11.896818161010742, -11.532133102416992, -11.167448043823242, -10.802762985229492, -10.438078880310059, -10.073393821716309, -9.708708763122559, -9.344023704528809, -8.979338645935059, -8.614653587341309, -8.249968528747559, -7.885283946990967, -7.520598888397217, -7.155914306640625, -6.791229248046875, -6.426544189453125, -6.061859130859375, -5.697174072265625, -5.332489490509033, -4.967804431915283, -4.603119373321533, -4.238434791564941, -3.8737497329711914, -3.5090646743774414, -3.1443796157836914, -2.7796947956085205, -2.4150099754333496, -2.0503249168395996, -1.6856399774551392, -1.3209550380706787, -0.9562702178955078, -0.5915861129760742, -0.22690117359161377, 0.13778376579284668, 0.5024687051773071, 0.8671536445617676, 1.231838583946228, 1.5965235233306885, 1.9612083435058594, 2.3258934020996094, 2.6905784606933594, 3.0552632808685303, 3.419948101043701, 3.784633159637451, 4.149318218231201, 4.514002799987793, 4.878687858581543, 5.243372917175293, 5.608057975769043, 5.972743034362793, 6.337427616119385, 6.702112674713135, 7.066797733306885, 7.431482315063477, 7.796167373657227, 8.160852432250977, 8.525537490844727, 8.890222549438477, 9.254907608032227, 9.619592666625977, 9.98427677154541, 10.34896183013916, 10.71364688873291, 11.07833194732666]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 4.0, 10.0, 5.0, 11.0, 15.0, 16.0, 13.0, 21.0, 23.0, 24.0, 23.0, 35.0, 37.0, 35.0, 41.0, 50.0, 60.0, 57.0, 53.0, 51.0, 40.0, 41.0, 40.0, 47.0, 34.0, 29.0, 34.0, 25.0, 23.0, 22.0, 21.0, 10.0, 12.0, 12.0, 3.0, 5.0, 6.0, 1.0, 5.0, 8.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.680408000946045, -7.436301231384277, -7.192193984985352, -6.948086738586426, -6.703979969024658, -6.459873199462891, -6.215765953063965, -5.971658706665039, -5.7275519371032715, -5.483445167541504, -5.239337921142578, -4.995230674743652, -4.751123905181885, -4.507017135620117, -4.262909889221191, -4.018802642822266, -3.774695873260498, -3.5305888652801514, -3.2864818572998047, -3.042374849319458, -2.7982678413391113, -2.5541608333587646, -2.310053825378418, -2.0659468173980713, -1.8218398094177246, -1.577732801437378, -1.3336257934570312, -1.0895187854766846, -0.8454117774963379, -0.6013047695159912, -0.35719776153564453, -0.11309075355529785, 0.13101577758789062, 0.3751227855682373, 0.619229793548584, 0.8633368015289307, 1.1074438095092773, 1.351550817489624, 1.5956578254699707, 1.8397648334503174, 2.083871841430664, 2.3279788494110107, 2.5720858573913574, 2.816192865371704, 3.060299873352051, 3.3044068813323975, 3.548513889312744, 3.792620897293091, 4.0367279052734375, 4.280835151672363, 4.524941921234131, 4.769048690795898, 5.013155937194824, 5.25726318359375, 5.501369953155518, 5.745476722717285, 5.989583969116211, 6.233691215515137, 6.477797985076904, 6.721904754638672, 6.966012001037598, 7.210119247436523, 7.454226016998291, 7.698332786560059, 7.942440032958984]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 14.0, 7.0, 7.0, 18.0, 20.0, 31.0, 29.0, 56.0, 57.0, 83.0, 115.0, 131.0, 189.0, 225.0, 310.0, 441.0, 543.0, 815.0, 1229.0, 1840.0, 3078.0, 5431.0, 11251.0, 25742.0, 64610.0, 155354.0, 277047.0, 261412.0, 136962.0, 55524.0, 22222.0, 10040.0, 4986.0, 2896.0, 1778.0, 1072.0, 830.0, 536.0, 392.0, 277.0, 248.0, 194.0, 131.0, 84.0, 93.0, 55.0, 39.0, 29.0, 30.0, 17.0, 15.0, 10.0, 7.0, 4.0, 5.0, 5.0, 0.0, 2.0], "bins": [-8.7890625, -8.5220947265625, -8.255126953125, -7.9881591796875, -7.72119140625, -7.4542236328125, -7.187255859375, -6.9202880859375, -6.6533203125, -6.3863525390625, -6.119384765625, -5.8524169921875, -5.58544921875, -5.3184814453125, -5.051513671875, -4.7845458984375, -4.517578125, -4.2506103515625, -3.983642578125, -3.7166748046875, -3.44970703125, -3.1827392578125, -2.915771484375, -2.6488037109375, -2.3818359375, -2.1148681640625, -1.847900390625, -1.5809326171875, -1.31396484375, -1.0469970703125, -0.780029296875, -0.5130615234375, -0.24609375, 0.0208740234375, 0.287841796875, 0.5548095703125, 0.82177734375, 1.0887451171875, 1.355712890625, 1.6226806640625, 1.8896484375, 2.1566162109375, 2.423583984375, 2.6905517578125, 2.95751953125, 3.2244873046875, 3.491455078125, 3.7584228515625, 4.025390625, 4.2923583984375, 4.559326171875, 4.8262939453125, 5.09326171875, 5.3602294921875, 5.627197265625, 5.8941650390625, 6.1611328125, 6.4281005859375, 6.695068359375, 6.9620361328125, 7.22900390625, 7.4959716796875, 7.762939453125, 8.0299072265625, 8.296875]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 5.0, 6.0, 8.0, 13.0, 12.0, 20.0, 23.0, 16.0, 19.0, 38.0, 21.0, 30.0, 34.0, 46.0, 44.0, 46.0, 59.0, 50.0, 51.0, 62.0, 41.0, 46.0, 52.0, 34.0, 34.0, 38.0, 30.0, 26.0, 24.0, 18.0, 14.0, 6.0, 10.0, 7.0, 6.0, 6.0, 4.0, 11.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.671875, -8.37353515625, -8.0751953125, -7.77685546875, -7.478515625, -7.18017578125, -6.8818359375, -6.58349609375, -6.28515625, -5.98681640625, -5.6884765625, -5.39013671875, -5.091796875, -4.79345703125, -4.4951171875, -4.19677734375, -3.8984375, -3.60009765625, -3.3017578125, -3.00341796875, -2.705078125, -2.40673828125, -2.1083984375, -1.81005859375, -1.51171875, -1.21337890625, -0.9150390625, -0.61669921875, -0.318359375, -0.02001953125, 0.2783203125, 0.57666015625, 0.875, 1.17333984375, 1.4716796875, 1.77001953125, 2.068359375, 2.36669921875, 2.6650390625, 2.96337890625, 3.26171875, 3.56005859375, 3.8583984375, 4.15673828125, 4.455078125, 4.75341796875, 5.0517578125, 5.35009765625, 5.6484375, 5.94677734375, 6.2451171875, 6.54345703125, 6.841796875, 7.14013671875, 7.4384765625, 7.73681640625, 8.03515625, 8.33349609375, 8.6318359375, 8.93017578125, 9.228515625, 9.52685546875, 9.8251953125, 10.12353515625, 10.421875]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 7.0, 10.0, 7.0, 14.0, 19.0, 36.0, 30.0, 60.0, 97.0, 100.0, 151.0, 175.0, 283.0, 466.0, 731.0, 1289.0, 2486.0, 6565.0, 24353.0, 134502.0, 557212.0, 258948.0, 43065.0, 10090.0, 3568.0, 1654.0, 924.0, 553.0, 355.0, 236.0, 165.0, 118.0, 78.0, 62.0, 36.0, 37.0, 23.0, 8.0, 9.0, 9.0, 9.0, 6.0, 7.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.328125, -18.718017578125, -18.10791015625, -17.497802734375, -16.8876953125, -16.277587890625, -15.66748046875, -15.057373046875, -14.447265625, -13.837158203125, -13.22705078125, -12.616943359375, -12.0068359375, -11.396728515625, -10.78662109375, -10.176513671875, -9.56640625, -8.956298828125, -8.34619140625, -7.736083984375, -7.1259765625, -6.515869140625, -5.90576171875, -5.295654296875, -4.685546875, -4.075439453125, -3.46533203125, -2.855224609375, -2.2451171875, -1.635009765625, -1.02490234375, -0.414794921875, 0.1953125, 0.805419921875, 1.41552734375, 2.025634765625, 2.6357421875, 3.245849609375, 3.85595703125, 4.466064453125, 5.076171875, 5.686279296875, 6.29638671875, 6.906494140625, 7.5166015625, 8.126708984375, 8.73681640625, 9.346923828125, 9.95703125, 10.567138671875, 11.17724609375, 11.787353515625, 12.3974609375, 13.007568359375, 13.61767578125, 14.227783203125, 14.837890625, 15.447998046875, 16.05810546875, 16.668212890625, 17.2783203125, 17.888427734375, 18.49853515625, 19.108642578125, 19.71875]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 5.0, 7.0, 2.0, 6.0, 12.0, 10.0, 9.0, 17.0, 11.0, 13.0, 28.0, 18.0, 17.0, 31.0, 26.0, 26.0, 24.0, 28.0, 31.0, 40.0, 41.0, 36.0, 47.0, 39.0, 36.0, 38.0, 46.0, 49.0, 23.0, 32.0, 39.0, 22.0, 19.0, 22.0, 21.0, 25.0, 21.0, 14.0, 10.0, 11.0, 11.0, 11.0, 4.0, 7.0, 4.0, 5.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0], "bins": [-4.37890625, -4.2415771484375, -4.104248046875, -3.9669189453125, -3.82958984375, -3.6922607421875, -3.554931640625, -3.4176025390625, -3.2802734375, -3.1429443359375, -3.005615234375, -2.8682861328125, -2.73095703125, -2.5936279296875, -2.456298828125, -2.3189697265625, -2.181640625, -2.0443115234375, -1.906982421875, -1.7696533203125, -1.63232421875, -1.4949951171875, -1.357666015625, -1.2203369140625, -1.0830078125, -0.9456787109375, -0.808349609375, -0.6710205078125, -0.53369140625, -0.3963623046875, -0.259033203125, -0.1217041015625, 0.015625, 0.1529541015625, 0.290283203125, 0.4276123046875, 0.56494140625, 0.7022705078125, 0.839599609375, 0.9769287109375, 1.1142578125, 1.2515869140625, 1.388916015625, 1.5262451171875, 1.66357421875, 1.8009033203125, 1.938232421875, 2.0755615234375, 2.212890625, 2.3502197265625, 2.487548828125, 2.6248779296875, 2.76220703125, 2.8995361328125, 3.036865234375, 3.1741943359375, 3.3115234375, 3.4488525390625, 3.586181640625, 3.7235107421875, 3.86083984375, 3.9981689453125, 4.135498046875, 4.2728271484375, 4.41015625]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 4.0, 8.0, 15.0, 9.0, 26.0, 41.0, 32.0, 62.0, 73.0, 101.0, 157.0, 196.0, 290.0, 424.0, 606.0, 860.0, 1152.0, 1779.0, 2621.0, 4460.0, 9832.0, 32042.0, 147723.0, 503469.0, 259566.0, 53229.0, 14264.0, 5748.0, 3082.0, 1959.0, 1332.0, 968.0, 672.0, 447.0, 356.0, 264.0, 184.0, 143.0, 103.0, 61.0, 52.0, 38.0, 26.0, 27.0, 17.0, 8.0, 5.0, 7.0, 7.0, 6.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-8.1796875, -7.92938232421875, -7.6790771484375, -7.42877197265625, -7.178466796875, -6.92816162109375, -6.6778564453125, -6.42755126953125, -6.17724609375, -5.92694091796875, -5.6766357421875, -5.42633056640625, -5.176025390625, -4.92572021484375, -4.6754150390625, -4.42510986328125, -4.1748046875, -3.92449951171875, -3.6741943359375, -3.42388916015625, -3.173583984375, -2.92327880859375, -2.6729736328125, -2.42266845703125, -2.17236328125, -1.92205810546875, -1.6717529296875, -1.42144775390625, -1.171142578125, -0.92083740234375, -0.6705322265625, -0.42022705078125, -0.169921875, 0.08038330078125, 0.3306884765625, 0.58099365234375, 0.831298828125, 1.08160400390625, 1.3319091796875, 1.58221435546875, 1.83251953125, 2.08282470703125, 2.3331298828125, 2.58343505859375, 2.833740234375, 3.08404541015625, 3.3343505859375, 3.58465576171875, 3.8349609375, 4.08526611328125, 4.3355712890625, 4.58587646484375, 4.836181640625, 5.08648681640625, 5.3367919921875, 5.58709716796875, 5.83740234375, 6.08770751953125, 6.3380126953125, 6.58831787109375, 6.838623046875, 7.08892822265625, 7.3392333984375, 7.58953857421875, 7.83984375]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 5.0, 1.0, 4.0, 4.0, 8.0, 17.0, 31.0, 55.0, 122.0, 183.0, 204.0, 153.0, 116.0, 50.0, 23.0, 11.0, 4.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0005311965942382812, -0.0005165338516235352, -0.0005018711090087891, -0.00048720836639404297, -0.0004725456237792969, -0.0004578828811645508, -0.0004432201385498047, -0.0004285573959350586, -0.0004138946533203125, -0.0003992319107055664, -0.0003845691680908203, -0.0003699064254760742, -0.0003552436828613281, -0.00034058094024658203, -0.00032591819763183594, -0.00031125545501708984, -0.00029659271240234375, -0.00028192996978759766, -0.00026726722717285156, -0.00025260448455810547, -0.00023794174194335938, -0.00022327899932861328, -0.0002086162567138672, -0.0001939535140991211, -0.000179290771484375, -0.0001646280288696289, -0.0001499652862548828, -0.00013530254364013672, -0.00012063980102539062, -0.00010597705841064453, -9.131431579589844e-05, -7.665157318115234e-05, -6.198883056640625e-05, -4.7326087951660156e-05, -3.266334533691406e-05, -1.800060272216797e-05, -3.337860107421875e-06, 1.1324882507324219e-05, 2.5987625122070312e-05, 4.0650367736816406e-05, 5.53131103515625e-05, 6.99758529663086e-05, 8.463859558105469e-05, 9.930133819580078e-05, 0.00011396408081054688, 0.00012862682342529297, 0.00014328956604003906, 0.00015795230865478516, 0.00017261505126953125, 0.00018727779388427734, 0.00020194053649902344, 0.00021660327911376953, 0.00023126602172851562, 0.0002459287643432617, 0.0002605915069580078, 0.0002752542495727539, 0.0002899169921875, 0.0003045797348022461, 0.0003192424774169922, 0.0003339052200317383, 0.0003485679626464844, 0.00036323070526123047, 0.00037789344787597656, 0.00039255619049072266, 0.00040721893310546875]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 5.0, 4.0, 10.0, 4.0, 11.0, 24.0, 38.0, 37.0, 63.0, 81.0, 121.0, 152.0, 274.0, 330.0, 464.0, 696.0, 978.0, 1615.0, 2650.0, 4367.0, 10473.0, 85335.0, 622302.0, 279181.0, 23986.0, 5998.0, 3200.0, 2043.0, 1319.0, 896.0, 586.0, 389.0, 275.0, 201.0, 141.0, 102.0, 63.0, 37.0, 30.0, 28.0, 19.0, 11.0, 5.0, 6.0, 5.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0], "bins": [-13.484375, -13.1070556640625, -12.729736328125, -12.3524169921875, -11.97509765625, -11.5977783203125, -11.220458984375, -10.8431396484375, -10.4658203125, -10.0885009765625, -9.711181640625, -9.3338623046875, -8.95654296875, -8.5792236328125, -8.201904296875, -7.8245849609375, -7.447265625, -7.0699462890625, -6.692626953125, -6.3153076171875, -5.93798828125, -5.5606689453125, -5.183349609375, -4.8060302734375, -4.4287109375, -4.0513916015625, -3.674072265625, -3.2967529296875, -2.91943359375, -2.5421142578125, -2.164794921875, -1.7874755859375, -1.41015625, -1.0328369140625, -0.655517578125, -0.2781982421875, 0.09912109375, 0.4764404296875, 0.853759765625, 1.2310791015625, 1.6083984375, 1.9857177734375, 2.363037109375, 2.7403564453125, 3.11767578125, 3.4949951171875, 3.872314453125, 4.2496337890625, 4.626953125, 5.0042724609375, 5.381591796875, 5.7589111328125, 6.13623046875, 6.5135498046875, 6.890869140625, 7.2681884765625, 7.6455078125, 8.0228271484375, 8.400146484375, 8.7774658203125, 9.15478515625, 9.5321044921875, 9.909423828125, 10.2867431640625, 10.6640625]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 7.0, 27.0, 100.0, 254.0, 301.0, 198.0, 66.0, 19.0, 4.0, 3.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.91796875, -4.778778076171875, -4.63958740234375, -4.500396728515625, -4.3612060546875, -4.222015380859375, -4.08282470703125, -3.943634033203125, -3.804443359375, -3.665252685546875, -3.52606201171875, -3.386871337890625, -3.2476806640625, -3.108489990234375, -2.96929931640625, -2.830108642578125, -2.69091796875, -2.551727294921875, -2.41253662109375, -2.273345947265625, -2.1341552734375, -1.994964599609375, -1.85577392578125, -1.716583251953125, -1.577392578125, -1.438201904296875, -1.29901123046875, -1.159820556640625, -1.0206298828125, -0.881439208984375, -0.74224853515625, -0.603057861328125, -0.4638671875, -0.324676513671875, -0.18548583984375, -0.046295166015625, 0.0928955078125, 0.232086181640625, 0.37127685546875, 0.510467529296875, 0.649658203125, 0.788848876953125, 0.92803955078125, 1.067230224609375, 1.2064208984375, 1.345611572265625, 1.48480224609375, 1.623992919921875, 1.76318359375, 1.902374267578125, 2.04156494140625, 2.180755615234375, 2.3199462890625, 2.459136962890625, 2.59832763671875, 2.737518310546875, 2.876708984375, 3.015899658203125, 3.15509033203125, 3.294281005859375, 3.4334716796875, 3.572662353515625, 3.71185302734375, 3.851043701171875, 3.990234375]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 2.0, 4.0, 6.0, 9.0, 13.0, 16.0, 12.0, 12.0, 28.0, 35.0, 28.0, 29.0, 46.0, 34.0, 38.0, 60.0, 61.0, 46.0, 66.0, 49.0, 47.0, 46.0, 51.0, 36.0, 35.0, 33.0, 22.0, 31.0, 14.0, 23.0, 12.0, 12.0, 13.0, 6.0, 6.0, 5.0, 4.0, 7.0, 3.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0], "bins": [-13.80494499206543, -13.435741424560547, -13.066537857055664, -12.697334289550781, -12.328129768371582, -11.9589262008667, -11.589722633361816, -11.220519065856934, -10.851314544677734, -10.482110977172852, -10.112907409667969, -9.743703842163086, -9.374499320983887, -9.005295753479004, -8.636092185974121, -8.266888618469238, -7.8976850509643555, -7.528481483459473, -7.159277439117432, -6.790073871612549, -6.420869827270508, -6.051666259765625, -5.682462692260742, -5.313259124755859, -4.944055080413818, -4.5748515129089355, -4.2056474685668945, -3.8364439010620117, -3.46724009513855, -3.098036289215088, -2.728832721710205, -2.359628915786743, -1.9904241561889648, -1.621220350265503, -1.2520166635513306, -0.8828129768371582, -0.5136091709136963, -0.14440536499023438, 0.22479820251464844, 0.5940020084381104, 0.9632058143615723, 1.3324096202850342, 1.7016133069992065, 2.070816993713379, 2.440020799636841, 2.8092246055603027, 3.1784281730651855, 3.5476319789886475, 3.9168357849121094, 4.286039352416992, 4.655243396759033, 5.024446964263916, 5.393651008605957, 5.76285457611084, 6.132058143615723, 6.5012617111206055, 6.8704657554626465, 7.239669322967529, 7.60887336730957, 7.978076934814453, 8.347280502319336, 8.716484069824219, 9.085687637329102, 9.4548921585083, 9.824095726013184]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 5.0, 9.0, 9.0, 10.0, 16.0, 14.0, 17.0, 18.0, 22.0, 25.0, 30.0, 34.0, 44.0, 38.0, 46.0, 62.0, 48.0, 43.0, 62.0, 45.0, 51.0, 46.0, 40.0, 33.0, 36.0, 26.0, 27.0, 27.0, 26.0, 21.0, 18.0, 13.0, 9.0, 5.0, 6.0, 7.0, 5.0, 5.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.964357852935791, -7.708812236785889, -7.4532670974731445, -7.197721481323242, -6.942176342010498, -6.686630725860596, -6.431085586547852, -6.175539970397949, -5.919994354248047, -5.6644487380981445, -5.4089035987854, -5.153357982635498, -4.897812843322754, -4.642267227172852, -4.386721611022949, -4.131176471710205, -3.875631332397461, -3.6200859546661377, -3.3645405769348145, -3.108994960784912, -2.853449821472168, -2.5979042053222656, -2.3423588275909424, -2.086813449859619, -1.831268072128296, -1.5757226943969727, -1.3201773166656494, -1.0646318197250366, -0.8090864419937134, -0.5535410642623901, -0.29799556732177734, -0.0424501895904541, 0.21309566497802734, 0.468641072511673, 0.7241864800453186, 0.9797319173812866, 1.2352772951126099, 1.490822672843933, 1.746368169784546, 2.001913547515869, 2.2574589252471924, 2.5130043029785156, 2.768549680709839, 3.024095058441162, 3.2796406745910645, 3.5351858139038086, 3.790731430053711, 4.046277046203613, 4.301822185516357, 4.55736780166626, 4.812912940979004, 5.068458557128906, 5.32400369644165, 5.579549312591553, 5.835094451904297, 6.090640068054199, 6.346185684204102, 6.601731300354004, 6.857276439666748, 7.11282205581665, 7.3683671951293945, 7.623912811279297, 7.879458427429199, 8.135004043579102, 8.390548706054688]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 6.0, 8.0, 6.0, 16.0, 17.0, 17.0, 25.0, 37.0, 58.0, 88.0, 105.0, 185.0, 254.0, 378.0, 532.0, 790.0, 1137.0, 1704.0, 2615.0, 4153.0, 6389.0, 10568.0, 16817.0, 27594.0, 43840.0, 67202.0, 97791.0, 128409.0, 146128.0, 141067.0, 115205.0, 83578.0, 56220.0, 35848.0, 22204.0, 13840.0, 8485.0, 5251.0, 3457.0, 2150.0, 1434.0, 911.0, 619.0, 433.0, 296.0, 196.0, 152.0, 97.0, 93.0, 46.0, 29.0, 26.0, 13.0, 12.0, 17.0, 8.0, 3.0, 2.0, 0.0, 4.0, 2.0], "bins": [-9.5625, -9.2615966796875, -8.960693359375, -8.6597900390625, -8.35888671875, -8.0579833984375, -7.757080078125, -7.4561767578125, -7.1552734375, -6.8543701171875, -6.553466796875, -6.2525634765625, -5.95166015625, -5.6507568359375, -5.349853515625, -5.0489501953125, -4.748046875, -4.4471435546875, -4.146240234375, -3.8453369140625, -3.54443359375, -3.2435302734375, -2.942626953125, -2.6417236328125, -2.3408203125, -2.0399169921875, -1.739013671875, -1.4381103515625, -1.13720703125, -0.8363037109375, -0.535400390625, -0.2344970703125, 0.06640625, 0.3673095703125, 0.668212890625, 0.9691162109375, 1.27001953125, 1.5709228515625, 1.871826171875, 2.1727294921875, 2.4736328125, 2.7745361328125, 3.075439453125, 3.3763427734375, 3.67724609375, 3.9781494140625, 4.279052734375, 4.5799560546875, 4.880859375, 5.1817626953125, 5.482666015625, 5.7835693359375, 6.08447265625, 6.3853759765625, 6.686279296875, 6.9871826171875, 7.2880859375, 7.5889892578125, 7.889892578125, 8.1907958984375, 8.49169921875, 8.7926025390625, 9.093505859375, 9.3944091796875, 9.6953125]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 9.0, 9.0, 15.0, 12.0, 15.0, 16.0, 16.0, 23.0, 29.0, 31.0, 35.0, 41.0, 37.0, 40.0, 36.0, 37.0, 48.0, 54.0, 42.0, 46.0, 43.0, 40.0, 42.0, 44.0, 29.0, 25.0, 28.0, 24.0, 25.0, 18.0, 24.0, 17.0, 14.0, 8.0, 5.0, 9.0, 6.0, 3.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.1640625, -7.898681640625, -7.63330078125, -7.367919921875, -7.1025390625, -6.837158203125, -6.57177734375, -6.306396484375, -6.041015625, -5.775634765625, -5.51025390625, -5.244873046875, -4.9794921875, -4.714111328125, -4.44873046875, -4.183349609375, -3.91796875, -3.652587890625, -3.38720703125, -3.121826171875, -2.8564453125, -2.591064453125, -2.32568359375, -2.060302734375, -1.794921875, -1.529541015625, -1.26416015625, -0.998779296875, -0.7333984375, -0.468017578125, -0.20263671875, 0.062744140625, 0.328125, 0.593505859375, 0.85888671875, 1.124267578125, 1.3896484375, 1.655029296875, 1.92041015625, 2.185791015625, 2.451171875, 2.716552734375, 2.98193359375, 3.247314453125, 3.5126953125, 3.778076171875, 4.04345703125, 4.308837890625, 4.57421875, 4.839599609375, 5.10498046875, 5.370361328125, 5.6357421875, 5.901123046875, 6.16650390625, 6.431884765625, 6.697265625, 6.962646484375, 7.22802734375, 7.493408203125, 7.7587890625, 8.024169921875, 8.28955078125, 8.554931640625, 8.8203125]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 6.0, 5.0, 4.0, 14.0, 26.0, 24.0, 47.0, 44.0, 75.0, 97.0, 184.0, 269.0, 368.0, 541.0, 818.0, 1180.0, 1921.0, 3008.0, 4572.0, 6819.0, 10483.0, 16211.0, 25193.0, 37953.0, 54964.0, 78056.0, 101984.0, 122368.0, 129353.0, 119828.0, 99474.0, 74848.0, 52784.0, 36144.0, 23681.0, 15794.0, 10297.0, 6488.0, 4346.0, 2830.0, 1871.0, 1190.0, 746.0, 564.0, 329.0, 249.0, 162.0, 115.0, 79.0, 49.0, 36.0, 28.0, 12.0, 11.0, 6.0, 4.0, 6.0, 2.0, 1.0, 4.0, 3.0], "bins": [-8.6171875, -8.3431396484375, -8.069091796875, -7.7950439453125, -7.52099609375, -7.2469482421875, -6.972900390625, -6.6988525390625, -6.4248046875, -6.1507568359375, -5.876708984375, -5.6026611328125, -5.32861328125, -5.0545654296875, -4.780517578125, -4.5064697265625, -4.232421875, -3.9583740234375, -3.684326171875, -3.4102783203125, -3.13623046875, -2.8621826171875, -2.588134765625, -2.3140869140625, -2.0400390625, -1.7659912109375, -1.491943359375, -1.2178955078125, -0.94384765625, -0.6697998046875, -0.395751953125, -0.1217041015625, 0.15234375, 0.4263916015625, 0.700439453125, 0.9744873046875, 1.24853515625, 1.5225830078125, 1.796630859375, 2.0706787109375, 2.3447265625, 2.6187744140625, 2.892822265625, 3.1668701171875, 3.44091796875, 3.7149658203125, 3.989013671875, 4.2630615234375, 4.537109375, 4.8111572265625, 5.085205078125, 5.3592529296875, 5.63330078125, 5.9073486328125, 6.181396484375, 6.4554443359375, 6.7294921875, 7.0035400390625, 7.277587890625, 7.5516357421875, 7.82568359375, 8.0997314453125, 8.373779296875, 8.6478271484375, 8.921875]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 4.0, 3.0, 3.0, 2.0, 10.0, 11.0, 14.0, 11.0, 13.0, 15.0, 13.0, 12.0, 15.0, 24.0, 14.0, 21.0, 30.0, 26.0, 30.0, 29.0, 37.0, 29.0, 43.0, 40.0, 40.0, 35.0, 48.0, 37.0, 37.0, 34.0, 25.0, 26.0, 27.0, 39.0, 24.0, 24.0, 28.0, 21.0, 15.0, 13.0, 14.0, 15.0, 13.0, 11.0, 11.0, 8.0, 1.0, 6.0, 2.0, 0.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.8984375, -3.760986328125, -3.62353515625, -3.486083984375, -3.3486328125, -3.211181640625, -3.07373046875, -2.936279296875, -2.798828125, -2.661376953125, -2.52392578125, -2.386474609375, -2.2490234375, -2.111572265625, -1.97412109375, -1.836669921875, -1.69921875, -1.561767578125, -1.42431640625, -1.286865234375, -1.1494140625, -1.011962890625, -0.87451171875, -0.737060546875, -0.599609375, -0.462158203125, -0.32470703125, -0.187255859375, -0.0498046875, 0.087646484375, 0.22509765625, 0.362548828125, 0.5, 0.637451171875, 0.77490234375, 0.912353515625, 1.0498046875, 1.187255859375, 1.32470703125, 1.462158203125, 1.599609375, 1.737060546875, 1.87451171875, 2.011962890625, 2.1494140625, 2.286865234375, 2.42431640625, 2.561767578125, 2.69921875, 2.836669921875, 2.97412109375, 3.111572265625, 3.2490234375, 3.386474609375, 3.52392578125, 3.661376953125, 3.798828125, 3.936279296875, 4.07373046875, 4.211181640625, 4.3486328125, 4.486083984375, 4.62353515625, 4.760986328125, 4.8984375]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 9.0, 12.0, 14.0, 27.0, 28.0, 67.0, 91.0, 150.0, 188.0, 334.0, 462.0, 778.0, 1246.0, 1865.0, 3089.0, 4866.0, 8201.0, 13881.0, 25190.0, 45959.0, 86948.0, 163426.0, 238364.0, 202154.0, 114468.0, 60419.0, 32143.0, 17657.0, 10202.0, 6071.0, 3808.0, 2303.0, 1553.0, 934.0, 592.0, 377.0, 240.0, 167.0, 106.0, 67.0, 37.0, 25.0, 17.0, 9.0, 4.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.140625, -8.822265625, -8.50390625, -8.185546875, -7.8671875, -7.548828125, -7.23046875, -6.912109375, -6.59375, -6.275390625, -5.95703125, -5.638671875, -5.3203125, -5.001953125, -4.68359375, -4.365234375, -4.046875, -3.728515625, -3.41015625, -3.091796875, -2.7734375, -2.455078125, -2.13671875, -1.818359375, -1.5, -1.181640625, -0.86328125, -0.544921875, -0.2265625, 0.091796875, 0.41015625, 0.728515625, 1.046875, 1.365234375, 1.68359375, 2.001953125, 2.3203125, 2.638671875, 2.95703125, 3.275390625, 3.59375, 3.912109375, 4.23046875, 4.548828125, 4.8671875, 5.185546875, 5.50390625, 5.822265625, 6.140625, 6.458984375, 6.77734375, 7.095703125, 7.4140625, 7.732421875, 8.05078125, 8.369140625, 8.6875, 9.005859375, 9.32421875, 9.642578125, 9.9609375, 10.279296875, 10.59765625, 10.916015625, 11.234375]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 7.0, 9.0, 12.0, 13.0, 20.0, 23.0, 25.0, 22.0, 36.0, 42.0, 62.0, 75.0, 78.0, 83.0, 78.0, 93.0, 53.0, 61.0, 44.0, 28.0, 26.0, 15.0, 26.0, 6.0, 11.0, 8.0, 4.0, 8.0, 8.0, 5.0, 4.0, 5.0, 4.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014667510986328125, -0.0014257729053497314, -0.0013847947120666504, -0.0013438165187835693, -0.0013028383255004883, -0.0012618601322174072, -0.0012208819389343262, -0.0011799037456512451, -0.001138925552368164, -0.001097947359085083, -0.001056969165802002, -0.001015990972518921, -0.0009750127792358398, -0.0009340345859527588, -0.0008930563926696777, -0.0008520781993865967, -0.0008111000061035156, -0.0007701218128204346, -0.0007291436195373535, -0.0006881654262542725, -0.0006471872329711914, -0.0006062090396881104, -0.0005652308464050293, -0.0005242526531219482, -0.0004832744598388672, -0.00044229626655578613, -0.0004013180732727051, -0.000360339879989624, -0.00031936168670654297, -0.0002783834934234619, -0.00023740530014038086, -0.0001964271068572998, -0.00015544891357421875, -0.0001144707202911377, -7.349252700805664e-05, -3.2514333724975586e-05, 8.463859558105469e-06, 4.9442052841186523e-05, 9.042024612426758e-05, 0.00013139843940734863, 0.0001723766326904297, 0.00021335482597351074, 0.0002543330192565918, 0.00029531121253967285, 0.0003362894058227539, 0.00037726759910583496, 0.000418245792388916, 0.00045922398567199707, 0.0005002021789550781, 0.0005411803722381592, 0.0005821585655212402, 0.0006231367588043213, 0.0006641149520874023, 0.0007050931453704834, 0.0007460713386535645, 0.0007870495319366455, 0.0008280277252197266, 0.0008690059185028076, 0.0009099841117858887, 0.0009509623050689697, 0.0009919404983520508, 0.0010329186916351318, 0.0010738968849182129, 0.001114875078201294, 0.001155853271484375]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 7.0, 10.0, 14.0, 22.0, 27.0, 52.0, 81.0, 137.0, 218.0, 351.0, 528.0, 844.0, 1321.0, 2074.0, 3347.0, 5491.0, 9246.0, 16328.0, 29372.0, 55060.0, 105996.0, 189524.0, 239097.0, 177258.0, 97422.0, 50375.0, 27007.0, 14865.0, 8669.0, 5266.0, 3209.0, 1953.0, 1298.0, 769.0, 449.0, 318.0, 212.0, 119.0, 72.0, 57.0, 41.0, 21.0, 16.0, 8.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.34375, -8.05029296875, -7.7568359375, -7.46337890625, -7.169921875, -6.87646484375, -6.5830078125, -6.28955078125, -5.99609375, -5.70263671875, -5.4091796875, -5.11572265625, -4.822265625, -4.52880859375, -4.2353515625, -3.94189453125, -3.6484375, -3.35498046875, -3.0615234375, -2.76806640625, -2.474609375, -2.18115234375, -1.8876953125, -1.59423828125, -1.30078125, -1.00732421875, -0.7138671875, -0.42041015625, -0.126953125, 0.16650390625, 0.4599609375, 0.75341796875, 1.046875, 1.34033203125, 1.6337890625, 1.92724609375, 2.220703125, 2.51416015625, 2.8076171875, 3.10107421875, 3.39453125, 3.68798828125, 3.9814453125, 4.27490234375, 4.568359375, 4.86181640625, 5.1552734375, 5.44873046875, 5.7421875, 6.03564453125, 6.3291015625, 6.62255859375, 6.916015625, 7.20947265625, 7.5029296875, 7.79638671875, 8.08984375, 8.38330078125, 8.6767578125, 8.97021484375, 9.263671875, 9.55712890625, 9.8505859375, 10.14404296875, 10.4375]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 5.0, 9.0, 6.0, 5.0, 7.0, 10.0, 6.0, 9.0, 15.0, 13.0, 16.0, 17.0, 37.0, 34.0, 43.0, 63.0, 66.0, 47.0, 62.0, 66.0, 76.0, 57.0, 55.0, 48.0, 32.0, 40.0, 28.0, 24.0, 14.0, 18.0, 7.0, 9.0, 11.0, 13.0, 6.0, 5.0, 5.0, 3.0, 1.0, 6.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.40234375, -2.3319091796875, -2.261474609375, -2.1910400390625, -2.12060546875, -2.0501708984375, -1.979736328125, -1.9093017578125, -1.8388671875, -1.7684326171875, -1.697998046875, -1.6275634765625, -1.55712890625, -1.4866943359375, -1.416259765625, -1.3458251953125, -1.275390625, -1.2049560546875, -1.134521484375, -1.0640869140625, -0.99365234375, -0.9232177734375, -0.852783203125, -0.7823486328125, -0.7119140625, -0.6414794921875, -0.571044921875, -0.5006103515625, -0.43017578125, -0.3597412109375, -0.289306640625, -0.2188720703125, -0.1484375, -0.0780029296875, -0.007568359375, 0.0628662109375, 0.13330078125, 0.2037353515625, 0.274169921875, 0.3446044921875, 0.4150390625, 0.4854736328125, 0.555908203125, 0.6263427734375, 0.69677734375, 0.7672119140625, 0.837646484375, 0.9080810546875, 0.978515625, 1.0489501953125, 1.119384765625, 1.1898193359375, 1.26025390625, 1.3306884765625, 1.401123046875, 1.4715576171875, 1.5419921875, 1.6124267578125, 1.682861328125, 1.7532958984375, 1.82373046875, 1.8941650390625, 1.964599609375, 2.0350341796875, 2.10546875]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 5.0, 3.0, 7.0, 8.0, 6.0, 8.0, 8.0, 22.0, 15.0, 16.0, 33.0, 28.0, 21.0, 35.0, 48.0, 34.0, 50.0, 59.0, 44.0, 49.0, 46.0, 47.0, 66.0, 40.0, 50.0, 36.0, 40.0, 25.0, 26.0, 18.0, 13.0, 20.0, 22.0, 8.0, 12.0, 6.0, 8.0, 2.0, 6.0, 5.0, 1.0, 4.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.72091007232666, -11.356776237487793, -10.992643356323242, -10.628509521484375, -10.264375686645508, -9.90024185180664, -9.536108016967773, -9.171975135803223, -8.807841300964355, -8.443707466125488, -8.079574584960938, -7.71544075012207, -7.351306915283203, -6.987173080444336, -6.623039722442627, -6.258906364440918, -5.894772529602051, -5.530638694763184, -5.166505336761475, -4.802371978759766, -4.438238143920898, -4.074104309082031, -3.7099709510803223, -3.345837354660034, -2.981703758239746, -2.617570161819458, -2.25343656539917, -1.8893029689788818, -1.5251693725585938, -1.1610357761383057, -0.7969021797180176, -0.4327685832977295, -0.06863594055175781, 0.2954976558685303, 0.6596312522888184, 1.0237648487091064, 1.3878984451293945, 1.7520320415496826, 2.1161656379699707, 2.480299234390259, 2.844432830810547, 3.208566427230835, 3.572700023651123, 3.936833620071411, 4.300967216491699, 4.665101051330566, 5.029234409332275, 5.393367767333984, 5.757501602172852, 6.121635437011719, 6.485768795013428, 6.849902153015137, 7.214035987854004, 7.578169822692871, 7.94230318069458, 8.306436538696289, 8.670570373535156, 9.034704208374023, 9.39883804321289, 9.762970924377441, 10.127104759216309, 10.491238594055176, 10.855371475219727, 11.219505310058594, 11.583639144897461]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 9.0, 13.0, 14.0, 17.0, 18.0, 14.0, 24.0, 23.0, 32.0, 37.0, 34.0, 39.0, 46.0, 47.0, 52.0, 43.0, 38.0, 41.0, 55.0, 45.0, 36.0, 42.0, 30.0, 27.0, 38.0, 36.0, 20.0, 22.0, 17.0, 15.0, 14.0, 13.0, 13.0, 10.0, 7.0, 8.0, 2.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-9.093531608581543, -8.833710670471191, -8.573888778686523, -8.314067840576172, -8.05424690246582, -7.7944254875183105, -7.534604072570801, -7.274783134460449, -7.014962196350098, -6.755140781402588, -6.495319843292236, -6.235498428344727, -5.975677490234375, -5.715856075286865, -5.4560346603393555, -5.196213722229004, -4.936392307281494, -4.676570892333984, -4.416749954223633, -4.156928539276123, -3.8971076011657715, -3.6372861862182617, -3.377465009689331, -3.1176438331604004, -2.8578226566314697, -2.598001480102539, -2.3381803035736084, -2.0783591270446777, -1.8185378313064575, -1.5587166547775269, -1.2988953590393066, -1.039074182510376, -0.7792530059814453, -0.5194318294525146, -0.2596105933189392, 0.00021064281463623047, 0.2600318193435669, 0.5198529958724976, 0.7796742916107178, 1.0394954681396484, 1.299316644668579, 1.5591378211975098, 1.8189589977264404, 2.078780174255371, 2.338601589202881, 2.5984225273132324, 2.858243942260742, 3.118065118789673, 3.3778862953186035, 3.637707471847534, 3.897528648376465, 4.157350063323975, 4.417171001434326, 4.676992416381836, 4.9368133544921875, 5.196634769439697, 5.456456184387207, 5.716277599334717, 5.976098537445068, 6.235919952392578, 6.49574089050293, 6.7555623054504395, 7.015383720397949, 7.275204658508301, 7.535025596618652]}, "gradients/decoder.bert.encoder.layer.6.output.dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 2.0, 7.0, 8.0, 12.0, 26.0, 24.0, 57.0, 73.0, 122.0, 141.0, 199.0, 293.0, 487.0, 647.0, 944.0, 1470.0, 2201.0, 3489.0, 5730.0, 9362.0, 15317.0, 26720.0, 46294.0, 83583.0, 151451.0, 278347.0, 496512.0, 768152.0, 848320.0, 632884.0, 368665.0, 198949.0, 107647.0, 59544.0, 34527.0, 19474.0, 11844.0, 7177.0, 4669.0, 2985.0, 1946.0, 1291.0, 826.0, 593.0, 381.0, 280.0, 175.0, 153.0, 90.0, 69.0, 48.0, 29.0, 24.0, 8.0, 7.0, 6.0, 8.0, 3.0, 2.0, 2.0], "bins": [-10.5390625, -10.212158203125, -9.88525390625, -9.558349609375, -9.2314453125, -8.904541015625, -8.57763671875, -8.250732421875, -7.923828125, -7.596923828125, -7.27001953125, -6.943115234375, -6.6162109375, -6.289306640625, -5.96240234375, -5.635498046875, -5.30859375, -4.981689453125, -4.65478515625, -4.327880859375, -4.0009765625, -3.674072265625, -3.34716796875, -3.020263671875, -2.693359375, -2.366455078125, -2.03955078125, -1.712646484375, -1.3857421875, -1.058837890625, -0.73193359375, -0.405029296875, -0.078125, 0.248779296875, 0.57568359375, 0.902587890625, 1.2294921875, 1.556396484375, 1.88330078125, 2.210205078125, 2.537109375, 2.864013671875, 3.19091796875, 3.517822265625, 3.8447265625, 4.171630859375, 4.49853515625, 4.825439453125, 5.15234375, 5.479248046875, 5.80615234375, 6.133056640625, 6.4599609375, 6.786865234375, 7.11376953125, 7.440673828125, 7.767578125, 8.094482421875, 8.42138671875, 8.748291015625, 9.0751953125, 9.402099609375, 9.72900390625, 10.055908203125, 10.3828125]}, "gradients/decoder.bert.encoder.layer.6.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 4.0, 8.0, 9.0, 11.0, 11.0, 11.0, 11.0, 27.0, 24.0, 24.0, 32.0, 29.0, 30.0, 36.0, 28.0, 37.0, 39.0, 52.0, 44.0, 48.0, 34.0, 41.0, 36.0, 39.0, 35.0, 34.0, 29.0, 39.0, 27.0, 17.0, 21.0, 25.0, 20.0, 20.0, 15.0, 5.0, 14.0, 10.0, 3.0, 5.0, 3.0, 4.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.73046875, -5.55084228515625, -5.3712158203125, -5.19158935546875, -5.011962890625, -4.83233642578125, -4.6527099609375, -4.47308349609375, -4.29345703125, -4.11383056640625, -3.9342041015625, -3.75457763671875, -3.574951171875, -3.39532470703125, -3.2156982421875, -3.03607177734375, -2.8564453125, -2.67681884765625, -2.4971923828125, -2.31756591796875, -2.137939453125, -1.95831298828125, -1.7786865234375, -1.59906005859375, -1.41943359375, -1.23980712890625, -1.0601806640625, -0.88055419921875, -0.700927734375, -0.52130126953125, -0.3416748046875, -0.16204833984375, 0.017578125, 0.19720458984375, 0.3768310546875, 0.55645751953125, 0.736083984375, 0.91571044921875, 1.0953369140625, 1.27496337890625, 1.45458984375, 1.63421630859375, 1.8138427734375, 1.99346923828125, 2.173095703125, 2.35272216796875, 2.5323486328125, 2.71197509765625, 2.8916015625, 3.07122802734375, 3.2508544921875, 3.43048095703125, 3.610107421875, 3.78973388671875, 3.9693603515625, 4.14898681640625, 4.32861328125, 4.50823974609375, 4.6878662109375, 4.86749267578125, 5.047119140625, 5.22674560546875, 5.4063720703125, 5.58599853515625, 5.765625]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 5.0, 10.0, 19.0, 29.0, 29.0, 52.0, 75.0, 142.0, 180.0, 279.0, 446.0, 693.0, 1126.0, 1750.0, 2856.0, 4692.0, 8258.0, 14246.0, 24809.0, 43552.0, 78032.0, 137261.0, 242473.0, 410615.0, 631411.0, 780491.0, 689695.0, 468935.0, 281750.0, 160474.0, 90225.0, 50812.0, 28698.0, 16301.0, 9489.0, 5529.0, 3379.0, 2023.0, 1254.0, 827.0, 463.0, 333.0, 205.0, 139.0, 70.0, 60.0, 30.0, 34.0, 12.0, 7.0, 4.0, 4.0, 5.0, 2.0, 3.0, 1.0], "bins": [-11.8125, -11.4613037109375, -11.110107421875, -10.7589111328125, -10.40771484375, -10.0565185546875, -9.705322265625, -9.3541259765625, -9.0029296875, -8.6517333984375, -8.300537109375, -7.9493408203125, -7.59814453125, -7.2469482421875, -6.895751953125, -6.5445556640625, -6.193359375, -5.8421630859375, -5.490966796875, -5.1397705078125, -4.78857421875, -4.4373779296875, -4.086181640625, -3.7349853515625, -3.3837890625, -3.0325927734375, -2.681396484375, -2.3302001953125, -1.97900390625, -1.6278076171875, -1.276611328125, -0.9254150390625, -0.57421875, -0.2230224609375, 0.128173828125, 0.4793701171875, 0.83056640625, 1.1817626953125, 1.532958984375, 1.8841552734375, 2.2353515625, 2.5865478515625, 2.937744140625, 3.2889404296875, 3.64013671875, 3.9913330078125, 4.342529296875, 4.6937255859375, 5.044921875, 5.3961181640625, 5.747314453125, 6.0985107421875, 6.44970703125, 6.8009033203125, 7.152099609375, 7.5032958984375, 7.8544921875, 8.2056884765625, 8.556884765625, 8.9080810546875, 9.25927734375, 9.6104736328125, 9.961669921875, 10.3128662109375, 10.6640625]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 3.0, 9.0, 2.0, 7.0, 4.0, 9.0, 10.0, 13.0, 15.0, 26.0, 28.0, 44.0, 40.0, 49.0, 69.0, 53.0, 86.0, 120.0, 117.0, 143.0, 159.0, 162.0, 197.0, 220.0, 213.0, 229.0, 227.0, 231.0, 205.0, 205.0, 185.0, 141.0, 160.0, 130.0, 91.0, 100.0, 68.0, 67.0, 54.0, 40.0, 35.0, 25.0, 18.0, 21.0, 16.0, 9.0, 6.0, 3.0, 7.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-3.423828125, -3.32342529296875, -3.2230224609375, -3.12261962890625, -3.022216796875, -2.92181396484375, -2.8214111328125, -2.72100830078125, -2.62060546875, -2.52020263671875, -2.4197998046875, -2.31939697265625, -2.218994140625, -2.11859130859375, -2.0181884765625, -1.91778564453125, -1.8173828125, -1.71697998046875, -1.6165771484375, -1.51617431640625, -1.415771484375, -1.31536865234375, -1.2149658203125, -1.11456298828125, -1.01416015625, -0.91375732421875, -0.8133544921875, -0.71295166015625, -0.612548828125, -0.51214599609375, -0.4117431640625, -0.31134033203125, -0.2109375, -0.11053466796875, -0.0101318359375, 0.09027099609375, 0.190673828125, 0.29107666015625, 0.3914794921875, 0.49188232421875, 0.59228515625, 0.69268798828125, 0.7930908203125, 0.89349365234375, 0.993896484375, 1.09429931640625, 1.1947021484375, 1.29510498046875, 1.3955078125, 1.49591064453125, 1.5963134765625, 1.69671630859375, 1.797119140625, 1.89752197265625, 1.9979248046875, 2.09832763671875, 2.19873046875, 2.29913330078125, 2.3995361328125, 2.49993896484375, 2.600341796875, 2.70074462890625, 2.8011474609375, 2.90155029296875, 3.001953125]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 6.0, 11.0, 10.0, 13.0, 18.0, 31.0, 29.0, 37.0, 28.0, 44.0, 55.0, 54.0, 64.0, 49.0, 68.0, 64.0, 70.0, 60.0, 57.0, 42.0, 26.0, 39.0, 29.0, 24.0, 22.0, 8.0, 6.0, 13.0, 6.0, 9.0, 6.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.199715614318848, -14.759828567504883, -14.319940567016602, -13.880053520202637, -13.440166473388672, -13.00027847290039, -12.560391426086426, -12.120504379272461, -11.68061637878418, -11.240729331970215, -10.800841331481934, -10.360954284667969, -9.921066284179688, -9.481179237365723, -9.041292190551758, -8.601404190063477, -8.161517143249512, -7.721629619598389, -7.281742095947266, -6.841855049133301, -6.401967525482178, -5.962080001831055, -5.52219295501709, -5.082305431365967, -4.642417907714844, -4.202530384063721, -3.7626430988311768, -3.322755813598633, -2.8828682899475098, -2.4429807662963867, -2.0030934810638428, -1.5632061958312988, -1.1233186721801758, -0.6834312677383423, -0.2435438632965088, 0.1963435411453247, 0.6362309455871582, 1.0761184692382812, 1.5160057544708252, 1.9558930397033691, 2.395780563354492, 2.8356680870056152, 3.275555372238159, 3.715442657470703, 4.155330181121826, 4.595217704772949, 5.035104751586914, 5.474992275238037, 5.91487979888916, 6.354767322540283, 6.794654846191406, 7.234541893005371, 7.674429416656494, 8.114316940307617, 8.554203987121582, 8.994091033935547, 9.433979034423828, 9.873866081237793, 10.313754081726074, 10.753641128540039, 11.19352912902832, 11.633416175842285, 12.07330322265625, 12.513191223144531, 12.953078269958496]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 8.0, 5.0, 10.0, 6.0, 8.0, 12.0, 19.0, 18.0, 15.0, 23.0, 22.0, 40.0, 27.0, 27.0, 43.0, 32.0, 48.0, 30.0, 45.0, 46.0, 43.0, 48.0, 52.0, 30.0, 38.0, 33.0, 28.0, 29.0, 30.0, 36.0, 21.0, 18.0, 21.0, 13.0, 9.0, 16.0, 17.0, 8.0, 10.0, 4.0, 5.0, 4.0, 5.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.122658729553223, -6.888278484344482, -6.653898239135742, -6.419517993927002, -6.185137748718262, -5.9507575035095215, -5.716377258300781, -5.481997013092041, -5.247616767883301, -5.0132365226745605, -4.77885627746582, -4.54447603225708, -4.31009578704834, -4.0757155418396, -3.8413352966308594, -3.606955051422119, -3.372574806213379, -3.1381945610046387, -2.9038143157958984, -2.669434070587158, -2.435053825378418, -2.2006735801696777, -1.9662933349609375, -1.7319130897521973, -1.497532844543457, -1.2631525993347168, -1.0287723541259766, -0.7943921089172363, -0.5600118637084961, -0.32563161849975586, -0.09125137329101562, 0.1431288719177246, 0.37750911712646484, 0.6118893623352051, 0.8462696075439453, 1.0806498527526855, 1.3150300979614258, 1.549410343170166, 1.7837905883789062, 2.0181708335876465, 2.2525510787963867, 2.486931324005127, 2.721311569213867, 2.9556918144226074, 3.1900720596313477, 3.424452304840088, 3.658832550048828, 3.8932127952575684, 4.127593040466309, 4.361973285675049, 4.596353530883789, 4.830733776092529, 5.0651140213012695, 5.29949426651001, 5.53387451171875, 5.76825475692749, 6.0026350021362305, 6.237015247344971, 6.471395492553711, 6.705775737762451, 6.940155982971191, 7.174536228179932, 7.408916473388672, 7.643296718597412, 7.877676963806152]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 5.0, 2.0, 6.0, 6.0, 11.0, 15.0, 13.0, 27.0, 23.0, 48.0, 77.0, 123.0, 173.0, 253.0, 374.0, 615.0, 928.0, 1450.0, 2358.0, 4010.0, 6708.0, 11653.0, 20363.0, 35722.0, 62003.0, 102800.0, 151774.0, 181898.0, 166256.0, 120345.0, 74851.0, 43787.0, 25109.0, 14227.0, 8214.0, 4663.0, 2807.0, 1746.0, 1086.0, 744.0, 435.0, 279.0, 170.0, 131.0, 81.0, 62.0, 43.0, 35.0, 14.0, 11.0, 15.0, 2.0, 8.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0], "bins": [-4.8515625, -4.69342041015625, -4.5352783203125, -4.37713623046875, -4.218994140625, -4.06085205078125, -3.9027099609375, -3.74456787109375, -3.58642578125, -3.42828369140625, -3.2701416015625, -3.11199951171875, -2.953857421875, -2.79571533203125, -2.6375732421875, -2.47943115234375, -2.3212890625, -2.16314697265625, -2.0050048828125, -1.84686279296875, -1.688720703125, -1.53057861328125, -1.3724365234375, -1.21429443359375, -1.05615234375, -0.89801025390625, -0.7398681640625, -0.58172607421875, -0.423583984375, -0.26544189453125, -0.1072998046875, 0.05084228515625, 0.208984375, 0.36712646484375, 0.5252685546875, 0.68341064453125, 0.841552734375, 0.99969482421875, 1.1578369140625, 1.31597900390625, 1.47412109375, 1.63226318359375, 1.7904052734375, 1.94854736328125, 2.106689453125, 2.26483154296875, 2.4229736328125, 2.58111572265625, 2.7392578125, 2.89739990234375, 3.0555419921875, 3.21368408203125, 3.371826171875, 3.52996826171875, 3.6881103515625, 3.84625244140625, 4.00439453125, 4.16253662109375, 4.3206787109375, 4.47882080078125, 4.636962890625, 4.79510498046875, 4.9532470703125, 5.11138916015625, 5.26953125]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 1.0, 6.0, 5.0, 4.0, 6.0, 9.0, 8.0, 11.0, 21.0, 23.0, 20.0, 24.0, 31.0, 24.0, 30.0, 29.0, 42.0, 40.0, 38.0, 42.0, 43.0, 42.0, 41.0, 46.0, 35.0, 42.0, 38.0, 46.0, 25.0, 30.0, 23.0, 29.0, 23.0, 21.0, 18.0, 29.0, 15.0, 8.0, 10.0, 6.0, 3.0, 4.0, 2.0, 2.0, 6.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.359375, -8.08935546875, -7.8193359375, -7.54931640625, -7.279296875, -7.00927734375, -6.7392578125, -6.46923828125, -6.19921875, -5.92919921875, -5.6591796875, -5.38916015625, -5.119140625, -4.84912109375, -4.5791015625, -4.30908203125, -4.0390625, -3.76904296875, -3.4990234375, -3.22900390625, -2.958984375, -2.68896484375, -2.4189453125, -2.14892578125, -1.87890625, -1.60888671875, -1.3388671875, -1.06884765625, -0.798828125, -0.52880859375, -0.2587890625, 0.01123046875, 0.28125, 0.55126953125, 0.8212890625, 1.09130859375, 1.361328125, 1.63134765625, 1.9013671875, 2.17138671875, 2.44140625, 2.71142578125, 2.9814453125, 3.25146484375, 3.521484375, 3.79150390625, 4.0615234375, 4.33154296875, 4.6015625, 4.87158203125, 5.1416015625, 5.41162109375, 5.681640625, 5.95166015625, 6.2216796875, 6.49169921875, 6.76171875, 7.03173828125, 7.3017578125, 7.57177734375, 7.841796875, 8.11181640625, 8.3818359375, 8.65185546875, 8.921875]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 4.0, 3.0, 2.0, 11.0, 7.0, 18.0, 23.0, 36.0, 44.0, 56.0, 92.0, 151.0, 229.0, 378.0, 663.0, 1161.0, 2211.0, 4244.0, 9483.0, 22390.0, 57744.0, 151111.0, 314725.0, 280674.0, 122559.0, 46408.0, 18313.0, 7766.0, 3694.0, 1801.0, 951.0, 583.0, 359.0, 234.0, 146.0, 103.0, 54.0, 35.0, 23.0, 19.0, 12.0, 16.0, 10.0, 6.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.3359375, -9.0235595703125, -8.711181640625, -8.3988037109375, -8.08642578125, -7.7740478515625, -7.461669921875, -7.1492919921875, -6.8369140625, -6.5245361328125, -6.212158203125, -5.8997802734375, -5.58740234375, -5.2750244140625, -4.962646484375, -4.6502685546875, -4.337890625, -4.0255126953125, -3.713134765625, -3.4007568359375, -3.08837890625, -2.7760009765625, -2.463623046875, -2.1512451171875, -1.8388671875, -1.5264892578125, -1.214111328125, -0.9017333984375, -0.58935546875, -0.2769775390625, 0.035400390625, 0.3477783203125, 0.66015625, 0.9725341796875, 1.284912109375, 1.5972900390625, 1.90966796875, 2.2220458984375, 2.534423828125, 2.8468017578125, 3.1591796875, 3.4715576171875, 3.783935546875, 4.0963134765625, 4.40869140625, 4.7210693359375, 5.033447265625, 5.3458251953125, 5.658203125, 5.9705810546875, 6.282958984375, 6.5953369140625, 6.90771484375, 7.2200927734375, 7.532470703125, 7.8448486328125, 8.1572265625, 8.4696044921875, 8.781982421875, 9.0943603515625, 9.40673828125, 9.7191162109375, 10.031494140625, 10.3438720703125, 10.65625]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 5.0, 4.0, 6.0, 8.0, 1.0, 11.0, 18.0, 12.0, 18.0, 19.0, 24.0, 24.0, 27.0, 33.0, 37.0, 28.0, 28.0, 38.0, 44.0, 37.0, 40.0, 46.0, 42.0, 44.0, 40.0, 41.0, 31.0, 33.0, 31.0, 28.0, 32.0, 24.0, 19.0, 18.0, 15.0, 11.0, 11.0, 14.0, 18.0, 11.0, 8.0, 6.0, 7.0, 3.0, 3.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.37890625, -4.22601318359375, -4.0731201171875, -3.92022705078125, -3.767333984375, -3.61444091796875, -3.4615478515625, -3.30865478515625, -3.15576171875, -3.00286865234375, -2.8499755859375, -2.69708251953125, -2.544189453125, -2.39129638671875, -2.2384033203125, -2.08551025390625, -1.9326171875, -1.77972412109375, -1.6268310546875, -1.47393798828125, -1.321044921875, -1.16815185546875, -1.0152587890625, -0.86236572265625, -0.70947265625, -0.55657958984375, -0.4036865234375, -0.25079345703125, -0.097900390625, 0.05499267578125, 0.2078857421875, 0.36077880859375, 0.513671875, 0.66656494140625, 0.8194580078125, 0.97235107421875, 1.125244140625, 1.27813720703125, 1.4310302734375, 1.58392333984375, 1.73681640625, 1.88970947265625, 2.0426025390625, 2.19549560546875, 2.348388671875, 2.50128173828125, 2.6541748046875, 2.80706787109375, 2.9599609375, 3.11285400390625, 3.2657470703125, 3.41864013671875, 3.571533203125, 3.72442626953125, 3.8773193359375, 4.03021240234375, 4.18310546875, 4.33599853515625, 4.4888916015625, 4.64178466796875, 4.794677734375, 4.94757080078125, 5.1004638671875, 5.25335693359375, 5.40625]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 9.0, 5.0, 8.0, 9.0, 19.0, 16.0, 35.0, 49.0, 78.0, 127.0, 198.0, 307.0, 514.0, 817.0, 1408.0, 2479.0, 4874.0, 9379.0, 19312.0, 40479.0, 88094.0, 184481.0, 284976.0, 211880.0, 104394.0, 48074.0, 23119.0, 10976.0, 5483.0, 2909.0, 1653.0, 922.0, 539.0, 355.0, 223.0, 130.0, 87.0, 40.0, 37.0, 38.0, 17.0, 8.0, 5.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.9609375, -3.8394775390625, -3.718017578125, -3.5965576171875, -3.47509765625, -3.3536376953125, -3.232177734375, -3.1107177734375, -2.9892578125, -2.8677978515625, -2.746337890625, -2.6248779296875, -2.50341796875, -2.3819580078125, -2.260498046875, -2.1390380859375, -2.017578125, -1.8961181640625, -1.774658203125, -1.6531982421875, -1.53173828125, -1.4102783203125, -1.288818359375, -1.1673583984375, -1.0458984375, -0.9244384765625, -0.802978515625, -0.6815185546875, -0.56005859375, -0.4385986328125, -0.317138671875, -0.1956787109375, -0.07421875, 0.0472412109375, 0.168701171875, 0.2901611328125, 0.41162109375, 0.5330810546875, 0.654541015625, 0.7760009765625, 0.8974609375, 1.0189208984375, 1.140380859375, 1.2618408203125, 1.38330078125, 1.5047607421875, 1.626220703125, 1.7476806640625, 1.869140625, 1.9906005859375, 2.112060546875, 2.2335205078125, 2.35498046875, 2.4764404296875, 2.597900390625, 2.7193603515625, 2.8408203125, 2.9622802734375, 3.083740234375, 3.2052001953125, 3.32666015625, 3.4481201171875, 3.569580078125, 3.6910400390625, 3.8125]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 5.0, 5.0, 5.0, 2.0, 4.0, 5.0, 7.0, 11.0, 15.0, 16.0, 23.0, 28.0, 22.0, 31.0, 35.0, 54.0, 40.0, 52.0, 74.0, 57.0, 53.0, 58.0, 44.0, 61.0, 40.0, 60.0, 39.0, 34.0, 19.0, 22.0, 12.0, 14.0, 11.0, 11.0, 15.0, 7.0, 7.0, 4.0, 3.0, 0.0, 0.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013303756713867188, -0.00012862682342529297, -0.00012421607971191406, -0.00011980533599853516, -0.00011539459228515625, -0.00011098384857177734, -0.00010657310485839844, -0.00010216236114501953, -9.775161743164062e-05, -9.334087371826172e-05, -8.893013000488281e-05, -8.45193862915039e-05, -8.0108642578125e-05, -7.56978988647461e-05, -7.128715515136719e-05, -6.687641143798828e-05, -6.246566772460938e-05, -5.805492401123047e-05, -5.364418029785156e-05, -4.9233436584472656e-05, -4.482269287109375e-05, -4.0411949157714844e-05, -3.600120544433594e-05, -3.159046173095703e-05, -2.7179718017578125e-05, -2.276897430419922e-05, -1.8358230590820312e-05, -1.3947486877441406e-05, -9.5367431640625e-06, -5.125999450683594e-06, -7.152557373046875e-07, 3.6954879760742188e-06, 8.106231689453125e-06, 1.2516975402832031e-05, 1.6927719116210938e-05, 2.1338462829589844e-05, 2.574920654296875e-05, 3.0159950256347656e-05, 3.457069396972656e-05, 3.898143768310547e-05, 4.3392181396484375e-05, 4.780292510986328e-05, 5.221366882324219e-05, 5.6624412536621094e-05, 6.103515625e-05, 6.54458999633789e-05, 6.985664367675781e-05, 7.426738739013672e-05, 7.867813110351562e-05, 8.308887481689453e-05, 8.749961853027344e-05, 9.191036224365234e-05, 9.632110595703125e-05, 0.00010073184967041016, 0.00010514259338378906, 0.00010955333709716797, 0.00011396408081054688, 0.00011837482452392578, 0.0001227855682373047, 0.0001271963119506836, 0.0001316070556640625, 0.0001360177993774414, 0.0001404285430908203, 0.00014483928680419922, 0.00014925003051757812]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 5.0, 4.0, 9.0, 12.0, 11.0, 26.0, 24.0, 34.0, 65.0, 101.0, 146.0, 250.0, 360.0, 565.0, 903.0, 1294.0, 2109.0, 3504.0, 5685.0, 9311.0, 15340.0, 25579.0, 41488.0, 65863.0, 98013.0, 132125.0, 152696.0, 147152.0, 119047.0, 84091.0, 55039.0, 34069.0, 20789.0, 12540.0, 7767.0, 4750.0, 2860.0, 1809.0, 1095.0, 694.0, 475.0, 270.0, 231.0, 110.0, 92.0, 52.0, 34.0, 27.0, 11.0, 20.0, 10.0, 5.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.087890625, -2.017822265625, -1.94775390625, -1.877685546875, -1.8076171875, -1.737548828125, -1.66748046875, -1.597412109375, -1.52734375, -1.457275390625, -1.38720703125, -1.317138671875, -1.2470703125, -1.177001953125, -1.10693359375, -1.036865234375, -0.966796875, -0.896728515625, -0.82666015625, -0.756591796875, -0.6865234375, -0.616455078125, -0.54638671875, -0.476318359375, -0.40625, -0.336181640625, -0.26611328125, -0.196044921875, -0.1259765625, -0.055908203125, 0.01416015625, 0.084228515625, 0.154296875, 0.224365234375, 0.29443359375, 0.364501953125, 0.4345703125, 0.504638671875, 0.57470703125, 0.644775390625, 0.71484375, 0.784912109375, 0.85498046875, 0.925048828125, 0.9951171875, 1.065185546875, 1.13525390625, 1.205322265625, 1.275390625, 1.345458984375, 1.41552734375, 1.485595703125, 1.5556640625, 1.625732421875, 1.69580078125, 1.765869140625, 1.8359375, 1.906005859375, 1.97607421875, 2.046142578125, 2.1162109375, 2.186279296875, 2.25634765625, 2.326416015625, 2.396484375]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 6.0, 5.0, 11.0, 14.0, 14.0, 14.0, 19.0, 22.0, 27.0, 26.0, 27.0, 29.0, 41.0, 62.0, 57.0, 52.0, 45.0, 61.0, 51.0, 61.0, 40.0, 54.0, 47.0, 39.0, 31.0, 29.0, 24.0, 16.0, 18.0, 15.0, 7.0, 6.0, 7.0, 6.0, 3.0, 5.0, 2.0, 3.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.62744140625, -0.6031723022460938, -0.5789031982421875, -0.5546340942382812, -0.530364990234375, -0.5060958862304688, -0.4818267822265625, -0.45755767822265625, -0.43328857421875, -0.40901947021484375, -0.3847503662109375, -0.36048126220703125, -0.336212158203125, -0.31194305419921875, -0.2876739501953125, -0.26340484619140625, -0.2391357421875, -0.21486663818359375, -0.1905975341796875, -0.16632843017578125, -0.142059326171875, -0.11779022216796875, -0.0935211181640625, -0.06925201416015625, -0.04498291015625, -0.02071380615234375, 0.0035552978515625, 0.02782440185546875, 0.052093505859375, 0.07636260986328125, 0.1006317138671875, 0.12490081787109375, 0.149169921875, 0.17343902587890625, 0.1977081298828125, 0.22197723388671875, 0.246246337890625, 0.27051544189453125, 0.2947845458984375, 0.31905364990234375, 0.34332275390625, 0.36759185791015625, 0.3918609619140625, 0.41613006591796875, 0.440399169921875, 0.46466827392578125, 0.4889373779296875, 0.5132064819335938, 0.5374755859375, 0.5617446899414062, 0.5860137939453125, 0.6102828979492188, 0.634552001953125, 0.6588211059570312, 0.6830902099609375, 0.7073593139648438, 0.73162841796875, 0.7558975219726562, 0.7801666259765625, 0.8044357299804688, 0.828704833984375, 0.8529739379882812, 0.8772430419921875, 0.9015121459960938, 0.92578125]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 5.0, 5.0, 2.0, 8.0, 11.0, 8.0, 16.0, 27.0, 28.0, 34.0, 27.0, 48.0, 56.0, 46.0, 56.0, 52.0, 67.0, 62.0, 66.0, 64.0, 53.0, 43.0, 53.0, 23.0, 33.0, 27.0, 22.0, 16.0, 11.0, 9.0, 9.0, 7.0, 6.0, 4.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.681556701660156, -14.2484130859375, -13.815269470214844, -13.382125854492188, -12.948982238769531, -12.515838623046875, -12.082695007324219, -11.649552345275879, -11.216408729553223, -10.783265113830566, -10.35012149810791, -9.916977882385254, -9.483834266662598, -9.050691604614258, -8.617547988891602, -8.184404373168945, -7.751260280609131, -7.318116664886475, -6.884973049163818, -6.45182991027832, -6.018686294555664, -5.585542678833008, -5.152399063110352, -4.719255447387695, -4.286111831665039, -3.852968215942383, -3.4198248386383057, -2.9866812229156494, -2.5535378456115723, -2.120394229888916, -1.6872506141662598, -1.2541072368621826, -0.8209638595581055, -0.3878203332424164, 0.045323193073272705, 0.4784667491912842, 0.9116102457046509, 1.3447537422180176, 1.7778973579406738, 2.211040735244751, 2.6441843509674072, 3.0773279666900635, 3.5104713439941406, 3.943614959716797, 4.376758575439453, 4.809902191162109, 5.243045806884766, 5.676188945770264, 6.10933256149292, 6.542476177215576, 6.975619792938232, 7.4087629318237305, 7.841906547546387, 8.275050163269043, 8.7081937789917, 9.141337394714355, 9.574481010437012, 10.007624626159668, 10.440768241882324, 10.87391185760498, 11.307055473327637, 11.740198135375977, 12.173341751098633, 12.606485366821289, 13.039628982543945]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 5.0, 6.0, 7.0, 11.0, 5.0, 7.0, 17.0, 12.0, 18.0, 15.0, 25.0, 17.0, 36.0, 31.0, 33.0, 37.0, 44.0, 36.0, 34.0, 40.0, 46.0, 39.0, 50.0, 48.0, 28.0, 46.0, 30.0, 31.0, 28.0, 31.0, 31.0, 25.0, 18.0, 20.0, 13.0, 15.0, 8.0, 17.0, 14.0, 12.0, 4.0, 4.0, 3.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.930598735809326, -6.703717231750488, -6.476836204528809, -6.249954700469971, -6.023073196411133, -5.796192169189453, -5.569310665130615, -5.342429161071777, -5.115548133850098, -4.88866662979126, -4.66178560256958, -4.434904098510742, -4.2080230712890625, -3.9811415672302246, -3.7542600631713867, -3.527378797531128, -3.300497531890869, -3.0736162662506104, -2.8467350006103516, -2.6198534965515137, -2.392972230911255, -2.166090965270996, -1.9392095804214478, -1.7123281955718994, -1.4854469299316406, -1.2585656642913818, -1.0316842794418335, -0.8048029541969299, -0.5779216289520264, -0.3510403633117676, -0.12415897846221924, 0.1027224063873291, 0.3296041488647461, 0.5564854741096497, 0.7833667993545532, 1.0102481842041016, 1.2371294498443604, 1.4640107154846191, 1.6908921003341675, 1.9177734851837158, 2.1446547508239746, 2.3715360164642334, 2.598417282104492, 2.82529878616333, 3.052180051803589, 3.2790613174438477, 3.5059428215026855, 3.7328240871429443, 3.959705352783203, 4.186586856842041, 4.413467884063721, 4.640349388122559, 4.867230415344238, 5.094111919403076, 5.320993423461914, 5.547874450683594, 5.774755954742432, 6.0016374588012695, 6.228518486022949, 6.455399990081787, 6.682281494140625, 6.909162521362305, 7.136044025421143, 7.3629255294799805, 7.58980655670166]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 6.0, 3.0, 5.0, 4.0, 10.0, 10.0, 22.0, 19.0, 38.0, 49.0, 80.0, 93.0, 194.0, 311.0, 481.0, 788.0, 1412.0, 2529.0, 4702.0, 9058.0, 17576.0, 33667.0, 65040.0, 116735.0, 181322.0, 208403.0, 172282.0, 109402.0, 59499.0, 30620.0, 15884.0, 8203.0, 4361.0, 2441.0, 1376.0, 733.0, 454.0, 274.0, 169.0, 94.0, 73.0, 46.0, 37.0, 21.0, 11.0, 7.0, 5.0, 10.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.4453125, -12.0224609375, -11.599609375, -11.1767578125, -10.75390625, -10.3310546875, -9.908203125, -9.4853515625, -9.0625, -8.6396484375, -8.216796875, -7.7939453125, -7.37109375, -6.9482421875, -6.525390625, -6.1025390625, -5.6796875, -5.2568359375, -4.833984375, -4.4111328125, -3.98828125, -3.5654296875, -3.142578125, -2.7197265625, -2.296875, -1.8740234375, -1.451171875, -1.0283203125, -0.60546875, -0.1826171875, 0.240234375, 0.6630859375, 1.0859375, 1.5087890625, 1.931640625, 2.3544921875, 2.77734375, 3.2001953125, 3.623046875, 4.0458984375, 4.46875, 4.8916015625, 5.314453125, 5.7373046875, 6.16015625, 6.5830078125, 7.005859375, 7.4287109375, 7.8515625, 8.2744140625, 8.697265625, 9.1201171875, 9.54296875, 9.9658203125, 10.388671875, 10.8115234375, 11.234375, 11.6572265625, 12.080078125, 12.5029296875, 12.92578125, 13.3486328125, 13.771484375, 14.1943359375, 14.6171875]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 6.0, 3.0, 5.0, 6.0, 9.0, 9.0, 16.0, 13.0, 14.0, 14.0, 17.0, 28.0, 35.0, 27.0, 27.0, 33.0, 33.0, 30.0, 27.0, 37.0, 39.0, 37.0, 41.0, 36.0, 34.0, 38.0, 42.0, 36.0, 38.0, 29.0, 25.0, 20.0, 25.0, 25.0, 25.0, 18.0, 16.0, 11.0, 11.0, 13.0, 6.0, 13.0, 9.0, 4.0, 6.0, 3.0, 4.0, 5.0, 2.0, 5.0, 2.0, 0.0, 3.0], "bins": [-7.8515625, -7.6197509765625, -7.387939453125, -7.1561279296875, -6.92431640625, -6.6925048828125, -6.460693359375, -6.2288818359375, -5.9970703125, -5.7652587890625, -5.533447265625, -5.3016357421875, -5.06982421875, -4.8380126953125, -4.606201171875, -4.3743896484375, -4.142578125, -3.9107666015625, -3.678955078125, -3.4471435546875, -3.21533203125, -2.9835205078125, -2.751708984375, -2.5198974609375, -2.2880859375, -2.0562744140625, -1.824462890625, -1.5926513671875, -1.36083984375, -1.1290283203125, -0.897216796875, -0.6654052734375, -0.43359375, -0.2017822265625, 0.030029296875, 0.2618408203125, 0.49365234375, 0.7254638671875, 0.957275390625, 1.1890869140625, 1.4208984375, 1.6527099609375, 1.884521484375, 2.1163330078125, 2.34814453125, 2.5799560546875, 2.811767578125, 3.0435791015625, 3.275390625, 3.5072021484375, 3.739013671875, 3.9708251953125, 4.20263671875, 4.4344482421875, 4.666259765625, 4.8980712890625, 5.1298828125, 5.3616943359375, 5.593505859375, 5.8253173828125, 6.05712890625, 6.2889404296875, 6.520751953125, 6.7525634765625, 6.984375]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 9.0, 8.0, 10.0, 22.0, 18.0, 35.0, 55.0, 81.0, 128.0, 203.0, 287.0, 428.0, 747.0, 1181.0, 1803.0, 2869.0, 4695.0, 7672.0, 12534.0, 20389.0, 32999.0, 54269.0, 84435.0, 122249.0, 153612.0, 158281.0, 132701.0, 95036.0, 62270.0, 38785.0, 23481.0, 14244.0, 8773.0, 5316.0, 3322.0, 2041.0, 1305.0, 758.0, 551.0, 348.0, 209.0, 115.0, 105.0, 69.0, 42.0, 22.0, 23.0, 9.0, 10.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.8125, -9.4974365234375, -9.182373046875, -8.8673095703125, -8.55224609375, -8.2371826171875, -7.922119140625, -7.6070556640625, -7.2919921875, -6.9769287109375, -6.661865234375, -6.3468017578125, -6.03173828125, -5.7166748046875, -5.401611328125, -5.0865478515625, -4.771484375, -4.4564208984375, -4.141357421875, -3.8262939453125, -3.51123046875, -3.1961669921875, -2.881103515625, -2.5660400390625, -2.2509765625, -1.9359130859375, -1.620849609375, -1.3057861328125, -0.99072265625, -0.6756591796875, -0.360595703125, -0.0455322265625, 0.26953125, 0.5845947265625, 0.899658203125, 1.2147216796875, 1.52978515625, 1.8448486328125, 2.159912109375, 2.4749755859375, 2.7900390625, 3.1051025390625, 3.420166015625, 3.7352294921875, 4.05029296875, 4.3653564453125, 4.680419921875, 4.9954833984375, 5.310546875, 5.6256103515625, 5.940673828125, 6.2557373046875, 6.57080078125, 6.8858642578125, 7.200927734375, 7.5159912109375, 7.8310546875, 8.1461181640625, 8.461181640625, 8.7762451171875, 9.09130859375, 9.4063720703125, 9.721435546875, 10.0364990234375, 10.3515625]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 3.0, 3.0, 2.0, 8.0, 5.0, 10.0, 6.0, 5.0, 19.0, 18.0, 20.0, 26.0, 24.0, 30.0, 46.0, 34.0, 39.0, 52.0, 46.0, 47.0, 54.0, 52.0, 40.0, 40.0, 43.0, 42.0, 40.0, 31.0, 26.0, 18.0, 27.0, 31.0, 18.0, 20.0, 16.0, 19.0, 11.0, 7.0, 9.0, 7.0, 2.0, 3.0, 3.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.31640625, -5.13665771484375, -4.9569091796875, -4.77716064453125, -4.597412109375, -4.41766357421875, -4.2379150390625, -4.05816650390625, -3.87841796875, -3.69866943359375, -3.5189208984375, -3.33917236328125, -3.159423828125, -2.97967529296875, -2.7999267578125, -2.62017822265625, -2.4404296875, -2.26068115234375, -2.0809326171875, -1.90118408203125, -1.721435546875, -1.54168701171875, -1.3619384765625, -1.18218994140625, -1.00244140625, -0.82269287109375, -0.6429443359375, -0.46319580078125, -0.283447265625, -0.10369873046875, 0.0760498046875, 0.25579833984375, 0.435546875, 0.61529541015625, 0.7950439453125, 0.97479248046875, 1.154541015625, 1.33428955078125, 1.5140380859375, 1.69378662109375, 1.87353515625, 2.05328369140625, 2.2330322265625, 2.41278076171875, 2.592529296875, 2.77227783203125, 2.9520263671875, 3.13177490234375, 3.3115234375, 3.49127197265625, 3.6710205078125, 3.85076904296875, 4.030517578125, 4.21026611328125, 4.3900146484375, 4.56976318359375, 4.74951171875, 4.92926025390625, 5.1090087890625, 5.28875732421875, 5.468505859375, 5.64825439453125, 5.8280029296875, 6.00775146484375, 6.1875]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 5.0, 4.0, 13.0, 12.0, 14.0, 15.0, 31.0, 43.0, 77.0, 114.0, 143.0, 220.0, 313.0, 491.0, 668.0, 994.0, 1463.0, 2106.0, 3432.0, 5189.0, 8122.0, 13602.0, 23557.0, 42698.0, 86814.0, 188916.0, 284448.0, 191806.0, 88477.0, 43775.0, 23678.0, 13768.0, 8239.0, 5236.0, 3279.0, 2188.0, 1417.0, 1034.0, 711.0, 433.0, 324.0, 229.0, 139.0, 99.0, 72.0, 50.0, 49.0, 19.0, 19.0, 10.0, 8.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.8046875, -10.4505615234375, -10.096435546875, -9.7423095703125, -9.38818359375, -9.0340576171875, -8.679931640625, -8.3258056640625, -7.9716796875, -7.6175537109375, -7.263427734375, -6.9093017578125, -6.55517578125, -6.2010498046875, -5.846923828125, -5.4927978515625, -5.138671875, -4.7845458984375, -4.430419921875, -4.0762939453125, -3.72216796875, -3.3680419921875, -3.013916015625, -2.6597900390625, -2.3056640625, -1.9515380859375, -1.597412109375, -1.2432861328125, -0.88916015625, -0.5350341796875, -0.180908203125, 0.1732177734375, 0.52734375, 0.8814697265625, 1.235595703125, 1.5897216796875, 1.94384765625, 2.2979736328125, 2.652099609375, 3.0062255859375, 3.3603515625, 3.7144775390625, 4.068603515625, 4.4227294921875, 4.77685546875, 5.1309814453125, 5.485107421875, 5.8392333984375, 6.193359375, 6.5474853515625, 6.901611328125, 7.2557373046875, 7.60986328125, 7.9639892578125, 8.318115234375, 8.6722412109375, 9.0263671875, 9.3804931640625, 9.734619140625, 10.0887451171875, 10.44287109375, 10.7969970703125, 11.151123046875, 11.5052490234375, 11.859375]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 2.0, 11.0, 6.0, 6.0, 7.0, 5.0, 7.0, 18.0, 14.0, 25.0, 34.0, 48.0, 78.0, 86.0, 103.0, 103.0, 110.0, 73.0, 58.0, 52.0, 28.0, 20.0, 22.0, 12.0, 14.0, 10.0, 8.0, 5.0, 9.0, 4.0, 6.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0010395050048828125, -0.0009999126195907593, -0.0009603202342987061, -0.0009207278490066528, -0.0008811354637145996, -0.0008415430784225464, -0.0008019506931304932, -0.0007623583078384399, -0.0007227659225463867, -0.0006831735372543335, -0.0006435811519622803, -0.000603988766670227, -0.0005643963813781738, -0.0005248039960861206, -0.0004852116107940674, -0.00044561922550201416, -0.00040602684020996094, -0.0003664344549179077, -0.0003268420696258545, -0.00028724968433380127, -0.00024765729904174805, -0.00020806491374969482, -0.0001684725284576416, -0.00012888014316558838, -8.928775787353516e-05, -4.9695372581481934e-05, -1.0102987289428711e-05, 2.9489398002624512e-05, 6.908178329467773e-05, 0.00010867416858673096, 0.00014826655387878418, 0.0001878589391708374, 0.00022745132446289062, 0.00026704370975494385, 0.00030663609504699707, 0.0003462284803390503, 0.0003858208656311035, 0.00042541325092315674, 0.00046500563621520996, 0.0005045980215072632, 0.0005441904067993164, 0.0005837827920913696, 0.0006233751773834229, 0.0006629675626754761, 0.0007025599479675293, 0.0007421523332595825, 0.0007817447185516357, 0.000821337103843689, 0.0008609294891357422, 0.0009005218744277954, 0.0009401142597198486, 0.0009797066450119019, 0.001019299030303955, 0.0010588914155960083, 0.0010984838008880615, 0.0011380761861801147, 0.001177668571472168, 0.0012172609567642212, 0.0012568533420562744, 0.0012964457273483276, 0.0013360381126403809, 0.001375630497932434, 0.0014152228832244873, 0.0014548152685165405, 0.0014944076538085938]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 13.0, 6.0, 14.0, 16.0, 40.0, 46.0, 88.0, 124.0, 162.0, 264.0, 380.0, 563.0, 867.0, 1261.0, 1865.0, 2881.0, 4384.0, 6940.0, 10948.0, 18172.0, 30954.0, 56219.0, 104364.0, 185292.0, 232367.0, 171203.0, 95081.0, 50678.0, 28232.0, 16427.0, 10052.0, 6452.0, 4110.0, 2691.0, 1745.0, 1217.0, 838.0, 522.0, 348.0, 220.0, 176.0, 116.0, 67.0, 51.0, 35.0, 16.0, 13.0, 11.0, 12.0, 4.0, 2.0, 4.0, 4.0, 0.0, 3.0, 2.0, 2.0], "bins": [-8.2265625, -7.9647216796875, -7.702880859375, -7.4410400390625, -7.17919921875, -6.9173583984375, -6.655517578125, -6.3936767578125, -6.1318359375, -5.8699951171875, -5.608154296875, -5.3463134765625, -5.08447265625, -4.8226318359375, -4.560791015625, -4.2989501953125, -4.037109375, -3.7752685546875, -3.513427734375, -3.2515869140625, -2.98974609375, -2.7279052734375, -2.466064453125, -2.2042236328125, -1.9423828125, -1.6805419921875, -1.418701171875, -1.1568603515625, -0.89501953125, -0.6331787109375, -0.371337890625, -0.1094970703125, 0.15234375, 0.4141845703125, 0.676025390625, 0.9378662109375, 1.19970703125, 1.4615478515625, 1.723388671875, 1.9852294921875, 2.2470703125, 2.5089111328125, 2.770751953125, 3.0325927734375, 3.29443359375, 3.5562744140625, 3.818115234375, 4.0799560546875, 4.341796875, 4.6036376953125, 4.865478515625, 5.1273193359375, 5.38916015625, 5.6510009765625, 5.912841796875, 6.1746826171875, 6.4365234375, 6.6983642578125, 6.960205078125, 7.2220458984375, 7.48388671875, 7.7457275390625, 8.007568359375, 8.2694091796875, 8.53125]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 2.0, 6.0, 6.0, 5.0, 10.0, 13.0, 12.0, 14.0, 12.0, 18.0, 20.0, 30.0, 40.0, 60.0, 47.0, 85.0, 82.0, 94.0, 73.0, 66.0, 55.0, 55.0, 37.0, 32.0, 25.0, 22.0, 12.0, 10.0, 14.0, 12.0, 4.0, 8.0, 4.0, 3.0, 1.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.560546875, -2.473358154296875, -2.38616943359375, -2.298980712890625, -2.2117919921875, -2.124603271484375, -2.03741455078125, -1.950225830078125, -1.863037109375, -1.775848388671875, -1.68865966796875, -1.601470947265625, -1.5142822265625, -1.427093505859375, -1.33990478515625, -1.252716064453125, -1.16552734375, -1.078338623046875, -0.99114990234375, -0.903961181640625, -0.8167724609375, -0.729583740234375, -0.64239501953125, -0.555206298828125, -0.468017578125, -0.380828857421875, -0.29364013671875, -0.206451416015625, -0.1192626953125, -0.032073974609375, 0.05511474609375, 0.142303466796875, 0.2294921875, 0.316680908203125, 0.40386962890625, 0.491058349609375, 0.5782470703125, 0.665435791015625, 0.75262451171875, 0.839813232421875, 0.927001953125, 1.014190673828125, 1.10137939453125, 1.188568115234375, 1.2757568359375, 1.362945556640625, 1.45013427734375, 1.537322998046875, 1.62451171875, 1.711700439453125, 1.79888916015625, 1.886077880859375, 1.9732666015625, 2.060455322265625, 2.14764404296875, 2.234832763671875, 2.322021484375, 2.409210205078125, 2.49639892578125, 2.583587646484375, 2.6707763671875, 2.757965087890625, 2.84515380859375, 2.932342529296875, 3.01953125]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 4.0, 8.0, 6.0, 9.0, 12.0, 11.0, 22.0, 31.0, 34.0, 34.0, 54.0, 45.0, 48.0, 47.0, 49.0, 60.0, 63.0, 69.0, 60.0, 49.0, 50.0, 44.0, 39.0, 32.0, 16.0, 23.0, 20.0, 19.0, 10.0, 10.0, 8.0, 10.0, 1.0, 4.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.254408836364746, -14.811325073242188, -14.368241310119629, -13.92515754699707, -13.482073783874512, -13.038990020751953, -12.595907211303711, -12.152822494506836, -11.709739685058594, -11.266655921936035, -10.823572158813477, -10.380488395690918, -9.93740463256836, -9.4943208694458, -9.051237106323242, -8.608154296875, -8.165069580078125, -7.721985816955566, -7.278902053833008, -6.835818290710449, -6.392734527587891, -5.949650764465332, -5.506567478179932, -5.063483715057373, -4.6203999519348145, -4.177316188812256, -3.7342324256896973, -3.2911489009857178, -2.848065137863159, -2.4049813747406006, -1.961897850036621, -1.5188140869140625, -1.075730323791504, -0.6326466202735901, -0.18956291675567627, 0.2535207271575928, 0.6966044902801514, 1.13968825340271, 1.5827717781066895, 2.025855541229248, 2.4689393043518066, 2.9120230674743652, 3.355106830596924, 3.7981903553009033, 4.241273880004883, 4.684357643127441, 5.12744140625, 5.570525169372559, 6.013608932495117, 6.456692695617676, 6.899776458740234, 7.342860221862793, 7.785943984985352, 8.22902774810791, 8.672111511230469, 9.115194320678711, 9.558279037475586, 10.001362800598145, 10.444446563720703, 10.887530326843262, 11.33061408996582, 11.773697853088379, 12.216781616210938, 12.65986442565918, 13.102948188781738]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 4.0, 8.0, 10.0, 6.0, 9.0, 13.0, 13.0, 14.0, 16.0, 13.0, 27.0, 19.0, 24.0, 42.0, 29.0, 39.0, 41.0, 44.0, 46.0, 52.0, 41.0, 42.0, 49.0, 40.0, 31.0, 42.0, 35.0, 38.0, 20.0, 24.0, 25.0, 23.0, 19.0, 20.0, 16.0, 12.0, 17.0, 19.0, 5.0, 6.0, 2.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.37808609008789, -8.10845947265625, -7.838833332061768, -7.569207191467285, -7.2995805740356445, -7.029954433441162, -6.76032829284668, -6.490701675415039, -6.221075057983398, -5.951448917388916, -5.681822299957275, -5.412196159362793, -5.142569541931152, -4.87294340133667, -4.6033172607421875, -4.333690643310547, -4.0640645027160645, -3.794438123703003, -3.5248117446899414, -3.255185604095459, -2.9855589866638184, -2.715932846069336, -2.4463064670562744, -2.176680088043213, -1.9070537090301514, -1.6374273300170898, -1.3678009510040283, -1.0981746912002563, -0.8285483121871948, -0.5589219331741333, -0.28929567337036133, -0.019669294357299805, 0.24995708465576172, 0.5195834636688232, 0.78920978307724, 1.0588361024856567, 1.3284624814987183, 1.5980888605117798, 1.8677151203155518, 2.1373414993286133, 2.406967878341675, 2.6765942573547363, 2.946220636367798, 3.2158470153808594, 3.485473155975342, 3.7550997734069824, 4.024725914001465, 4.2943525314331055, 4.563978672027588, 4.83360481262207, 5.103231430053711, 5.372857570648193, 5.642484188079834, 5.912110328674316, 6.181736946105957, 6.4513630867004395, 6.720989227294922, 6.990615367889404, 7.260241985321045, 7.529868125915527, 7.799494743347168, 8.069121360778809, 8.338747024536133, 8.608373641967773, 8.878000259399414]}, "gradients/decoder.bert.encoder.layer.5.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 5.0, 7.0, 6.0, 21.0, 27.0, 24.0, 58.0, 72.0, 99.0, 113.0, 202.0, 283.0, 444.0, 638.0, 1012.0, 1548.0, 2501.0, 3809.0, 6126.0, 10229.0, 16863.0, 29033.0, 50711.0, 90277.0, 164210.0, 297841.0, 522338.0, 769116.0, 818685.0, 602616.0, 354351.0, 195154.0, 107993.0, 60078.0, 34665.0, 20226.0, 12039.0, 7569.0, 4711.0, 2936.0, 2006.0, 1240.0, 813.0, 565.0, 359.0, 236.0, 170.0, 102.0, 58.0, 46.0, 32.0, 15.0, 7.0, 5.0, 2.0, 0.0, 1.0, 2.0], "bins": [-11.7265625, -11.3831787109375, -11.039794921875, -10.6964111328125, -10.35302734375, -10.0096435546875, -9.666259765625, -9.3228759765625, -8.9794921875, -8.6361083984375, -8.292724609375, -7.9493408203125, -7.60595703125, -7.2625732421875, -6.919189453125, -6.5758056640625, -6.232421875, -5.8890380859375, -5.545654296875, -5.2022705078125, -4.85888671875, -4.5155029296875, -4.172119140625, -3.8287353515625, -3.4853515625, -3.1419677734375, -2.798583984375, -2.4552001953125, -2.11181640625, -1.7684326171875, -1.425048828125, -1.0816650390625, -0.73828125, -0.3948974609375, -0.051513671875, 0.2918701171875, 0.63525390625, 0.9786376953125, 1.322021484375, 1.6654052734375, 2.0087890625, 2.3521728515625, 2.695556640625, 3.0389404296875, 3.38232421875, 3.7257080078125, 4.069091796875, 4.4124755859375, 4.755859375, 5.0992431640625, 5.442626953125, 5.7860107421875, 6.12939453125, 6.4727783203125, 6.816162109375, 7.1595458984375, 7.5029296875, 7.8463134765625, 8.189697265625, 8.5330810546875, 8.87646484375, 9.2198486328125, 9.563232421875, 9.9066162109375, 10.25]}, "gradients/decoder.bert.encoder.layer.5.output.dense.bias": {"_type": "histogram", "values": [5.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 2.0, 3.0, 6.0, 3.0, 3.0, 6.0, 13.0, 5.0, 17.0, 18.0, 19.0, 13.0, 18.0, 18.0, 18.0, 40.0, 27.0, 36.0, 34.0, 30.0, 37.0, 37.0, 36.0, 35.0, 45.0, 34.0, 45.0, 37.0, 39.0, 32.0, 27.0, 33.0, 19.0, 32.0, 27.0, 22.0, 19.0, 11.0, 17.0, 19.0, 14.0, 8.0, 13.0, 8.0, 6.0, 8.0, 4.0, 3.0, 2.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-5.578125, -5.40087890625, -5.2236328125, -5.04638671875, -4.869140625, -4.69189453125, -4.5146484375, -4.33740234375, -4.16015625, -3.98291015625, -3.8056640625, -3.62841796875, -3.451171875, -3.27392578125, -3.0966796875, -2.91943359375, -2.7421875, -2.56494140625, -2.3876953125, -2.21044921875, -2.033203125, -1.85595703125, -1.6787109375, -1.50146484375, -1.32421875, -1.14697265625, -0.9697265625, -0.79248046875, -0.615234375, -0.43798828125, -0.2607421875, -0.08349609375, 0.09375, 0.27099609375, 0.4482421875, 0.62548828125, 0.802734375, 0.97998046875, 1.1572265625, 1.33447265625, 1.51171875, 1.68896484375, 1.8662109375, 2.04345703125, 2.220703125, 2.39794921875, 2.5751953125, 2.75244140625, 2.9296875, 3.10693359375, 3.2841796875, 3.46142578125, 3.638671875, 3.81591796875, 3.9931640625, 4.17041015625, 4.34765625, 4.52490234375, 4.7021484375, 4.87939453125, 5.056640625, 5.23388671875, 5.4111328125, 5.58837890625, 5.765625]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 5.0, 12.0, 8.0, 22.0, 32.0, 47.0, 52.0, 84.0, 154.0, 237.0, 365.0, 588.0, 992.0, 1657.0, 2969.0, 5070.0, 9359.0, 17348.0, 32004.0, 61266.0, 116564.0, 220666.0, 399029.0, 650233.0, 835081.0, 746933.0, 492298.0, 281243.0, 150526.0, 79295.0, 41272.0, 21691.0, 11910.0, 6531.0, 3563.0, 1980.0, 1248.0, 713.0, 434.0, 291.0, 174.0, 100.0, 78.0, 47.0, 29.0, 28.0, 18.0, 11.0, 12.0, 1.0, 4.0, 4.0, 3.0, 1.0, 1.0, 4.0, 2.0], "bins": [-13.078125, -12.66552734375, -12.2529296875, -11.84033203125, -11.427734375, -11.01513671875, -10.6025390625, -10.18994140625, -9.77734375, -9.36474609375, -8.9521484375, -8.53955078125, -8.126953125, -7.71435546875, -7.3017578125, -6.88916015625, -6.4765625, -6.06396484375, -5.6513671875, -5.23876953125, -4.826171875, -4.41357421875, -4.0009765625, -3.58837890625, -3.17578125, -2.76318359375, -2.3505859375, -1.93798828125, -1.525390625, -1.11279296875, -0.7001953125, -0.28759765625, 0.125, 0.53759765625, 0.9501953125, 1.36279296875, 1.775390625, 2.18798828125, 2.6005859375, 3.01318359375, 3.42578125, 3.83837890625, 4.2509765625, 4.66357421875, 5.076171875, 5.48876953125, 5.9013671875, 6.31396484375, 6.7265625, 7.13916015625, 7.5517578125, 7.96435546875, 8.376953125, 8.78955078125, 9.2021484375, 9.61474609375, 10.02734375, 10.43994140625, 10.8525390625, 11.26513671875, 11.677734375, 12.09033203125, 12.5029296875, 12.91552734375, 13.328125]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 3.0, 3.0, 2.0, 5.0, 1.0, 2.0, 7.0, 12.0, 17.0, 20.0, 37.0, 50.0, 45.0, 77.0, 81.0, 106.0, 125.0, 177.0, 214.0, 214.0, 264.0, 288.0, 301.0, 303.0, 280.0, 261.0, 216.0, 189.0, 170.0, 142.0, 110.0, 78.0, 68.0, 58.0, 47.0, 44.0, 19.0, 19.0, 7.0, 10.0, 5.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.55078125, -4.40887451171875, -4.2669677734375, -4.12506103515625, -3.983154296875, -3.84124755859375, -3.6993408203125, -3.55743408203125, -3.41552734375, -3.27362060546875, -3.1317138671875, -2.98980712890625, -2.847900390625, -2.70599365234375, -2.5640869140625, -2.42218017578125, -2.2802734375, -2.13836669921875, -1.9964599609375, -1.85455322265625, -1.712646484375, -1.57073974609375, -1.4288330078125, -1.28692626953125, -1.14501953125, -1.00311279296875, -0.8612060546875, -0.71929931640625, -0.577392578125, -0.43548583984375, -0.2935791015625, -0.15167236328125, -0.009765625, 0.13214111328125, 0.2740478515625, 0.41595458984375, 0.557861328125, 0.69976806640625, 0.8416748046875, 0.98358154296875, 1.12548828125, 1.26739501953125, 1.4093017578125, 1.55120849609375, 1.693115234375, 1.83502197265625, 1.9769287109375, 2.11883544921875, 2.2607421875, 2.40264892578125, 2.5445556640625, 2.68646240234375, 2.828369140625, 2.97027587890625, 3.1121826171875, 3.25408935546875, 3.39599609375, 3.53790283203125, 3.6798095703125, 3.82171630859375, 3.963623046875, 4.10552978515625, 4.2474365234375, 4.38934326171875, 4.53125]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 6.0, 3.0, 14.0, 18.0, 14.0, 40.0, 24.0, 29.0, 36.0, 40.0, 41.0, 50.0, 57.0, 53.0, 49.0, 57.0, 60.0, 50.0, 44.0, 56.0, 38.0, 26.0, 41.0, 26.0, 23.0, 21.0, 17.0, 14.0, 8.0, 9.0, 8.0, 4.0, 5.0, 4.0, 5.0, 4.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-12.59409236907959, -12.182097434997559, -11.770103454589844, -11.358108520507812, -10.946114540100098, -10.534119606018066, -10.122125625610352, -9.71013069152832, -9.298135757446289, -8.886140823364258, -8.474146842956543, -8.062151908874512, -7.650157928466797, -7.238162994384766, -6.826168537139893, -6.4141740798950195, -6.002180099487305, -5.590185642242432, -5.178191184997559, -4.766196250915527, -4.3542022705078125, -3.9422075748443604, -3.530212879180908, -3.118218421936035, -2.706223964691162, -2.294229507446289, -1.8822349309921265, -1.4702403545379639, -1.0582458972930908, -0.6462514400482178, -0.23425674438476562, 0.17773771286010742, 0.5897331237792969, 1.00172758102417, 1.4137221574783325, 1.8257167339324951, 2.237711191177368, 2.649705648422241, 3.0617003440856934, 3.4736948013305664, 3.8856892585754395, 4.2976837158203125, 4.7096781730651855, 5.121672630310059, 5.53366756439209, 5.945661544799805, 6.357656478881836, 6.769650936126709, 7.181645393371582, 7.593639850616455, 8.005634307861328, 8.41762924194336, 8.829623222351074, 9.241618156433105, 9.65361213684082, 10.065607070922852, 10.477602005004883, 10.889596939086914, 11.301590919494629, 11.71358585357666, 12.125579833984375, 12.537574768066406, 12.949569702148438, 13.361563682556152, 13.773557662963867]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 0.0, 3.0, 2.0, 3.0, 3.0, 2.0, 3.0, 6.0, 5.0, 6.0, 12.0, 12.0, 12.0, 15.0, 20.0, 15.0, 15.0, 21.0, 40.0, 32.0, 31.0, 34.0, 38.0, 41.0, 44.0, 40.0, 43.0, 26.0, 43.0, 42.0, 42.0, 39.0, 40.0, 31.0, 30.0, 19.0, 26.0, 25.0, 17.0, 17.0, 28.0, 19.0, 14.0, 14.0, 8.0, 6.0, 2.0, 8.0, 8.0, 4.0, 5.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.840375900268555, -7.591174125671387, -7.341972351074219, -7.092770576477051, -6.843568325042725, -6.594366550445557, -6.345164775848389, -6.095963001251221, -5.846761226654053, -5.597559452056885, -5.348357677459717, -5.099155426025391, -4.849953651428223, -4.600751876831055, -4.351550102233887, -4.102348327636719, -3.8531463146209717, -3.6039445400238037, -3.3547425270080566, -3.1055407524108887, -2.8563389778137207, -2.6071372032165527, -2.3579351902008057, -2.1087334156036377, -1.8595315217971802, -1.6103296279907227, -1.3611278533935547, -1.1119259595870972, -0.8627241253852844, -0.6135222911834717, -0.36432039737701416, -0.11511862277984619, 0.13408327102661133, 0.3832851052284241, 0.6324869394302368, 0.8816888332366943, 1.1308906078338623, 1.3800925016403198, 1.6292943954467773, 1.8784961700439453, 2.1276979446411133, 2.3768997192382812, 2.6261017322540283, 2.8753035068511963, 3.1245052814483643, 3.3737072944641113, 3.6229090690612793, 3.8721108436584473, 4.121313095092773, 4.370514869689941, 4.619716644287109, 4.868918418884277, 5.1181206703186035, 5.3673224449157715, 5.6165242195129395, 5.865725994110107, 6.114927768707275, 6.364129543304443, 6.613331317901611, 6.8625335693359375, 7.1117353439331055, 7.360937118530273, 7.610138893127441, 7.859340667724609, 8.108542442321777]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 0.0, 3.0, 3.0, 6.0, 9.0, 9.0, 26.0, 37.0, 48.0, 80.0, 125.0, 172.0, 316.0, 522.0, 762.0, 1209.0, 1930.0, 3235.0, 5614.0, 10814.0, 22535.0, 53598.0, 131090.0, 261461.0, 281834.0, 154404.0, 64136.0, 26582.0, 12193.0, 6599.0, 3537.0, 2116.0, 1299.0, 810.0, 505.0, 346.0, 207.0, 146.0, 92.0, 53.0, 37.0, 28.0, 14.0, 7.0, 6.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.65625, -12.295654296875, -11.93505859375, -11.574462890625, -11.2138671875, -10.853271484375, -10.49267578125, -10.132080078125, -9.771484375, -9.410888671875, -9.05029296875, -8.689697265625, -8.3291015625, -7.968505859375, -7.60791015625, -7.247314453125, -6.88671875, -6.526123046875, -6.16552734375, -5.804931640625, -5.4443359375, -5.083740234375, -4.72314453125, -4.362548828125, -4.001953125, -3.641357421875, -3.28076171875, -2.920166015625, -2.5595703125, -2.198974609375, -1.83837890625, -1.477783203125, -1.1171875, -0.756591796875, -0.39599609375, -0.035400390625, 0.3251953125, 0.685791015625, 1.04638671875, 1.406982421875, 1.767578125, 2.128173828125, 2.48876953125, 2.849365234375, 3.2099609375, 3.570556640625, 3.93115234375, 4.291748046875, 4.65234375, 5.012939453125, 5.37353515625, 5.734130859375, 6.0947265625, 6.455322265625, 6.81591796875, 7.176513671875, 7.537109375, 7.897705078125, 8.25830078125, 8.618896484375, 8.9794921875, 9.340087890625, 9.70068359375, 10.061279296875, 10.421875]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 4.0, 5.0, 4.0, 5.0, 12.0, 10.0, 12.0, 9.0, 18.0, 16.0, 13.0, 23.0, 27.0, 28.0, 29.0, 27.0, 27.0, 38.0, 43.0, 29.0, 46.0, 50.0, 36.0, 32.0, 36.0, 44.0, 39.0, 29.0, 37.0, 29.0, 35.0, 37.0, 27.0, 22.0, 25.0, 14.0, 20.0, 12.0, 8.0, 10.0, 12.0, 5.0, 3.0, 7.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.5390625, -8.2694091796875, -7.999755859375, -7.7301025390625, -7.46044921875, -7.1907958984375, -6.921142578125, -6.6514892578125, -6.3818359375, -6.1121826171875, -5.842529296875, -5.5728759765625, -5.30322265625, -5.0335693359375, -4.763916015625, -4.4942626953125, -4.224609375, -3.9549560546875, -3.685302734375, -3.4156494140625, -3.14599609375, -2.8763427734375, -2.606689453125, -2.3370361328125, -2.0673828125, -1.7977294921875, -1.528076171875, -1.2584228515625, -0.98876953125, -0.7191162109375, -0.449462890625, -0.1798095703125, 0.08984375, 0.3594970703125, 0.629150390625, 0.8988037109375, 1.16845703125, 1.4381103515625, 1.707763671875, 1.9774169921875, 2.2470703125, 2.5167236328125, 2.786376953125, 3.0560302734375, 3.32568359375, 3.5953369140625, 3.864990234375, 4.1346435546875, 4.404296875, 4.6739501953125, 4.943603515625, 5.2132568359375, 5.48291015625, 5.7525634765625, 6.022216796875, 6.2918701171875, 6.5615234375, 6.8311767578125, 7.100830078125, 7.3704833984375, 7.64013671875, 7.9097900390625, 8.179443359375, 8.4490966796875, 8.71875]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 7.0, 6.0, 10.0, 10.0, 10.0, 15.0, 26.0, 39.0, 50.0, 79.0, 93.0, 126.0, 186.0, 240.0, 352.0, 509.0, 780.0, 1187.0, 1881.0, 3242.0, 6131.0, 13328.0, 34824.0, 118225.0, 387379.0, 331914.0, 93829.0, 29143.0, 11467.0, 5453.0, 2849.0, 1753.0, 1022.0, 673.0, 511.0, 322.0, 247.0, 156.0, 150.0, 84.0, 56.0, 59.0, 48.0, 26.0, 16.0, 14.0, 16.0, 7.0, 4.0, 3.0, 4.0, 3.0, 0.0, 2.0], "bins": [-20.796875, -20.201171875, -19.60546875, -19.009765625, -18.4140625, -17.818359375, -17.22265625, -16.626953125, -16.03125, -15.435546875, -14.83984375, -14.244140625, -13.6484375, -13.052734375, -12.45703125, -11.861328125, -11.265625, -10.669921875, -10.07421875, -9.478515625, -8.8828125, -8.287109375, -7.69140625, -7.095703125, -6.5, -5.904296875, -5.30859375, -4.712890625, -4.1171875, -3.521484375, -2.92578125, -2.330078125, -1.734375, -1.138671875, -0.54296875, 0.052734375, 0.6484375, 1.244140625, 1.83984375, 2.435546875, 3.03125, 3.626953125, 4.22265625, 4.818359375, 5.4140625, 6.009765625, 6.60546875, 7.201171875, 7.796875, 8.392578125, 8.98828125, 9.583984375, 10.1796875, 10.775390625, 11.37109375, 11.966796875, 12.5625, 13.158203125, 13.75390625, 14.349609375, 14.9453125, 15.541015625, 16.13671875, 16.732421875, 17.328125]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 5.0, 7.0, 15.0, 10.0, 14.0, 9.0, 17.0, 15.0, 21.0, 34.0, 27.0, 29.0, 23.0, 33.0, 27.0, 37.0, 33.0, 30.0, 33.0, 36.0, 34.0, 32.0, 50.0, 42.0, 23.0, 36.0, 41.0, 26.0, 26.0, 34.0, 26.0, 20.0, 21.0, 26.0, 22.0, 17.0, 9.0, 11.0, 13.0, 11.0, 7.0, 6.0, 6.0, 3.0, 1.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0], "bins": [-5.11328125, -4.95623779296875, -4.7991943359375, -4.64215087890625, -4.485107421875, -4.32806396484375, -4.1710205078125, -4.01397705078125, -3.85693359375, -3.69989013671875, -3.5428466796875, -3.38580322265625, -3.228759765625, -3.07171630859375, -2.9146728515625, -2.75762939453125, -2.6005859375, -2.44354248046875, -2.2864990234375, -2.12945556640625, -1.972412109375, -1.81536865234375, -1.6583251953125, -1.50128173828125, -1.34423828125, -1.18719482421875, -1.0301513671875, -0.87310791015625, -0.716064453125, -0.55902099609375, -0.4019775390625, -0.24493408203125, -0.087890625, 0.06915283203125, 0.2261962890625, 0.38323974609375, 0.540283203125, 0.69732666015625, 0.8543701171875, 1.01141357421875, 1.16845703125, 1.32550048828125, 1.4825439453125, 1.63958740234375, 1.796630859375, 1.95367431640625, 2.1107177734375, 2.26776123046875, 2.4248046875, 2.58184814453125, 2.7388916015625, 2.89593505859375, 3.052978515625, 3.21002197265625, 3.3670654296875, 3.52410888671875, 3.68115234375, 3.83819580078125, 3.9952392578125, 4.15228271484375, 4.309326171875, 4.46636962890625, 4.6234130859375, 4.78045654296875, 4.9375]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 7.0, 12.0, 12.0, 17.0, 21.0, 36.0, 54.0, 90.0, 106.0, 148.0, 211.0, 270.0, 350.0, 505.0, 678.0, 956.0, 1381.0, 1988.0, 3087.0, 5015.0, 8817.0, 17423.0, 39390.0, 99223.0, 248249.0, 334822.0, 164714.0, 63177.0, 26222.0, 12517.0, 6727.0, 3933.0, 2570.0, 1644.0, 1185.0, 825.0, 615.0, 460.0, 307.0, 236.0, 160.0, 116.0, 95.0, 57.0, 38.0, 31.0, 24.0, 16.0, 9.0, 5.0, 2.0, 3.0, 5.0, 2.0, 2.0, 2.0], "bins": [-6.015625, -5.83477783203125, -5.6539306640625, -5.47308349609375, -5.292236328125, -5.11138916015625, -4.9305419921875, -4.74969482421875, -4.56884765625, -4.38800048828125, -4.2071533203125, -4.02630615234375, -3.845458984375, -3.66461181640625, -3.4837646484375, -3.30291748046875, -3.1220703125, -2.94122314453125, -2.7603759765625, -2.57952880859375, -2.398681640625, -2.21783447265625, -2.0369873046875, -1.85614013671875, -1.67529296875, -1.49444580078125, -1.3135986328125, -1.13275146484375, -0.951904296875, -0.77105712890625, -0.5902099609375, -0.40936279296875, -0.228515625, -0.04766845703125, 0.1331787109375, 0.31402587890625, 0.494873046875, 0.67572021484375, 0.8565673828125, 1.03741455078125, 1.21826171875, 1.39910888671875, 1.5799560546875, 1.76080322265625, 1.941650390625, 2.12249755859375, 2.3033447265625, 2.48419189453125, 2.6650390625, 2.84588623046875, 3.0267333984375, 3.20758056640625, 3.388427734375, 3.56927490234375, 3.7501220703125, 3.93096923828125, 4.11181640625, 4.29266357421875, 4.4735107421875, 4.65435791015625, 4.835205078125, 5.01605224609375, 5.1968994140625, 5.37774658203125, 5.55859375]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 5.0, 3.0, 9.0, 10.0, 12.0, 17.0, 29.0, 53.0, 77.0, 115.0, 151.0, 130.0, 138.0, 77.0, 67.0, 36.0, 15.0, 19.0, 8.0, 12.0, 4.0, 4.0, 5.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00036334991455078125, -0.0003500841557979584, -0.0003368183970451355, -0.0003235526382923126, -0.00031028687953948975, -0.00029702112078666687, -0.000283755362033844, -0.0002704896032810211, -0.00025722384452819824, -0.00024395808577537537, -0.0002306923270225525, -0.00021742656826972961, -0.00020416080951690674, -0.00019089505076408386, -0.00017762929201126099, -0.0001643635332584381, -0.00015109777450561523, -0.00013783201575279236, -0.00012456625699996948, -0.0001113004982471466, -9.803473949432373e-05, -8.476898074150085e-05, -7.150322198867798e-05, -5.82374632358551e-05, -4.4971704483032227e-05, -3.170594573020935e-05, -1.8440186977386475e-05, -5.174428224563599e-06, 8.091330528259277e-06, 2.1357089281082153e-05, 3.462284803390503e-05, 4.7888606786727905e-05, 6.115436553955078e-05, 7.442012429237366e-05, 8.768588304519653e-05, 0.00010095164179801941, 0.00011421740055084229, 0.00012748315930366516, 0.00014074891805648804, 0.0001540146768093109, 0.0001672804355621338, 0.00018054619431495667, 0.00019381195306777954, 0.00020707771182060242, 0.0002203434705734253, 0.00023360922932624817, 0.00024687498807907104, 0.0002601407468318939, 0.0002734065055847168, 0.00028667226433753967, 0.00029993802309036255, 0.0003132037818431854, 0.0003264695405960083, 0.0003397352993488312, 0.00035300105810165405, 0.00036626681685447693, 0.0003795325756072998, 0.0003927983343601227, 0.00040606409311294556, 0.00041932985186576843, 0.0004325956106185913, 0.0004458613693714142, 0.00045912712812423706, 0.00047239288687705994, 0.0004856586456298828]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 4.0, 6.0, 2.0, 14.0, 19.0, 26.0, 49.0, 56.0, 91.0, 113.0, 136.0, 225.0, 329.0, 479.0, 722.0, 999.0, 1499.0, 2379.0, 3496.0, 5997.0, 10477.0, 21336.0, 51100.0, 128594.0, 265307.0, 287094.0, 152376.0, 60630.0, 24996.0, 12032.0, 6568.0, 3940.0, 2389.0, 1623.0, 1122.0, 704.0, 476.0, 358.0, 244.0, 178.0, 103.0, 96.0, 58.0, 37.0, 21.0, 17.0, 12.0, 10.0, 7.0, 3.0, 7.0, 1.0, 4.0, 3.0, 1.0, 2.0], "bins": [-6.08203125, -5.89825439453125, -5.7144775390625, -5.53070068359375, -5.346923828125, -5.16314697265625, -4.9793701171875, -4.79559326171875, -4.61181640625, -4.42803955078125, -4.2442626953125, -4.06048583984375, -3.876708984375, -3.69293212890625, -3.5091552734375, -3.32537841796875, -3.1416015625, -2.95782470703125, -2.7740478515625, -2.59027099609375, -2.406494140625, -2.22271728515625, -2.0389404296875, -1.85516357421875, -1.67138671875, -1.48760986328125, -1.3038330078125, -1.12005615234375, -0.936279296875, -0.75250244140625, -0.5687255859375, -0.38494873046875, -0.201171875, -0.01739501953125, 0.1663818359375, 0.35015869140625, 0.533935546875, 0.71771240234375, 0.9014892578125, 1.08526611328125, 1.26904296875, 1.45281982421875, 1.6365966796875, 1.82037353515625, 2.004150390625, 2.18792724609375, 2.3717041015625, 2.55548095703125, 2.7392578125, 2.92303466796875, 3.1068115234375, 3.29058837890625, 3.474365234375, 3.65814208984375, 3.8419189453125, 4.02569580078125, 4.20947265625, 4.39324951171875, 4.5770263671875, 4.76080322265625, 4.944580078125, 5.12835693359375, 5.3121337890625, 5.49591064453125, 5.6796875]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 2.0, 9.0, 8.0, 16.0, 30.0, 51.0, 108.0, 135.0, 179.0, 164.0, 122.0, 63.0, 36.0, 26.0, 12.0, 8.0, 7.0, 6.0, 3.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.458984375, -3.369598388671875, -3.28021240234375, -3.190826416015625, -3.1014404296875, -3.012054443359375, -2.92266845703125, -2.833282470703125, -2.743896484375, -2.654510498046875, -2.56512451171875, -2.475738525390625, -2.3863525390625, -2.296966552734375, -2.20758056640625, -2.118194580078125, -2.02880859375, -1.939422607421875, -1.85003662109375, -1.760650634765625, -1.6712646484375, -1.581878662109375, -1.49249267578125, -1.403106689453125, -1.313720703125, -1.224334716796875, -1.13494873046875, -1.045562744140625, -0.9561767578125, -0.866790771484375, -0.77740478515625, -0.688018798828125, -0.5986328125, -0.509246826171875, -0.41986083984375, -0.330474853515625, -0.2410888671875, -0.151702880859375, -0.06231689453125, 0.027069091796875, 0.116455078125, 0.205841064453125, 0.29522705078125, 0.384613037109375, 0.4739990234375, 0.563385009765625, 0.65277099609375, 0.742156982421875, 0.83154296875, 0.920928955078125, 1.01031494140625, 1.099700927734375, 1.1890869140625, 1.278472900390625, 1.36785888671875, 1.457244873046875, 1.546630859375, 1.636016845703125, 1.72540283203125, 1.814788818359375, 1.9041748046875, 1.993560791015625, 2.08294677734375, 2.172332763671875, 2.26171875]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 5.0, 7.0, 13.0, 19.0, 22.0, 28.0, 30.0, 36.0, 32.0, 41.0, 42.0, 52.0, 56.0, 47.0, 55.0, 58.0, 59.0, 56.0, 48.0, 42.0, 34.0, 25.0, 26.0, 36.0, 28.0, 16.0, 15.0, 14.0, 10.0, 7.0, 9.0, 8.0, 5.0, 3.0, 3.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.823941230773926, -11.421636581420898, -11.019332885742188, -10.61702823638916, -10.21472454071045, -9.812419891357422, -9.410116195678711, -9.007811546325684, -8.605507850646973, -8.203203201293945, -7.800899505615234, -7.398595333099365, -6.996291160583496, -6.593986511230469, -6.191682815551758, -5.7893781661987305, -5.387073993682861, -4.984769821166992, -4.582465648651123, -4.180161476135254, -3.7778573036193848, -3.3755528926849365, -2.9732487201690674, -2.5709445476531982, -2.168640375137329, -1.76633620262146, -1.3640320301055908, -0.9617277383804321, -0.559423565864563, -0.1571192741394043, 0.24518489837646484, 0.647489070892334, 1.0497932434082031, 1.4520974159240723, 1.8544015884399414, 2.2567057609558105, 2.6590099334716797, 3.061314344406128, 3.463618516921997, 3.865922689437866, 4.268226623535156, 4.670530796051025, 5.0728349685668945, 5.475139141082764, 5.877443313598633, 6.27974796295166, 6.682051658630371, 7.084356307983398, 7.486660480499268, 7.888964653015137, 8.291269302368164, 8.693572998046875, 9.095877647399902, 9.498181343078613, 9.90048599243164, 10.302789688110352, 10.705094337463379, 11.107398986816406, 11.509702682495117, 11.912007331848145, 12.314311027526855, 12.716615676879883, 13.118919372558594, 13.521224021911621, 13.923527717590332]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 2.0, 7.0, 5.0, 8.0, 10.0, 15.0, 14.0, 11.0, 21.0, 15.0, 16.0, 28.0, 29.0, 29.0, 32.0, 34.0, 45.0, 39.0, 38.0, 44.0, 38.0, 34.0, 43.0, 46.0, 43.0, 45.0, 36.0, 27.0, 31.0, 26.0, 22.0, 22.0, 21.0, 13.0, 25.0, 21.0, 13.0, 11.0, 8.0, 4.0, 9.0, 4.0, 7.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.86002779006958, -7.609091758728027, -7.358155250549316, -7.1072187423706055, -6.856282711029053, -6.6053466796875, -6.354410171508789, -6.103473663330078, -5.852537631988525, -5.601601600646973, -5.350665092468262, -5.099728584289551, -4.848792552947998, -4.597856521606445, -4.346920013427734, -4.095983505249023, -3.8450474739074707, -3.594111204147339, -3.343174934387207, -3.092238664627075, -2.8413023948669434, -2.5903661251068115, -2.3394298553466797, -2.088493585586548, -1.837557315826416, -1.5866210460662842, -1.3356847763061523, -1.0847485065460205, -0.8338122367858887, -0.5828759670257568, -0.331939697265625, -0.08100342750549316, 0.16993236541748047, 0.4208686351776123, 0.6718049049377441, 0.922741174697876, 1.1736774444580078, 1.4246137142181396, 1.6755499839782715, 1.9264862537384033, 2.177422523498535, 2.428358793258667, 2.679295063018799, 2.9302313327789307, 3.1811676025390625, 3.4321038722991943, 3.683040142059326, 3.933976411819458, 4.18491268157959, 4.435849189758301, 4.6867852210998535, 4.937721252441406, 5.188657760620117, 5.439594268798828, 5.690530300140381, 5.941466331481934, 6.1924028396606445, 6.4433393478393555, 6.694275379180908, 6.945211410522461, 7.196147918701172, 7.447084426879883, 7.6980204582214355, 7.948956489562988, 8.1998929977417]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 6.0, 4.0, 7.0, 9.0, 11.0, 20.0, 26.0, 38.0, 63.0, 104.0, 184.0, 240.0, 365.0, 555.0, 868.0, 1358.0, 2118.0, 3447.0, 5157.0, 7984.0, 12596.0, 19007.0, 28995.0, 42774.0, 61266.0, 82404.0, 104134.0, 119628.0, 122351.0, 113012.0, 94105.0, 71695.0, 50968.0, 35614.0, 23969.0, 15319.0, 10064.0, 6548.0, 4089.0, 2642.0, 1642.0, 1131.0, 736.0, 464.0, 305.0, 169.0, 145.0, 84.0, 51.0, 33.0, 20.0, 14.0, 12.0, 6.0, 5.0, 1.0, 1.0, 2.0, 4.0, 2.0], "bins": [-6.71484375, -6.50665283203125, -6.2984619140625, -6.09027099609375, -5.882080078125, -5.67388916015625, -5.4656982421875, -5.25750732421875, -5.04931640625, -4.84112548828125, -4.6329345703125, -4.42474365234375, -4.216552734375, -4.00836181640625, -3.8001708984375, -3.59197998046875, -3.3837890625, -3.17559814453125, -2.9674072265625, -2.75921630859375, -2.551025390625, -2.34283447265625, -2.1346435546875, -1.92645263671875, -1.71826171875, -1.51007080078125, -1.3018798828125, -1.09368896484375, -0.885498046875, -0.67730712890625, -0.4691162109375, -0.26092529296875, -0.052734375, 0.15545654296875, 0.3636474609375, 0.57183837890625, 0.780029296875, 0.98822021484375, 1.1964111328125, 1.40460205078125, 1.61279296875, 1.82098388671875, 2.0291748046875, 2.23736572265625, 2.445556640625, 2.65374755859375, 2.8619384765625, 3.07012939453125, 3.2783203125, 3.48651123046875, 3.6947021484375, 3.90289306640625, 4.111083984375, 4.31927490234375, 4.5274658203125, 4.73565673828125, 4.94384765625, 5.15203857421875, 5.3602294921875, 5.56842041015625, 5.776611328125, 5.98480224609375, 6.1929931640625, 6.40118408203125, 6.609375]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 2.0, 2.0, 5.0, 9.0, 5.0, 4.0, 6.0, 12.0, 15.0, 18.0, 16.0, 20.0, 26.0, 16.0, 29.0, 23.0, 31.0, 27.0, 31.0, 38.0, 51.0, 32.0, 45.0, 35.0, 37.0, 34.0, 42.0, 44.0, 34.0, 34.0, 35.0, 22.0, 33.0, 29.0, 22.0, 29.0, 16.0, 14.0, 12.0, 12.0, 12.0, 3.0, 5.0, 10.0, 6.0, 4.0, 5.0, 1.0, 2.0, 2.0, 4.0, 2.0, 2.0, 0.0, 2.0], "bins": [-8.421875, -8.16748046875, -7.9130859375, -7.65869140625, -7.404296875, -7.14990234375, -6.8955078125, -6.64111328125, -6.38671875, -6.13232421875, -5.8779296875, -5.62353515625, -5.369140625, -5.11474609375, -4.8603515625, -4.60595703125, -4.3515625, -4.09716796875, -3.8427734375, -3.58837890625, -3.333984375, -3.07958984375, -2.8251953125, -2.57080078125, -2.31640625, -2.06201171875, -1.8076171875, -1.55322265625, -1.298828125, -1.04443359375, -0.7900390625, -0.53564453125, -0.28125, -0.02685546875, 0.2275390625, 0.48193359375, 0.736328125, 0.99072265625, 1.2451171875, 1.49951171875, 1.75390625, 2.00830078125, 2.2626953125, 2.51708984375, 2.771484375, 3.02587890625, 3.2802734375, 3.53466796875, 3.7890625, 4.04345703125, 4.2978515625, 4.55224609375, 4.806640625, 5.06103515625, 5.3154296875, 5.56982421875, 5.82421875, 6.07861328125, 6.3330078125, 6.58740234375, 6.841796875, 7.09619140625, 7.3505859375, 7.60498046875, 7.859375]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 5.0, 18.0, 32.0, 26.0, 50.0, 73.0, 126.0, 213.0, 324.0, 603.0, 942.0, 1483.0, 2359.0, 4111.0, 6770.0, 11103.0, 18347.0, 29926.0, 47037.0, 71827.0, 100929.0, 127090.0, 141703.0, 135345.0, 112509.0, 84308.0, 56962.0, 36713.0, 22757.0, 13788.0, 8351.0, 4961.0, 3024.0, 1840.0, 1093.0, 711.0, 392.0, 267.0, 172.0, 118.0, 60.0, 30.0, 22.0, 14.0, 13.0, 3.0, 6.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.2109375, -6.96826171875, -6.7255859375, -6.48291015625, -6.240234375, -5.99755859375, -5.7548828125, -5.51220703125, -5.26953125, -5.02685546875, -4.7841796875, -4.54150390625, -4.298828125, -4.05615234375, -3.8134765625, -3.57080078125, -3.328125, -3.08544921875, -2.8427734375, -2.60009765625, -2.357421875, -2.11474609375, -1.8720703125, -1.62939453125, -1.38671875, -1.14404296875, -0.9013671875, -0.65869140625, -0.416015625, -0.17333984375, 0.0693359375, 0.31201171875, 0.5546875, 0.79736328125, 1.0400390625, 1.28271484375, 1.525390625, 1.76806640625, 2.0107421875, 2.25341796875, 2.49609375, 2.73876953125, 2.9814453125, 3.22412109375, 3.466796875, 3.70947265625, 3.9521484375, 4.19482421875, 4.4375, 4.68017578125, 4.9228515625, 5.16552734375, 5.408203125, 5.65087890625, 5.8935546875, 6.13623046875, 6.37890625, 6.62158203125, 6.8642578125, 7.10693359375, 7.349609375, 7.59228515625, 7.8349609375, 8.07763671875, 8.3203125]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 4.0, 6.0, 2.0, 7.0, 10.0, 11.0, 8.0, 14.0, 12.0, 22.0, 26.0, 31.0, 24.0, 23.0, 32.0, 37.0, 35.0, 46.0, 42.0, 49.0, 37.0, 42.0, 37.0, 37.0, 51.0, 41.0, 39.0, 32.0, 32.0, 23.0, 30.0, 24.0, 24.0, 26.0, 20.0, 14.0, 8.0, 10.0, 8.0, 8.0, 8.0, 3.0, 6.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-6.55859375, -6.36810302734375, -6.1776123046875, -5.98712158203125, -5.796630859375, -5.60614013671875, -5.4156494140625, -5.22515869140625, -5.03466796875, -4.84417724609375, -4.6536865234375, -4.46319580078125, -4.272705078125, -4.08221435546875, -3.8917236328125, -3.70123291015625, -3.5107421875, -3.32025146484375, -3.1297607421875, -2.93927001953125, -2.748779296875, -2.55828857421875, -2.3677978515625, -2.17730712890625, -1.98681640625, -1.79632568359375, -1.6058349609375, -1.41534423828125, -1.224853515625, -1.03436279296875, -0.8438720703125, -0.65338134765625, -0.462890625, -0.27239990234375, -0.0819091796875, 0.10858154296875, 0.299072265625, 0.48956298828125, 0.6800537109375, 0.87054443359375, 1.06103515625, 1.25152587890625, 1.4420166015625, 1.63250732421875, 1.822998046875, 2.01348876953125, 2.2039794921875, 2.39447021484375, 2.5849609375, 2.77545166015625, 2.9659423828125, 3.15643310546875, 3.346923828125, 3.53741455078125, 3.7279052734375, 3.91839599609375, 4.10888671875, 4.29937744140625, 4.4898681640625, 4.68035888671875, 4.870849609375, 5.06134033203125, 5.2518310546875, 5.44232177734375, 5.6328125]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 5.0, 6.0, 3.0, 10.0, 15.0, 22.0, 44.0, 43.0, 72.0, 121.0, 149.0, 259.0, 347.0, 492.0, 812.0, 1296.0, 2130.0, 3418.0, 5842.0, 10504.0, 18630.0, 32863.0, 57629.0, 95226.0, 141297.0, 172917.0, 168950.0, 130670.0, 85838.0, 50980.0, 29049.0, 16298.0, 9090.0, 5174.0, 3050.0, 1904.0, 1162.0, 796.0, 459.0, 331.0, 199.0, 139.0, 103.0, 58.0, 50.0, 38.0, 26.0, 20.0, 9.0, 3.0, 7.0, 5.0, 1.0, 4.0, 2.0], "bins": [-5.6640625, -5.501708984375, -5.33935546875, -5.177001953125, -5.0146484375, -4.852294921875, -4.68994140625, -4.527587890625, -4.365234375, -4.202880859375, -4.04052734375, -3.878173828125, -3.7158203125, -3.553466796875, -3.39111328125, -3.228759765625, -3.06640625, -2.904052734375, -2.74169921875, -2.579345703125, -2.4169921875, -2.254638671875, -2.09228515625, -1.929931640625, -1.767578125, -1.605224609375, -1.44287109375, -1.280517578125, -1.1181640625, -0.955810546875, -0.79345703125, -0.631103515625, -0.46875, -0.306396484375, -0.14404296875, 0.018310546875, 0.1806640625, 0.343017578125, 0.50537109375, 0.667724609375, 0.830078125, 0.992431640625, 1.15478515625, 1.317138671875, 1.4794921875, 1.641845703125, 1.80419921875, 1.966552734375, 2.12890625, 2.291259765625, 2.45361328125, 2.615966796875, 2.7783203125, 2.940673828125, 3.10302734375, 3.265380859375, 3.427734375, 3.590087890625, 3.75244140625, 3.914794921875, 4.0771484375, 4.239501953125, 4.40185546875, 4.564208984375, 4.7265625]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 3.0, 6.0, 8.0, 6.0, 4.0, 7.0, 12.0, 10.0, 16.0, 23.0, 17.0, 30.0, 36.0, 40.0, 68.0, 75.0, 61.0, 64.0, 61.0, 67.0, 69.0, 53.0, 55.0, 32.0, 31.0, 30.0, 26.0, 14.0, 19.0, 17.0, 12.0, 3.0, 2.0, 3.0, 6.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0], "bins": [-0.0007243156433105469, -0.0007052198052406311, -0.0006861239671707153, -0.0006670281291007996, -0.0006479322910308838, -0.000628836452960968, -0.0006097406148910522, -0.0005906447768211365, -0.0005715489387512207, -0.0005524531006813049, -0.0005333572626113892, -0.0005142614245414734, -0.0004951655864715576, -0.00047606974840164185, -0.0004569739103317261, -0.0004378780722618103, -0.00041878223419189453, -0.00039968639612197876, -0.000380590558052063, -0.0003614947199821472, -0.00034239888191223145, -0.0003233030438423157, -0.0003042072057723999, -0.00028511136770248413, -0.00026601552963256836, -0.0002469196915626526, -0.00022782385349273682, -0.00020872801542282104, -0.00018963217735290527, -0.0001705363392829895, -0.00015144050121307373, -0.00013234466314315796, -0.00011324882507324219, -9.415298700332642e-05, -7.505714893341064e-05, -5.596131086349487e-05, -3.68654727935791e-05, -1.776963472366333e-05, 1.3262033462524414e-06, 2.0422041416168213e-05, 3.9517879486083984e-05, 5.8613717555999756e-05, 7.770955562591553e-05, 9.68053936958313e-05, 0.00011590123176574707, 0.00013499706983566284, 0.0001540929079055786, 0.00017318874597549438, 0.00019228458404541016, 0.00021138042211532593, 0.0002304762601852417, 0.00024957209825515747, 0.00026866793632507324, 0.000287763774394989, 0.0003068596124649048, 0.00032595545053482056, 0.00034505128860473633, 0.0003641471266746521, 0.00038324296474456787, 0.00040233880281448364, 0.0004214346408843994, 0.0004405304789543152, 0.00045962631702423096, 0.00047872215509414673, 0.0004978179931640625]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 0.0, 5.0, 4.0, 3.0, 4.0, 10.0, 5.0, 7.0, 15.0, 28.0, 33.0, 57.0, 92.0, 132.0, 200.0, 363.0, 685.0, 1437.0, 3271.0, 8446.0, 23045.0, 64909.0, 166977.0, 297065.0, 270140.0, 132855.0, 49375.0, 17600.0, 6629.0, 2610.0, 1142.0, 557.0, 309.0, 199.0, 119.0, 64.0, 43.0, 37.0, 16.0, 24.0, 9.0, 9.0, 5.0, 7.0, 4.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-9.6171875, -9.3245849609375, -9.031982421875, -8.7393798828125, -8.44677734375, -8.1541748046875, -7.861572265625, -7.5689697265625, -7.2763671875, -6.9837646484375, -6.691162109375, -6.3985595703125, -6.10595703125, -5.8133544921875, -5.520751953125, -5.2281494140625, -4.935546875, -4.6429443359375, -4.350341796875, -4.0577392578125, -3.76513671875, -3.4725341796875, -3.179931640625, -2.8873291015625, -2.5947265625, -2.3021240234375, -2.009521484375, -1.7169189453125, -1.42431640625, -1.1317138671875, -0.839111328125, -0.5465087890625, -0.25390625, 0.0386962890625, 0.331298828125, 0.6239013671875, 0.91650390625, 1.2091064453125, 1.501708984375, 1.7943115234375, 2.0869140625, 2.3795166015625, 2.672119140625, 2.9647216796875, 3.25732421875, 3.5499267578125, 3.842529296875, 4.1351318359375, 4.427734375, 4.7203369140625, 5.012939453125, 5.3055419921875, 5.59814453125, 5.8907470703125, 6.183349609375, 6.4759521484375, 6.7685546875, 7.0611572265625, 7.353759765625, 7.6463623046875, 7.93896484375, 8.2315673828125, 8.524169921875, 8.8167724609375, 9.109375]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 5.0, 10.0, 9.0, 15.0, 11.0, 19.0, 20.0, 24.0, 30.0, 42.0, 51.0, 61.0, 54.0, 47.0, 64.0, 65.0, 52.0, 67.0, 52.0, 56.0, 50.0, 43.0, 34.0, 26.0, 22.0, 14.0, 13.0, 12.0, 6.0, 10.0, 6.0, 6.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.9990234375, -1.9424591064453125, -1.885894775390625, -1.8293304443359375, -1.77276611328125, -1.7162017822265625, -1.659637451171875, -1.6030731201171875, -1.5465087890625, -1.4899444580078125, -1.433380126953125, -1.3768157958984375, -1.32025146484375, -1.2636871337890625, -1.207122802734375, -1.1505584716796875, -1.093994140625, -1.0374298095703125, -0.980865478515625, -0.9243011474609375, -0.86773681640625, -0.8111724853515625, -0.754608154296875, -0.6980438232421875, -0.6414794921875, -0.5849151611328125, -0.528350830078125, -0.4717864990234375, -0.41522216796875, -0.3586578369140625, -0.302093505859375, -0.2455291748046875, -0.18896484375, -0.1324005126953125, -0.075836181640625, -0.0192718505859375, 0.03729248046875, 0.0938568115234375, 0.150421142578125, 0.2069854736328125, 0.2635498046875, 0.3201141357421875, 0.376678466796875, 0.4332427978515625, 0.48980712890625, 0.5463714599609375, 0.602935791015625, 0.6595001220703125, 0.716064453125, 0.7726287841796875, 0.829193115234375, 0.8857574462890625, 0.94232177734375, 0.9988861083984375, 1.055450439453125, 1.1120147705078125, 1.1685791015625, 1.2251434326171875, 1.281707763671875, 1.3382720947265625, 1.39483642578125, 1.4514007568359375, 1.507965087890625, 1.5645294189453125, 1.62109375]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 4.0, 1.0, 6.0, 5.0, 5.0, 15.0, 12.0, 14.0, 15.0, 19.0, 35.0, 28.0, 26.0, 33.0, 44.0, 50.0, 43.0, 49.0, 49.0, 42.0, 59.0, 50.0, 48.0, 53.0, 36.0, 37.0, 38.0, 20.0, 22.0, 29.0, 20.0, 21.0, 13.0, 14.0, 6.0, 6.0, 9.0, 7.0, 0.0, 4.0, 8.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.28453540802002, -9.909186363220215, -9.53383731842041, -9.158489227294922, -8.783140182495117, -8.407791137695312, -8.032442092895508, -7.657093048095703, -7.281744003295898, -6.906394958496094, -6.531046390533447, -6.155697345733643, -5.780348300933838, -5.404999732971191, -5.029650688171387, -4.654301643371582, -4.2789530754089355, -3.90360426902771, -3.5282552242279053, -3.1529064178466797, -2.777557373046875, -2.4022085666656494, -2.026859760284424, -1.6515107154846191, -1.2761619091033936, -0.9008129835128784, -0.5254641175270081, -0.1501152515411377, 0.22523367404937744, 0.6005825996398926, 0.9759314060211182, 1.3512804508209229, 1.7266292572021484, 2.101978063583374, 2.4773271083831787, 2.8526759147644043, 3.228024959564209, 3.6033737659454346, 3.97872257232666, 4.354071617126465, 4.7294206619262695, 5.104769706726074, 5.480118274688721, 5.855467319488525, 6.23081636428833, 6.606164932250977, 6.981513977050781, 7.356863021850586, 7.732211589813232, 8.107560157775879, 8.482909202575684, 8.858258247375488, 9.233607292175293, 9.608956336975098, 9.984304428100586, 10.35965347290039, 10.735002517700195, 11.1103515625, 11.485700607299805, 11.86104965209961, 12.236397743225098, 12.611746788024902, 12.987095832824707, 13.362444877624512, 13.737793922424316]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 5.0, 4.0, 4.0, 2.0, 11.0, 13.0, 10.0, 6.0, 19.0, 7.0, 12.0, 14.0, 18.0, 26.0, 14.0, 20.0, 22.0, 39.0, 39.0, 36.0, 44.0, 35.0, 32.0, 41.0, 35.0, 28.0, 37.0, 32.0, 31.0, 29.0, 40.0, 45.0, 30.0, 26.0, 25.0, 20.0, 17.0, 27.0, 19.0, 12.0, 17.0, 11.0, 11.0, 11.0, 10.0, 8.0, 3.0, 5.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.382548332214355, -8.111221313476562, -7.8398942947387695, -7.568567752838135, -7.297240734100342, -7.025913715362549, -6.754587173461914, -6.483260154724121, -6.211933135986328, -5.940606117248535, -5.669279098510742, -5.397952556610107, -5.1266255378723145, -4.8552985191345215, -4.583971977233887, -4.312644958496094, -4.041317939758301, -3.769990921020508, -3.498664140701294, -3.22733736038208, -2.956010341644287, -2.684683322906494, -2.4133565425872803, -2.1420297622680664, -1.8707027435302734, -1.59937584400177, -1.3280489444732666, -1.0567220449447632, -0.7853951454162598, -0.5140682458877563, -0.24274134635925293, 0.02858555316925049, 0.2999134063720703, 0.5712403059005737, 0.8425672054290771, 1.1138941049575806, 1.385221004486084, 1.6565479040145874, 1.9278748035430908, 2.1992015838623047, 2.4705286026000977, 2.7418556213378906, 3.0131824016571045, 3.2845091819763184, 3.5558362007141113, 3.8271632194519043, 4.098489761352539, 4.369816780090332, 4.641143798828125, 4.912470817565918, 5.183797836303711, 5.455124378204346, 5.726451396942139, 5.997778415679932, 6.269104957580566, 6.540431976318359, 6.811758995056152, 7.083086013793945, 7.354413032531738, 7.625739574432373, 7.897066593170166, 8.1683931350708, 8.439720153808594, 8.711047172546387, 8.98237419128418]}, "gradients/decoder.bert.encoder.layer.4.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 6.0, 2.0, 2.0, 9.0, 23.0, 41.0, 48.0, 59.0, 116.0, 164.0, 222.0, 310.0, 480.0, 743.0, 1222.0, 1933.0, 3143.0, 5128.0, 8579.0, 15300.0, 27300.0, 49707.0, 93703.0, 178261.0, 338441.0, 602870.0, 857206.0, 822108.0, 546818.0, 300972.0, 157482.0, 81806.0, 43506.0, 23626.0, 13404.0, 7661.0, 4456.0, 2736.0, 1646.0, 1029.0, 660.0, 440.0, 288.0, 210.0, 141.0, 96.0, 51.0, 47.0, 23.0, 27.0, 16.0, 6.0, 10.0, 6.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-12.4140625, -12.0123291015625, -11.610595703125, -11.2088623046875, -10.80712890625, -10.4053955078125, -10.003662109375, -9.6019287109375, -9.2001953125, -8.7984619140625, -8.396728515625, -7.9949951171875, -7.59326171875, -7.1915283203125, -6.789794921875, -6.3880615234375, -5.986328125, -5.5845947265625, -5.182861328125, -4.7811279296875, -4.37939453125, -3.9776611328125, -3.575927734375, -3.1741943359375, -2.7724609375, -2.3707275390625, -1.968994140625, -1.5672607421875, -1.16552734375, -0.7637939453125, -0.362060546875, 0.0396728515625, 0.44140625, 0.8431396484375, 1.244873046875, 1.6466064453125, 2.04833984375, 2.4500732421875, 2.851806640625, 3.2535400390625, 3.6552734375, 4.0570068359375, 4.458740234375, 4.8604736328125, 5.26220703125, 5.6639404296875, 6.065673828125, 6.4674072265625, 6.869140625, 7.2708740234375, 7.672607421875, 8.0743408203125, 8.47607421875, 8.8778076171875, 9.279541015625, 9.6812744140625, 10.0830078125, 10.4847412109375, 10.886474609375, 11.2882080078125, 11.68994140625, 12.0916748046875, 12.493408203125, 12.8951416015625, 13.296875]}, "gradients/decoder.bert.encoder.layer.4.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 1.0, 7.0, 5.0, 7.0, 5.0, 12.0, 7.0, 18.0, 17.0, 21.0, 29.0, 25.0, 31.0, 29.0, 36.0, 48.0, 56.0, 36.0, 31.0, 62.0, 41.0, 42.0, 41.0, 37.0, 40.0, 32.0, 43.0, 36.0, 33.0, 35.0, 25.0, 30.0, 19.0, 9.0, 14.0, 9.0, 10.0, 7.0, 12.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.9140625, -8.66387939453125, -8.4136962890625, -8.16351318359375, -7.913330078125, -7.66314697265625, -7.4129638671875, -7.16278076171875, -6.91259765625, -6.66241455078125, -6.4122314453125, -6.16204833984375, -5.911865234375, -5.66168212890625, -5.4114990234375, -5.16131591796875, -4.9111328125, -4.66094970703125, -4.4107666015625, -4.16058349609375, -3.910400390625, -3.66021728515625, -3.4100341796875, -3.15985107421875, -2.90966796875, -2.65948486328125, -2.4093017578125, -2.15911865234375, -1.908935546875, -1.65875244140625, -1.4085693359375, -1.15838623046875, -0.908203125, -0.65802001953125, -0.4078369140625, -0.15765380859375, 0.092529296875, 0.34271240234375, 0.5928955078125, 0.84307861328125, 1.09326171875, 1.34344482421875, 1.5936279296875, 1.84381103515625, 2.093994140625, 2.34417724609375, 2.5943603515625, 2.84454345703125, 3.0947265625, 3.34490966796875, 3.5950927734375, 3.84527587890625, 4.095458984375, 4.34564208984375, 4.5958251953125, 4.84600830078125, 5.09619140625, 5.34637451171875, 5.5965576171875, 5.84674072265625, 6.096923828125, 6.34710693359375, 6.5972900390625, 6.84747314453125, 7.09765625]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 9.0, 2.0, 18.0, 15.0, 34.0, 46.0, 61.0, 137.0, 231.0, 383.0, 673.0, 1186.0, 2069.0, 4014.0, 7289.0, 14057.0, 28082.0, 55662.0, 109030.0, 212423.0, 393573.0, 645418.0, 840383.0, 764533.0, 512751.0, 290494.0, 153044.0, 77640.0, 39126.0, 19873.0, 10218.0, 5394.0, 2853.0, 1481.0, 861.0, 495.0, 266.0, 185.0, 109.0, 58.0, 41.0, 25.0, 16.0, 18.0, 2.0, 3.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.0, -13.544677734375, -13.08935546875, -12.634033203125, -12.1787109375, -11.723388671875, -11.26806640625, -10.812744140625, -10.357421875, -9.902099609375, -9.44677734375, -8.991455078125, -8.5361328125, -8.080810546875, -7.62548828125, -7.170166015625, -6.71484375, -6.259521484375, -5.80419921875, -5.348876953125, -4.8935546875, -4.438232421875, -3.98291015625, -3.527587890625, -3.072265625, -2.616943359375, -2.16162109375, -1.706298828125, -1.2509765625, -0.795654296875, -0.34033203125, 0.114990234375, 0.5703125, 1.025634765625, 1.48095703125, 1.936279296875, 2.3916015625, 2.846923828125, 3.30224609375, 3.757568359375, 4.212890625, 4.668212890625, 5.12353515625, 5.578857421875, 6.0341796875, 6.489501953125, 6.94482421875, 7.400146484375, 7.85546875, 8.310791015625, 8.76611328125, 9.221435546875, 9.6767578125, 10.132080078125, 10.58740234375, 11.042724609375, 11.498046875, 11.953369140625, 12.40869140625, 12.864013671875, 13.3193359375, 13.774658203125, 14.22998046875, 14.685302734375, 15.140625]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 4.0, 6.0, 7.0, 10.0, 17.0, 25.0, 28.0, 25.0, 35.0, 38.0, 58.0, 71.0, 95.0, 98.0, 132.0, 137.0, 162.0, 171.0, 217.0, 214.0, 247.0, 260.0, 261.0, 253.0, 245.0, 216.0, 188.0, 158.0, 145.0, 128.0, 104.0, 76.0, 61.0, 49.0, 37.0, 30.0, 13.0, 14.0, 18.0, 11.0, 3.0, 5.0, 4.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.841796875, -3.704254150390625, -3.56671142578125, -3.429168701171875, -3.2916259765625, -3.154083251953125, -3.01654052734375, -2.878997802734375, -2.741455078125, -2.603912353515625, -2.46636962890625, -2.328826904296875, -2.1912841796875, -2.053741455078125, -1.91619873046875, -1.778656005859375, -1.64111328125, -1.503570556640625, -1.36602783203125, -1.228485107421875, -1.0909423828125, -0.953399658203125, -0.81585693359375, -0.678314208984375, -0.540771484375, -0.403228759765625, -0.26568603515625, -0.128143310546875, 0.0093994140625, 0.146942138671875, 0.28448486328125, 0.422027587890625, 0.5595703125, 0.697113037109375, 0.83465576171875, 0.972198486328125, 1.1097412109375, 1.247283935546875, 1.38482666015625, 1.522369384765625, 1.659912109375, 1.797454833984375, 1.93499755859375, 2.072540283203125, 2.2100830078125, 2.347625732421875, 2.48516845703125, 2.622711181640625, 2.76025390625, 2.897796630859375, 3.03533935546875, 3.172882080078125, 3.3104248046875, 3.447967529296875, 3.58551025390625, 3.723052978515625, 3.860595703125, 3.998138427734375, 4.13568115234375, 4.273223876953125, 4.4107666015625, 4.548309326171875, 4.68585205078125, 4.823394775390625, 4.9609375]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 0.0, 2.0, 4.0, 4.0, 6.0, 10.0, 8.0, 9.0, 14.0, 15.0, 11.0, 27.0, 18.0, 26.0, 38.0, 32.0, 34.0, 41.0, 64.0, 45.0, 48.0, 64.0, 50.0, 53.0, 54.0, 36.0, 38.0, 34.0, 45.0, 23.0, 31.0, 24.0, 20.0, 14.0, 15.0, 7.0, 10.0, 7.0, 4.0, 3.0, 3.0, 1.0, 5.0, 0.0, 7.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-14.245359420776367, -13.836874008178711, -13.428388595581055, -13.019903182983398, -12.611416816711426, -12.20293140411377, -11.794445991516113, -11.385960578918457, -10.977474212646484, -10.568988800048828, -10.160503387451172, -9.752017974853516, -9.343531608581543, -8.935046195983887, -8.52656078338623, -8.118075370788574, -7.709589958190918, -7.301104545593262, -6.892618656158447, -6.484133243560791, -6.075647354125977, -5.66716194152832, -5.258676528930664, -4.850191116333008, -4.441705226898193, -4.033219814300537, -3.6247339248657227, -3.2162485122680664, -2.807762861251831, -2.3992772102355957, -1.9907917976379395, -1.582306146621704, -1.1738204956054688, -0.7653349041938782, -0.3568493127822876, 0.0516362190246582, 0.46012187004089355, 0.8686075210571289, 1.2770929336547852, 1.6855785846710205, 2.094064235687256, 2.502549886703491, 2.9110355377197266, 3.319520950317383, 3.728006601333618, 4.1364922523498535, 4.54497766494751, 4.953463554382324, 5.3619489669799805, 5.770434379577637, 6.178920269012451, 6.587405681610107, 6.995891571044922, 7.404376983642578, 7.812862396240234, 8.22134780883789, 8.629833221435547, 9.038318634033203, 9.44680404663086, 9.855289459228516, 10.263775825500488, 10.672261238098145, 11.0807466506958, 11.489232063293457, 11.89771842956543]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 7.0, 5.0, 6.0, 6.0, 5.0, 4.0, 12.0, 8.0, 10.0, 12.0, 11.0, 15.0, 16.0, 15.0, 20.0, 33.0, 36.0, 38.0, 31.0, 40.0, 37.0, 39.0, 38.0, 47.0, 39.0, 31.0, 38.0, 41.0, 34.0, 45.0, 37.0, 42.0, 28.0, 30.0, 25.0, 14.0, 15.0, 6.0, 18.0, 10.0, 14.0, 13.0, 12.0, 3.0, 6.0, 6.0, 4.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-9.541315078735352, -9.253632545471191, -8.965950012207031, -8.678268432617188, -8.390585899353027, -8.102903366088867, -7.815221309661865, -7.527539253234863, -7.239856719970703, -6.952174186706543, -6.664492130279541, -6.376810073852539, -6.089127540588379, -5.801445007324219, -5.513762950897217, -5.226080894470215, -4.938398361206055, -4.6507158279418945, -4.363033771514893, -4.075351715087891, -3.7876691818237305, -3.4999868869781494, -3.2123045921325684, -2.9246222972869873, -2.6369400024414062, -2.349257707595825, -2.061575412750244, -1.773893117904663, -1.486210823059082, -1.198528528213501, -0.9108462333679199, -0.6231639385223389, -0.3354816436767578, -0.04779934883117676, 0.2398829460144043, 0.5275652408599854, 0.8152475357055664, 1.1029298305511475, 1.3906121253967285, 1.6782944202423096, 1.9659767150878906, 2.2536590099334717, 2.5413413047790527, 2.829023599624634, 3.116705894470215, 3.404388189315796, 3.692070484161377, 3.979752779006958, 4.267435073852539, 4.555117607116699, 4.842799663543701, 5.130481719970703, 5.418164253234863, 5.705846786499023, 5.993528842926025, 6.281210899353027, 6.5688934326171875, 6.856575965881348, 7.14425802230835, 7.431940078735352, 7.719622611999512, 8.007305145263672, 8.294986724853516, 8.582669258117676, 8.870351791381836]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 5.0, 7.0, 10.0, 8.0, 15.0, 26.0, 49.0, 56.0, 116.0, 181.0, 298.0, 494.0, 895.0, 1580.0, 2672.0, 4993.0, 9245.0, 17285.0, 32923.0, 61636.0, 109065.0, 169931.0, 204632.0, 175910.0, 115427.0, 65791.0, 35035.0, 18288.0, 9749.0, 5328.0, 2858.0, 1732.0, 912.0, 534.0, 325.0, 205.0, 121.0, 81.0, 58.0, 24.0, 19.0, 13.0, 8.0, 8.0, 6.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.7265625, -7.49627685546875, -7.2659912109375, -7.03570556640625, -6.805419921875, -6.57513427734375, -6.3448486328125, -6.11456298828125, -5.88427734375, -5.65399169921875, -5.4237060546875, -5.19342041015625, -4.963134765625, -4.73284912109375, -4.5025634765625, -4.27227783203125, -4.0419921875, -3.81170654296875, -3.5814208984375, -3.35113525390625, -3.120849609375, -2.89056396484375, -2.6602783203125, -2.42999267578125, -2.19970703125, -1.96942138671875, -1.7391357421875, -1.50885009765625, -1.278564453125, -1.04827880859375, -0.8179931640625, -0.58770751953125, -0.357421875, -0.12713623046875, 0.1031494140625, 0.33343505859375, 0.563720703125, 0.79400634765625, 1.0242919921875, 1.25457763671875, 1.48486328125, 1.71514892578125, 1.9454345703125, 2.17572021484375, 2.406005859375, 2.63629150390625, 2.8665771484375, 3.09686279296875, 3.3271484375, 3.55743408203125, 3.7877197265625, 4.01800537109375, 4.248291015625, 4.47857666015625, 4.7088623046875, 4.93914794921875, 5.16943359375, 5.39971923828125, 5.6300048828125, 5.86029052734375, 6.090576171875, 6.32086181640625, 6.5511474609375, 6.78143310546875, 7.01171875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 1.0, 5.0, 6.0, 4.0, 9.0, 7.0, 3.0, 9.0, 7.0, 8.0, 7.0, 16.0, 12.0, 18.0, 20.0, 28.0, 26.0, 26.0, 29.0, 41.0, 37.0, 38.0, 35.0, 45.0, 26.0, 40.0, 39.0, 48.0, 38.0, 31.0, 37.0, 36.0, 36.0, 37.0, 32.0, 30.0, 19.0, 15.0, 21.0, 10.0, 8.0, 12.0, 12.0, 11.0, 11.0, 6.0, 2.0, 4.0, 4.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.75, -9.443115234375, -9.13623046875, -8.829345703125, -8.5224609375, -8.215576171875, -7.90869140625, -7.601806640625, -7.294921875, -6.988037109375, -6.68115234375, -6.374267578125, -6.0673828125, -5.760498046875, -5.45361328125, -5.146728515625, -4.83984375, -4.532958984375, -4.22607421875, -3.919189453125, -3.6123046875, -3.305419921875, -2.99853515625, -2.691650390625, -2.384765625, -2.077880859375, -1.77099609375, -1.464111328125, -1.1572265625, -0.850341796875, -0.54345703125, -0.236572265625, 0.0703125, 0.377197265625, 0.68408203125, 0.990966796875, 1.2978515625, 1.604736328125, 1.91162109375, 2.218505859375, 2.525390625, 2.832275390625, 3.13916015625, 3.446044921875, 3.7529296875, 4.059814453125, 4.36669921875, 4.673583984375, 4.98046875, 5.287353515625, 5.59423828125, 5.901123046875, 6.2080078125, 6.514892578125, 6.82177734375, 7.128662109375, 7.435546875, 7.742431640625, 8.04931640625, 8.356201171875, 8.6630859375, 8.969970703125, 9.27685546875, 9.583740234375, 9.890625]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 6.0, 7.0, 20.0, 10.0, 25.0, 37.0, 58.0, 87.0, 126.0, 214.0, 386.0, 637.0, 1179.0, 2197.0, 4358.0, 9042.0, 19944.0, 46456.0, 110054.0, 243794.0, 309272.0, 170891.0, 72740.0, 30619.0, 13366.0, 6168.0, 3091.0, 1562.0, 869.0, 543.0, 295.0, 174.0, 98.0, 81.0, 58.0, 30.0, 21.0, 18.0, 7.0, 5.0, 3.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.953125, -10.5655517578125, -10.177978515625, -9.7904052734375, -9.40283203125, -9.0152587890625, -8.627685546875, -8.2401123046875, -7.8525390625, -7.4649658203125, -7.077392578125, -6.6898193359375, -6.30224609375, -5.9146728515625, -5.527099609375, -5.1395263671875, -4.751953125, -4.3643798828125, -3.976806640625, -3.5892333984375, -3.20166015625, -2.8140869140625, -2.426513671875, -2.0389404296875, -1.6513671875, -1.2637939453125, -0.876220703125, -0.4886474609375, -0.10107421875, 0.2864990234375, 0.674072265625, 1.0616455078125, 1.44921875, 1.8367919921875, 2.224365234375, 2.6119384765625, 2.99951171875, 3.3870849609375, 3.774658203125, 4.1622314453125, 4.5498046875, 4.9373779296875, 5.324951171875, 5.7125244140625, 6.10009765625, 6.4876708984375, 6.875244140625, 7.2628173828125, 7.650390625, 8.0379638671875, 8.425537109375, 8.8131103515625, 9.20068359375, 9.5882568359375, 9.975830078125, 10.3634033203125, 10.7509765625, 11.1385498046875, 11.526123046875, 11.9136962890625, 12.30126953125, 12.6888427734375, 13.076416015625, 13.4639892578125, 13.8515625]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 7.0, 2.0, 11.0, 12.0, 9.0, 4.0, 7.0, 7.0, 18.0, 18.0, 14.0, 25.0, 22.0, 23.0, 37.0, 23.0, 29.0, 24.0, 29.0, 29.0, 42.0, 41.0, 24.0, 40.0, 36.0, 47.0, 39.0, 25.0, 44.0, 34.0, 35.0, 33.0, 35.0, 26.0, 20.0, 19.0, 15.0, 13.0, 13.0, 21.0, 10.0, 13.0, 9.0, 9.0, 8.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.91015625, -5.732666015625, -5.55517578125, -5.377685546875, -5.2001953125, -5.022705078125, -4.84521484375, -4.667724609375, -4.490234375, -4.312744140625, -4.13525390625, -3.957763671875, -3.7802734375, -3.602783203125, -3.42529296875, -3.247802734375, -3.0703125, -2.892822265625, -2.71533203125, -2.537841796875, -2.3603515625, -2.182861328125, -2.00537109375, -1.827880859375, -1.650390625, -1.472900390625, -1.29541015625, -1.117919921875, -0.9404296875, -0.762939453125, -0.58544921875, -0.407958984375, -0.23046875, -0.052978515625, 0.12451171875, 0.302001953125, 0.4794921875, 0.656982421875, 0.83447265625, 1.011962890625, 1.189453125, 1.366943359375, 1.54443359375, 1.721923828125, 1.8994140625, 2.076904296875, 2.25439453125, 2.431884765625, 2.609375, 2.786865234375, 2.96435546875, 3.141845703125, 3.3193359375, 3.496826171875, 3.67431640625, 3.851806640625, 4.029296875, 4.206787109375, 4.38427734375, 4.561767578125, 4.7392578125, 4.916748046875, 5.09423828125, 5.271728515625, 5.44921875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 12.0, 8.0, 10.0, 7.0, 13.0, 31.0, 51.0, 47.0, 60.0, 105.0, 138.0, 216.0, 313.0, 390.0, 636.0, 922.0, 1433.0, 2292.0, 3654.0, 5870.0, 9751.0, 16500.0, 28281.0, 49177.0, 85076.0, 139935.0, 197995.0, 190024.0, 129367.0, 77531.0, 44373.0, 25697.0, 14918.0, 9024.0, 5410.0, 3287.0, 2024.0, 1335.0, 818.0, 540.0, 384.0, 259.0, 183.0, 125.0, 91.0, 65.0, 51.0, 37.0, 34.0, 14.0, 13.0, 17.0, 6.0, 6.0, 5.0, 1.0, 2.0, 1.0], "bins": [-3.478515625, -3.372833251953125, -3.26715087890625, -3.161468505859375, -3.0557861328125, -2.950103759765625, -2.84442138671875, -2.738739013671875, -2.633056640625, -2.527374267578125, -2.42169189453125, -2.316009521484375, -2.2103271484375, -2.104644775390625, -1.99896240234375, -1.893280029296875, -1.78759765625, -1.681915283203125, -1.57623291015625, -1.470550537109375, -1.3648681640625, -1.259185791015625, -1.15350341796875, -1.047821044921875, -0.942138671875, -0.836456298828125, -0.73077392578125, -0.625091552734375, -0.5194091796875, -0.413726806640625, -0.30804443359375, -0.202362060546875, -0.0966796875, 0.009002685546875, 0.11468505859375, 0.220367431640625, 0.3260498046875, 0.431732177734375, 0.53741455078125, 0.643096923828125, 0.748779296875, 0.854461669921875, 0.96014404296875, 1.065826416015625, 1.1715087890625, 1.277191162109375, 1.38287353515625, 1.488555908203125, 1.59423828125, 1.699920654296875, 1.80560302734375, 1.911285400390625, 2.0169677734375, 2.122650146484375, 2.22833251953125, 2.334014892578125, 2.439697265625, 2.545379638671875, 2.65106201171875, 2.756744384765625, 2.8624267578125, 2.968109130859375, 3.07379150390625, 3.179473876953125, 3.28515625]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 6.0, 4.0, 2.0, 7.0, 11.0, 14.0, 14.0, 21.0, 24.0, 28.0, 31.0, 57.0, 52.0, 67.0, 59.0, 47.0, 54.0, 56.0, 52.0, 58.0, 42.0, 53.0, 46.0, 33.0, 22.0, 34.0, 14.0, 20.0, 17.0, 16.0, 8.0, 3.0, 5.0, 8.0, 8.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00016796588897705078, -0.00016265921294689178, -0.0001573525369167328, -0.0001520458608865738, -0.0001467391848564148, -0.0001414325088262558, -0.0001361258327960968, -0.0001308191567659378, -0.0001255124807357788, -0.00012020580470561981, -0.00011489912867546082, -0.00010959245264530182, -0.00010428577661514282, -9.897910058498383e-05, -9.367242455482483e-05, -8.836574852466583e-05, -8.305907249450684e-05, -7.775239646434784e-05, -7.244572043418884e-05, -6.713904440402985e-05, -6.183236837387085e-05, -5.652569234371185e-05, -5.1219016313552856e-05, -4.591234028339386e-05, -4.060566425323486e-05, -3.529898822307587e-05, -2.999231219291687e-05, -2.4685636162757874e-05, -1.9378960132598877e-05, -1.407228410243988e-05, -8.765608072280884e-06, -3.458932042121887e-06, 1.8477439880371094e-06, 7.154420018196106e-06, 1.2461096048355103e-05, 1.77677720785141e-05, 2.3074448108673096e-05, 2.8381124138832092e-05, 3.368780016899109e-05, 3.8994476199150085e-05, 4.430115222930908e-05, 4.960782825946808e-05, 5.4914504289627075e-05, 6.022118031978607e-05, 6.552785634994507e-05, 7.083453238010406e-05, 7.614120841026306e-05, 8.144788444042206e-05, 8.675456047058105e-05, 9.206123650074005e-05, 9.736791253089905e-05, 0.00010267458856105804, 0.00010798126459121704, 0.00011328794062137604, 0.00011859461665153503, 0.00012390129268169403, 0.00012920796871185303, 0.00013451464474201202, 0.00013982132077217102, 0.00014512799680233002, 0.00015043467283248901, 0.000155741348862648, 0.000161048024892807, 0.000166354700922966, 0.000171661376953125]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 7.0, 9.0, 11.0, 25.0, 36.0, 58.0, 83.0, 146.0, 195.0, 341.0, 500.0, 985.0, 1635.0, 3111.0, 6061.0, 12107.0, 24661.0, 50614.0, 98856.0, 168828.0, 220375.0, 197023.0, 126988.0, 68245.0, 33836.0, 16330.0, 8079.0, 4281.0, 2170.0, 1167.0, 678.0, 391.0, 267.0, 159.0, 116.0, 66.0, 40.0, 23.0, 16.0, 9.0, 14.0, 9.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.296875, -4.156982421875, -4.01708984375, -3.877197265625, -3.7373046875, -3.597412109375, -3.45751953125, -3.317626953125, -3.177734375, -3.037841796875, -2.89794921875, -2.758056640625, -2.6181640625, -2.478271484375, -2.33837890625, -2.198486328125, -2.05859375, -1.918701171875, -1.77880859375, -1.638916015625, -1.4990234375, -1.359130859375, -1.21923828125, -1.079345703125, -0.939453125, -0.799560546875, -0.65966796875, -0.519775390625, -0.3798828125, -0.239990234375, -0.10009765625, 0.039794921875, 0.1796875, 0.319580078125, 0.45947265625, 0.599365234375, 0.7392578125, 0.879150390625, 1.01904296875, 1.158935546875, 1.298828125, 1.438720703125, 1.57861328125, 1.718505859375, 1.8583984375, 1.998291015625, 2.13818359375, 2.278076171875, 2.41796875, 2.557861328125, 2.69775390625, 2.837646484375, 2.9775390625, 3.117431640625, 3.25732421875, 3.397216796875, 3.537109375, 3.677001953125, 3.81689453125, 3.956787109375, 4.0966796875, 4.236572265625, 4.37646484375, 4.516357421875, 4.65625]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 5.0, 8.0, 6.0, 8.0, 7.0, 15.0, 17.0, 15.0, 16.0, 24.0, 30.0, 27.0, 35.0, 26.0, 49.0, 46.0, 54.0, 54.0, 51.0, 53.0, 49.0, 42.0, 42.0, 53.0, 39.0, 43.0, 23.0, 34.0, 21.0, 19.0, 15.0, 13.0, 13.0, 10.0, 7.0, 15.0, 6.0, 8.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.107421875, -1.0760650634765625, -1.044708251953125, -1.0133514404296875, -0.98199462890625, -0.9506378173828125, -0.919281005859375, -0.8879241943359375, -0.8565673828125, -0.8252105712890625, -0.793853759765625, -0.7624969482421875, -0.73114013671875, -0.6997833251953125, -0.668426513671875, -0.6370697021484375, -0.605712890625, -0.5743560791015625, -0.542999267578125, -0.5116424560546875, -0.48028564453125, -0.4489288330078125, -0.417572021484375, -0.3862152099609375, -0.3548583984375, -0.3235015869140625, -0.292144775390625, -0.2607879638671875, -0.22943115234375, -0.1980743408203125, -0.166717529296875, -0.1353607177734375, -0.10400390625, -0.0726470947265625, -0.041290283203125, -0.0099334716796875, 0.02142333984375, 0.0527801513671875, 0.084136962890625, 0.1154937744140625, 0.1468505859375, 0.1782073974609375, 0.209564208984375, 0.2409210205078125, 0.27227783203125, 0.3036346435546875, 0.334991455078125, 0.3663482666015625, 0.397705078125, 0.4290618896484375, 0.460418701171875, 0.4917755126953125, 0.52313232421875, 0.5544891357421875, 0.585845947265625, 0.6172027587890625, 0.6485595703125, 0.6799163818359375, 0.711273193359375, 0.7426300048828125, 0.77398681640625, 0.8053436279296875, 0.836700439453125, 0.8680572509765625, 0.8994140625]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 8.0, 5.0, 9.0, 12.0, 5.0, 10.0, 15.0, 19.0, 16.0, 27.0, 30.0, 33.0, 29.0, 42.0, 35.0, 44.0, 51.0, 48.0, 58.0, 47.0, 56.0, 38.0, 51.0, 38.0, 36.0, 37.0, 30.0, 28.0, 34.0, 13.0, 22.0, 11.0, 11.0, 14.0, 6.0, 7.0, 4.0, 6.0, 0.0, 2.0, 7.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-13.258878707885742, -12.870595932006836, -12.482312202453613, -12.094029426574707, -11.705745697021484, -11.317462921142578, -10.929180145263672, -10.54089641571045, -10.152613639831543, -9.764330863952637, -9.376047134399414, -8.987764358520508, -8.599480628967285, -8.211197853088379, -7.8229146003723145, -7.43463134765625, -7.0463480949401855, -6.658064842224121, -6.269781589508057, -5.881498336791992, -5.493215560913086, -5.1049323081970215, -4.716649055480957, -4.328366279602051, -3.9400827884674072, -3.5517995357513428, -3.1635165214538574, -2.775233268737793, -2.3869500160217285, -1.9986670017242432, -1.6103837490081787, -1.2221007347106934, -0.8338174819946289, -0.4455343186855316, -0.057251155376434326, 0.33103203773498535, 0.7193151712417603, 1.1075983047485352, 1.4958815574645996, 1.884164571762085, 2.2724478244781494, 2.660731077194214, 3.049014091491699, 3.4372973442077637, 3.825580596923828, 4.213863372802734, 4.602147102355957, 4.990429878234863, 5.378713130950928, 5.766996383666992, 6.155279636383057, 6.543562889099121, 6.931845664978027, 7.320128917694092, 7.708412170410156, 8.096694946289062, 8.484978675842285, 8.873261451721191, 9.261545181274414, 9.64982795715332, 10.038111686706543, 10.42639446258545, 10.814678192138672, 11.202960968017578, 11.591243743896484]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 7.0, 7.0, 4.0, 6.0, 6.0, 5.0, 6.0, 10.0, 9.0, 7.0, 12.0, 10.0, 13.0, 15.0, 16.0, 20.0, 35.0, 38.0, 33.0, 34.0, 38.0, 32.0, 41.0, 39.0, 44.0, 41.0, 30.0, 40.0, 39.0, 41.0, 33.0, 42.0, 37.0, 28.0, 27.0, 28.0, 22.0, 13.0, 15.0, 7.0, 16.0, 14.0, 12.0, 13.0, 6.0, 5.0, 7.0, 4.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0], "bins": [-9.440264701843262, -9.157435417175293, -8.874605178833008, -8.591775894165039, -8.308945655822754, -8.026116371154785, -7.7432861328125, -7.460456848144531, -7.177626609802246, -6.894796848297119, -6.611967086791992, -6.329137325286865, -6.046307563781738, -5.763477802276611, -5.480648040771484, -5.197818756103516, -4.914988994598389, -4.632159233093262, -4.349329471588135, -4.066499710083008, -3.783669948577881, -3.500840187072754, -3.218010663986206, -2.935180902481079, -2.652351140975952, -2.369521379470825, -2.0866916179656982, -1.8038619756698608, -1.5210322141647339, -1.238202452659607, -0.9553728103637695, -0.6725430488586426, -0.3897132873535156, -0.10688355565071106, 0.1759461760520935, 0.4587758779525757, 0.7416056394577026, 1.0244354009628296, 1.307265043258667, 1.590094804763794, 1.872924566268921, 2.155754327774048, 2.438584089279175, 2.7214136123657227, 3.0042433738708496, 3.2870731353759766, 3.5699028968811035, 3.8527326583862305, 4.135562419891357, 4.418392181396484, 4.701221942901611, 4.984051704406738, 5.266881465911865, 5.549711227416992, 5.832540512084961, 6.115370750427246, 6.398200035095215, 6.681029796600342, 6.963859558105469, 7.246689319610596, 7.529519081115723, 7.81234884262085, 8.095178604125977, 8.378007888793945, 8.66083812713623]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 7.0, 13.0, 20.0, 30.0, 34.0, 54.0, 114.0, 162.0, 253.0, 411.0, 537.0, 904.0, 1331.0, 2028.0, 3208.0, 5021.0, 7827.0, 11830.0, 18557.0, 27573.0, 41294.0, 59460.0, 80701.0, 101539.0, 118042.0, 122573.0, 113347.0, 96074.0, 74610.0, 53787.0, 36970.0, 24769.0, 16079.0, 10540.0, 6628.0, 4248.0, 2802.0, 1752.0, 1152.0, 798.0, 496.0, 336.0, 220.0, 157.0, 90.0, 67.0, 46.0, 22.0, 24.0, 11.0, 6.0, 5.0, 2.0, 1.0, 2.0, 1.0], "bins": [-7.09765625, -6.88482666015625, -6.6719970703125, -6.45916748046875, -6.246337890625, -6.03350830078125, -5.8206787109375, -5.60784912109375, -5.39501953125, -5.18218994140625, -4.9693603515625, -4.75653076171875, -4.543701171875, -4.33087158203125, -4.1180419921875, -3.90521240234375, -3.6923828125, -3.47955322265625, -3.2667236328125, -3.05389404296875, -2.841064453125, -2.62823486328125, -2.4154052734375, -2.20257568359375, -1.98974609375, -1.77691650390625, -1.5640869140625, -1.35125732421875, -1.138427734375, -0.92559814453125, -0.7127685546875, -0.49993896484375, -0.287109375, -0.07427978515625, 0.1385498046875, 0.35137939453125, 0.564208984375, 0.77703857421875, 0.9898681640625, 1.20269775390625, 1.41552734375, 1.62835693359375, 1.8411865234375, 2.05401611328125, 2.266845703125, 2.47967529296875, 2.6925048828125, 2.90533447265625, 3.1181640625, 3.33099365234375, 3.5438232421875, 3.75665283203125, 3.969482421875, 4.18231201171875, 4.3951416015625, 4.60797119140625, 4.82080078125, 5.03363037109375, 5.2464599609375, 5.45928955078125, 5.672119140625, 5.88494873046875, 6.0977783203125, 6.31060791015625, 6.5234375]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 1.0, 4.0, 7.0, 7.0, 5.0, 5.0, 4.0, 13.0, 6.0, 6.0, 14.0, 13.0, 22.0, 17.0, 34.0, 27.0, 26.0, 43.0, 42.0, 38.0, 32.0, 41.0, 43.0, 35.0, 50.0, 36.0, 49.0, 44.0, 36.0, 45.0, 26.0, 39.0, 37.0, 23.0, 19.0, 16.0, 25.0, 9.0, 15.0, 13.0, 13.0, 9.0, 4.0, 3.0, 6.0, 1.0, 2.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.6640625, -10.3333740234375, -10.002685546875, -9.6719970703125, -9.34130859375, -9.0106201171875, -8.679931640625, -8.3492431640625, -8.0185546875, -7.6878662109375, -7.357177734375, -7.0264892578125, -6.69580078125, -6.3651123046875, -6.034423828125, -5.7037353515625, -5.373046875, -5.0423583984375, -4.711669921875, -4.3809814453125, -4.05029296875, -3.7196044921875, -3.388916015625, -3.0582275390625, -2.7275390625, -2.3968505859375, -2.066162109375, -1.7354736328125, -1.40478515625, -1.0740966796875, -0.743408203125, -0.4127197265625, -0.08203125, 0.2486572265625, 0.579345703125, 0.9100341796875, 1.24072265625, 1.5714111328125, 1.902099609375, 2.2327880859375, 2.5634765625, 2.8941650390625, 3.224853515625, 3.5555419921875, 3.88623046875, 4.2169189453125, 4.547607421875, 4.8782958984375, 5.208984375, 5.5396728515625, 5.870361328125, 6.2010498046875, 6.53173828125, 6.8624267578125, 7.193115234375, 7.5238037109375, 7.8544921875, 8.1851806640625, 8.515869140625, 8.8465576171875, 9.17724609375, 9.5079345703125, 9.838623046875, 10.1693115234375, 10.5]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 5.0, 17.0, 16.0, 34.0, 45.0, 51.0, 88.0, 146.0, 194.0, 335.0, 546.0, 845.0, 1296.0, 2018.0, 3222.0, 5084.0, 7953.0, 12514.0, 19833.0, 30906.0, 46760.0, 67944.0, 92393.0, 115353.0, 129363.0, 128110.0, 111246.0, 87237.0, 63727.0, 43146.0, 28360.0, 18327.0, 11598.0, 7257.0, 4533.0, 2864.0, 1878.0, 1173.0, 754.0, 442.0, 331.0, 214.0, 133.0, 86.0, 66.0, 34.0, 24.0, 13.0, 10.0, 16.0, 7.0, 3.0, 4.0, 2.0, 0.0, 2.0], "bins": [-7.6953125, -7.46142578125, -7.2275390625, -6.99365234375, -6.759765625, -6.52587890625, -6.2919921875, -6.05810546875, -5.82421875, -5.59033203125, -5.3564453125, -5.12255859375, -4.888671875, -4.65478515625, -4.4208984375, -4.18701171875, -3.953125, -3.71923828125, -3.4853515625, -3.25146484375, -3.017578125, -2.78369140625, -2.5498046875, -2.31591796875, -2.08203125, -1.84814453125, -1.6142578125, -1.38037109375, -1.146484375, -0.91259765625, -0.6787109375, -0.44482421875, -0.2109375, 0.02294921875, 0.2568359375, 0.49072265625, 0.724609375, 0.95849609375, 1.1923828125, 1.42626953125, 1.66015625, 1.89404296875, 2.1279296875, 2.36181640625, 2.595703125, 2.82958984375, 3.0634765625, 3.29736328125, 3.53125, 3.76513671875, 3.9990234375, 4.23291015625, 4.466796875, 4.70068359375, 4.9345703125, 5.16845703125, 5.40234375, 5.63623046875, 5.8701171875, 6.10400390625, 6.337890625, 6.57177734375, 6.8056640625, 7.03955078125, 7.2734375]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 6.0, 1.0, 4.0, 7.0, 6.0, 7.0, 4.0, 4.0, 9.0, 11.0, 16.0, 16.0, 21.0, 21.0, 18.0, 29.0, 35.0, 29.0, 20.0, 30.0, 36.0, 42.0, 36.0, 37.0, 44.0, 43.0, 35.0, 39.0, 41.0, 41.0, 45.0, 26.0, 31.0, 35.0, 28.0, 22.0, 29.0, 15.0, 15.0, 12.0, 13.0, 13.0, 14.0, 6.0, 4.0, 3.0, 0.0, 7.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.4609375, -6.25384521484375, -6.0467529296875, -5.83966064453125, -5.632568359375, -5.42547607421875, -5.2183837890625, -5.01129150390625, -4.80419921875, -4.59710693359375, -4.3900146484375, -4.18292236328125, -3.975830078125, -3.76873779296875, -3.5616455078125, -3.35455322265625, -3.1474609375, -2.94036865234375, -2.7332763671875, -2.52618408203125, -2.319091796875, -2.11199951171875, -1.9049072265625, -1.69781494140625, -1.49072265625, -1.28363037109375, -1.0765380859375, -0.86944580078125, -0.662353515625, -0.45526123046875, -0.2481689453125, -0.04107666015625, 0.166015625, 0.37310791015625, 0.5802001953125, 0.78729248046875, 0.994384765625, 1.20147705078125, 1.4085693359375, 1.61566162109375, 1.82275390625, 2.02984619140625, 2.2369384765625, 2.44403076171875, 2.651123046875, 2.85821533203125, 3.0653076171875, 3.27239990234375, 3.4794921875, 3.68658447265625, 3.8936767578125, 4.10076904296875, 4.307861328125, 4.51495361328125, 4.7220458984375, 4.92913818359375, 5.13623046875, 5.34332275390625, 5.5504150390625, 5.75750732421875, 5.964599609375, 6.17169189453125, 6.3787841796875, 6.58587646484375, 6.79296875]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 8.0, 3.0, 8.0, 14.0, 30.0, 26.0, 59.0, 68.0, 121.0, 195.0, 288.0, 420.0, 671.0, 1122.0, 1766.0, 2863.0, 4774.0, 7491.0, 12359.0, 19477.0, 30698.0, 46826.0, 69801.0, 95626.0, 120293.0, 134581.0, 131063.0, 111891.0, 85752.0, 60932.0, 40194.0, 25900.0, 16588.0, 9998.0, 6371.0, 3810.0, 2363.0, 1545.0, 904.0, 603.0, 400.0, 225.0, 128.0, 91.0, 67.0, 48.0, 31.0, 26.0, 13.0, 13.0, 6.0, 9.0, 3.0, 1.0, 1.0, 3.0], "bins": [-3.806640625, -3.694061279296875, -3.58148193359375, -3.468902587890625, -3.3563232421875, -3.243743896484375, -3.13116455078125, -3.018585205078125, -2.906005859375, -2.793426513671875, -2.68084716796875, -2.568267822265625, -2.4556884765625, -2.343109130859375, -2.23052978515625, -2.117950439453125, -2.00537109375, -1.892791748046875, -1.78021240234375, -1.667633056640625, -1.5550537109375, -1.442474365234375, -1.32989501953125, -1.217315673828125, -1.104736328125, -0.992156982421875, -0.87957763671875, -0.766998291015625, -0.6544189453125, -0.541839599609375, -0.42926025390625, -0.316680908203125, -0.2041015625, -0.091522216796875, 0.02105712890625, 0.133636474609375, 0.2462158203125, 0.358795166015625, 0.47137451171875, 0.583953857421875, 0.696533203125, 0.809112548828125, 0.92169189453125, 1.034271240234375, 1.1468505859375, 1.259429931640625, 1.37200927734375, 1.484588623046875, 1.59716796875, 1.709747314453125, 1.82232666015625, 1.934906005859375, 2.0474853515625, 2.160064697265625, 2.27264404296875, 2.385223388671875, 2.497802734375, 2.610382080078125, 2.72296142578125, 2.835540771484375, 2.9481201171875, 3.060699462890625, 3.17327880859375, 3.285858154296875, 3.3984375]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 2.0, 3.0, 10.0, 6.0, 10.0, 21.0, 20.0, 17.0, 19.0, 26.0, 35.0, 43.0, 52.0, 51.0, 59.0, 62.0, 65.0, 55.0, 60.0, 52.0, 46.0, 49.0, 51.0, 35.0, 24.0, 17.0, 23.0, 15.0, 8.0, 9.0, 11.0, 10.0, 8.0, 6.0, 2.0, 5.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.000453948974609375, -0.0004408732056617737, -0.00042779743671417236, -0.00041472166776657104, -0.0004016458988189697, -0.0003885701298713684, -0.0003754943609237671, -0.00036241859197616577, -0.00034934282302856445, -0.00033626705408096313, -0.0003231912851333618, -0.0003101155161857605, -0.0002970397472381592, -0.00028396397829055786, -0.00027088820934295654, -0.0002578124403953552, -0.0002447366714477539, -0.0002316609025001526, -0.00021858513355255127, -0.00020550936460494995, -0.00019243359565734863, -0.00017935782670974731, -0.000166282057762146, -0.00015320628881454468, -0.00014013051986694336, -0.00012705475091934204, -0.00011397898197174072, -0.0001009032130241394, -8.782744407653809e-05, -7.475167512893677e-05, -6.167590618133545e-05, -4.860013723373413e-05, -3.552436828613281e-05, -2.2448599338531494e-05, -9.372830390930176e-06, 3.7029385566711426e-06, 1.677870750427246e-05, 2.985447645187378e-05, 4.29302453994751e-05, 5.6006014347076416e-05, 6.908178329467773e-05, 8.215755224227905e-05, 9.523332118988037e-05, 0.00010830909013748169, 0.00012138485908508301, 0.00013446062803268433, 0.00014753639698028564, 0.00016061216592788696, 0.00017368793487548828, 0.0001867637038230896, 0.00019983947277069092, 0.00021291524171829224, 0.00022599101066589355, 0.00023906677961349487, 0.0002521425485610962, 0.0002652183175086975, 0.00027829408645629883, 0.00029136985540390015, 0.00030444562435150146, 0.0003175213932991028, 0.0003305971622467041, 0.0003436729311943054, 0.00035674870014190674, 0.00036982446908950806, 0.0003829002380371094]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 4.0, 3.0, 4.0, 15.0, 21.0, 29.0, 39.0, 78.0, 105.0, 211.0, 307.0, 528.0, 842.0, 1394.0, 2310.0, 3946.0, 6743.0, 10884.0, 17939.0, 28870.0, 45484.0, 67596.0, 94103.0, 119484.0, 134954.0, 133577.0, 115144.0, 89248.0, 63444.0, 42271.0, 26847.0, 16813.0, 9957.0, 6153.0, 3686.0, 2126.0, 1313.0, 809.0, 497.0, 279.0, 195.0, 109.0, 69.0, 59.0, 32.0, 19.0, 8.0, 6.0, 2.0, 7.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-3.919921875, -3.804351806640625, -3.68878173828125, -3.573211669921875, -3.4576416015625, -3.342071533203125, -3.22650146484375, -3.110931396484375, -2.995361328125, -2.879791259765625, -2.76422119140625, -2.648651123046875, -2.5330810546875, -2.417510986328125, -2.30194091796875, -2.186370849609375, -2.07080078125, -1.955230712890625, -1.83966064453125, -1.724090576171875, -1.6085205078125, -1.492950439453125, -1.37738037109375, -1.261810302734375, -1.146240234375, -1.030670166015625, -0.91510009765625, -0.799530029296875, -0.6839599609375, -0.568389892578125, -0.45281982421875, -0.337249755859375, -0.2216796875, -0.106109619140625, 0.00946044921875, 0.125030517578125, 0.2406005859375, 0.356170654296875, 0.47174072265625, 0.587310791015625, 0.702880859375, 0.818450927734375, 0.93402099609375, 1.049591064453125, 1.1651611328125, 1.280731201171875, 1.39630126953125, 1.511871337890625, 1.62744140625, 1.743011474609375, 1.85858154296875, 1.974151611328125, 2.0897216796875, 2.205291748046875, 2.32086181640625, 2.436431884765625, 2.552001953125, 2.667572021484375, 2.78314208984375, 2.898712158203125, 3.0142822265625, 3.129852294921875, 3.24542236328125, 3.360992431640625, 3.4765625]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 8.0, 7.0, 15.0, 13.0, 12.0, 25.0, 26.0, 31.0, 45.0, 50.0, 50.0, 53.0, 58.0, 54.0, 58.0, 62.0, 44.0, 61.0, 42.0, 52.0, 36.0, 37.0, 20.0, 41.0, 18.0, 19.0, 15.0, 13.0, 7.0, 3.0, 5.0, 6.0, 6.0, 6.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.501953125, -1.4488525390625, -1.395751953125, -1.3426513671875, -1.28955078125, -1.2364501953125, -1.183349609375, -1.1302490234375, -1.0771484375, -1.0240478515625, -0.970947265625, -0.9178466796875, -0.86474609375, -0.8116455078125, -0.758544921875, -0.7054443359375, -0.65234375, -0.5992431640625, -0.546142578125, -0.4930419921875, -0.43994140625, -0.3868408203125, -0.333740234375, -0.2806396484375, -0.2275390625, -0.1744384765625, -0.121337890625, -0.0682373046875, -0.01513671875, 0.0379638671875, 0.091064453125, 0.1441650390625, 0.197265625, 0.2503662109375, 0.303466796875, 0.3565673828125, 0.40966796875, 0.4627685546875, 0.515869140625, 0.5689697265625, 0.6220703125, 0.6751708984375, 0.728271484375, 0.7813720703125, 0.83447265625, 0.8875732421875, 0.940673828125, 0.9937744140625, 1.046875, 1.0999755859375, 1.153076171875, 1.2061767578125, 1.25927734375, 1.3123779296875, 1.365478515625, 1.4185791015625, 1.4716796875, 1.5247802734375, 1.577880859375, 1.6309814453125, 1.68408203125, 1.7371826171875, 1.790283203125, 1.8433837890625, 1.896484375]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 4.0, 4.0, 4.0, 11.0, 6.0, 11.0, 14.0, 16.0, 14.0, 16.0, 27.0, 31.0, 35.0, 31.0, 35.0, 46.0, 41.0, 40.0, 48.0, 52.0, 44.0, 50.0, 46.0, 47.0, 35.0, 37.0, 35.0, 38.0, 32.0, 20.0, 25.0, 18.0, 18.0, 11.0, 10.0, 11.0, 5.0, 11.0, 7.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-12.742839813232422, -12.358771324157715, -11.974701881408691, -11.590633392333984, -11.206563949584961, -10.822495460510254, -10.43842601776123, -10.054357528686523, -9.6702880859375, -9.286219596862793, -8.90215015411377, -8.518081665039062, -8.134012222290039, -7.749943256378174, -7.365874290466309, -6.981805801391602, -6.597736835479736, -6.213667869567871, -5.829598903656006, -5.445529937744141, -5.061460971832275, -4.67739200592041, -4.293323516845703, -3.909254312515259, -3.5251853466033936, -3.1411163806915283, -2.757047414779663, -2.372978687286377, -1.9889096021652222, -1.604840636253357, -1.2207717895507812, -0.836702823638916, -0.4526338577270508, -0.06856492161750793, 0.3155040144920349, 0.6995729207992554, 1.0836418867111206, 1.4677108526229858, 1.8517796993255615, 2.2358486652374268, 2.619917631149292, 3.0039865970611572, 3.3880555629730225, 3.7721242904663086, 4.156193256378174, 4.540262222290039, 4.924331188201904, 5.3084001541137695, 5.692469120025635, 6.0765380859375, 6.460607051849365, 6.8446760177612305, 7.228744983673096, 7.612813949584961, 7.996882438659668, 8.380951881408691, 8.765020370483398, 9.149088859558105, 9.533158302307129, 9.917226791381836, 10.30129623413086, 10.685364723205566, 11.06943416595459, 11.453502655029297, 11.83757209777832]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 5.0, 5.0, 5.0, 7.0, 9.0, 8.0, 6.0, 13.0, 23.0, 11.0, 11.0, 15.0, 23.0, 23.0, 33.0, 24.0, 30.0, 28.0, 40.0, 34.0, 40.0, 31.0, 43.0, 44.0, 34.0, 45.0, 34.0, 42.0, 35.0, 42.0, 29.0, 34.0, 24.0, 27.0, 34.0, 11.0, 28.0, 11.0, 13.0, 12.0, 6.0, 12.0, 3.0, 6.0, 4.0, 3.0, 1.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.63618278503418, -9.311650276184082, -8.987116813659668, -8.66258430480957, -8.338051795959473, -8.013519287109375, -7.688985824584961, -7.364453315734863, -7.039920806884766, -6.71538782119751, -6.390855312347412, -6.066322326660156, -5.741789817810059, -5.417256832122803, -5.092723846435547, -4.768191337585449, -4.443658351898193, -4.1191253662109375, -3.79459285736084, -3.470059871673584, -3.1455273628234863, -2.8209943771362305, -2.4964616298675537, -2.171928882598877, -1.8473961353302002, -1.5228633880615234, -1.1983306407928467, -0.8737977743148804, -0.5492650270462036, -0.22473227977752686, 0.09980058670043945, 0.4243333339691162, 0.748866081237793, 1.0733988285064697, 1.3979315757751465, 1.7224644422531128, 2.0469970703125, 2.371530055999756, 2.6960628032684326, 3.0205955505371094, 3.345128297805786, 3.669661045074463, 3.9941937923431396, 4.318726539611816, 4.643259525299072, 4.96779203414917, 5.292325019836426, 5.616857528686523, 5.941390514373779, 6.265923500061035, 6.590456008911133, 6.914988994598389, 7.239521503448486, 7.564054489135742, 7.88858699798584, 8.213119506835938, 8.537652969360352, 8.86218547821045, 9.186718940734863, 9.511251449584961, 9.835783958435059, 10.160316467285156, 10.48484992980957, 10.809382438659668, 11.133914947509766]}, "gradients/decoder.bert.encoder.layer.3.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 12.0, 8.0, 20.0, 28.0, 45.0, 75.0, 104.0, 162.0, 282.0, 392.0, 632.0, 1078.0, 1736.0, 2788.0, 4719.0, 8120.0, 14810.0, 26804.0, 51242.0, 100562.0, 201512.0, 397875.0, 699301.0, 922894.0, 787594.0, 474858.0, 245218.0, 120864.0, 61066.0, 31585.0, 16209.0, 9054.0, 4894.0, 2896.0, 1798.0, 1094.0, 651.0, 438.0, 281.0, 199.0, 110.0, 83.0, 55.0, 48.0, 23.0, 21.0, 18.0, 12.0, 8.0, 7.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.84375, -13.376708984375, -12.90966796875, -12.442626953125, -11.9755859375, -11.508544921875, -11.04150390625, -10.574462890625, -10.107421875, -9.640380859375, -9.17333984375, -8.706298828125, -8.2392578125, -7.772216796875, -7.30517578125, -6.838134765625, -6.37109375, -5.904052734375, -5.43701171875, -4.969970703125, -4.5029296875, -4.035888671875, -3.56884765625, -3.101806640625, -2.634765625, -2.167724609375, -1.70068359375, -1.233642578125, -0.7666015625, -0.299560546875, 0.16748046875, 0.634521484375, 1.1015625, 1.568603515625, 2.03564453125, 2.502685546875, 2.9697265625, 3.436767578125, 3.90380859375, 4.370849609375, 4.837890625, 5.304931640625, 5.77197265625, 6.239013671875, 6.7060546875, 7.173095703125, 7.64013671875, 8.107177734375, 8.57421875, 9.041259765625, 9.50830078125, 9.975341796875, 10.4423828125, 10.909423828125, 11.37646484375, 11.843505859375, 12.310546875, 12.777587890625, 13.24462890625, 13.711669921875, 14.1787109375, 14.645751953125, 15.11279296875, 15.579833984375, 16.046875]}, "gradients/decoder.bert.encoder.layer.3.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 7.0, 4.0, 8.0, 10.0, 11.0, 5.0, 14.0, 11.0, 13.0, 12.0, 16.0, 23.0, 25.0, 22.0, 22.0, 28.0, 37.0, 28.0, 42.0, 35.0, 48.0, 42.0, 47.0, 37.0, 34.0, 40.0, 41.0, 40.0, 40.0, 32.0, 31.0, 32.0, 28.0, 15.0, 30.0, 17.0, 13.0, 13.0, 10.0, 13.0, 4.0, 5.0, 8.0, 8.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.0, -7.7410888671875, -7.482177734375, -7.2232666015625, -6.96435546875, -6.7054443359375, -6.446533203125, -6.1876220703125, -5.9287109375, -5.6697998046875, -5.410888671875, -5.1519775390625, -4.89306640625, -4.6341552734375, -4.375244140625, -4.1163330078125, -3.857421875, -3.5985107421875, -3.339599609375, -3.0806884765625, -2.82177734375, -2.5628662109375, -2.303955078125, -2.0450439453125, -1.7861328125, -1.5272216796875, -1.268310546875, -1.0093994140625, -0.75048828125, -0.4915771484375, -0.232666015625, 0.0262451171875, 0.28515625, 0.5440673828125, 0.802978515625, 1.0618896484375, 1.32080078125, 1.5797119140625, 1.838623046875, 2.0975341796875, 2.3564453125, 2.6153564453125, 2.874267578125, 3.1331787109375, 3.39208984375, 3.6510009765625, 3.909912109375, 4.1688232421875, 4.427734375, 4.6866455078125, 4.945556640625, 5.2044677734375, 5.46337890625, 5.7222900390625, 5.981201171875, 6.2401123046875, 6.4990234375, 6.7579345703125, 7.016845703125, 7.2757568359375, 7.53466796875, 7.7935791015625, 8.052490234375, 8.3114013671875, 8.5703125]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 4.0, 4.0, 14.0, 24.0, 26.0, 43.0, 58.0, 83.0, 148.0, 219.0, 375.0, 613.0, 961.0, 1571.0, 2673.0, 4691.0, 8161.0, 15369.0, 28300.0, 53908.0, 102935.0, 193480.0, 345911.0, 559467.0, 751554.0, 758976.0, 575571.0, 358487.0, 200883.0, 107277.0, 56369.0, 29823.0, 15778.0, 8621.0, 4871.0, 2809.0, 1595.0, 952.0, 614.0, 390.0, 233.0, 177.0, 99.0, 62.0, 35.0, 18.0, 20.0, 17.0, 7.0, 6.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.6640625, -14.1915283203125, -13.718994140625, -13.2464599609375, -12.77392578125, -12.3013916015625, -11.828857421875, -11.3563232421875, -10.8837890625, -10.4112548828125, -9.938720703125, -9.4661865234375, -8.99365234375, -8.5211181640625, -8.048583984375, -7.5760498046875, -7.103515625, -6.6309814453125, -6.158447265625, -5.6859130859375, -5.21337890625, -4.7408447265625, -4.268310546875, -3.7957763671875, -3.3232421875, -2.8507080078125, -2.378173828125, -1.9056396484375, -1.43310546875, -0.9605712890625, -0.488037109375, -0.0155029296875, 0.45703125, 0.9295654296875, 1.402099609375, 1.8746337890625, 2.34716796875, 2.8197021484375, 3.292236328125, 3.7647705078125, 4.2373046875, 4.7098388671875, 5.182373046875, 5.6549072265625, 6.12744140625, 6.5999755859375, 7.072509765625, 7.5450439453125, 8.017578125, 8.4901123046875, 8.962646484375, 9.4351806640625, 9.90771484375, 10.3802490234375, 10.852783203125, 11.3253173828125, 11.7978515625, 12.2703857421875, 12.742919921875, 13.2154541015625, 13.68798828125, 14.1605224609375, 14.633056640625, 15.1055908203125, 15.578125]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 4.0, 0.0, 3.0, 1.0, 3.0, 8.0, 7.0, 13.0, 6.0, 20.0, 12.0, 22.0, 25.0, 33.0, 39.0, 49.0, 57.0, 75.0, 107.0, 104.0, 115.0, 145.0, 144.0, 160.0, 178.0, 204.0, 186.0, 193.0, 222.0, 222.0, 222.0, 213.0, 192.0, 177.0, 151.0, 145.0, 93.0, 102.0, 82.0, 83.0, 60.0, 51.0, 33.0, 25.0, 25.0, 20.0, 11.0, 10.0, 10.0, 4.0, 4.0, 4.0, 2.0, 4.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.26953125, -4.13360595703125, -3.9976806640625, -3.86175537109375, -3.725830078125, -3.58990478515625, -3.4539794921875, -3.31805419921875, -3.18212890625, -3.04620361328125, -2.9102783203125, -2.77435302734375, -2.638427734375, -2.50250244140625, -2.3665771484375, -2.23065185546875, -2.0947265625, -1.95880126953125, -1.8228759765625, -1.68695068359375, -1.551025390625, -1.41510009765625, -1.2791748046875, -1.14324951171875, -1.00732421875, -0.87139892578125, -0.7354736328125, -0.59954833984375, -0.463623046875, -0.32769775390625, -0.1917724609375, -0.05584716796875, 0.080078125, 0.21600341796875, 0.3519287109375, 0.48785400390625, 0.623779296875, 0.75970458984375, 0.8956298828125, 1.03155517578125, 1.16748046875, 1.30340576171875, 1.4393310546875, 1.57525634765625, 1.711181640625, 1.84710693359375, 1.9830322265625, 2.11895751953125, 2.2548828125, 2.39080810546875, 2.5267333984375, 2.66265869140625, 2.798583984375, 2.93450927734375, 3.0704345703125, 3.20635986328125, 3.34228515625, 3.47821044921875, 3.6141357421875, 3.75006103515625, 3.885986328125, 4.02191162109375, 4.1578369140625, 4.29376220703125, 4.4296875]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 7.0, 6.0, 14.0, 10.0, 12.0, 21.0, 24.0, 24.0, 38.0, 34.0, 30.0, 39.0, 46.0, 54.0, 62.0, 59.0, 68.0, 61.0, 48.0, 48.0, 51.0, 37.0, 40.0, 27.0, 32.0, 27.0, 19.0, 14.0, 7.0, 9.0, 7.0, 3.0, 5.0, 9.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.830389022827148, -13.32155704498291, -12.812725067138672, -12.303893089294434, -11.795061111450195, -11.28622817993164, -10.777396202087402, -10.268564224243164, -9.759732246398926, -9.250900268554688, -8.74206829071045, -8.233236312866211, -7.7244038581848145, -7.215571880340576, -6.70673942565918, -6.197907447814941, -5.689075469970703, -5.180243492126465, -4.671411514282227, -4.16257905960083, -3.653747081756592, -3.1449151039123535, -2.636082887649536, -2.1272506713867188, -1.6184186935424805, -1.1095865964889526, -0.6007544994354248, -0.09192240238189697, 0.41690969467163086, 0.9257416725158691, 1.4345738887786865, 1.943406105041504, 2.452239990234375, 2.9610719680786133, 3.4699041843414307, 3.978736400604248, 4.487568378448486, 4.996400356292725, 5.505232810974121, 6.014064788818359, 6.522896766662598, 7.031728744506836, 7.540560722351074, 8.049392700195312, 8.558225631713867, 9.067056655883789, 9.575889587402344, 10.084721565246582, 10.59355354309082, 11.102385520935059, 11.611217498779297, 12.120049476623535, 12.628881454467773, 13.137714385986328, 13.646546363830566, 14.155378341674805, 14.664210319519043, 15.173042297363281, 15.68187427520752, 16.190706253051758, 16.699539184570312, 17.208370208740234, 17.71720314025879, 18.226036071777344, 18.734867095947266]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 3.0, 9.0, 8.0, 4.0, 12.0, 14.0, 10.0, 17.0, 12.0, 23.0, 19.0, 26.0, 17.0, 21.0, 29.0, 26.0, 36.0, 38.0, 44.0, 51.0, 28.0, 40.0, 44.0, 54.0, 49.0, 29.0, 34.0, 41.0, 27.0, 30.0, 30.0, 26.0, 19.0, 19.0, 14.0, 20.0, 18.0, 13.0, 8.0, 13.0, 9.0, 5.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-10.03309154510498, -9.698530197143555, -9.363967895507812, -9.029406547546387, -8.694845199584961, -8.360282897949219, -8.025721549987793, -7.691159725189209, -7.356597900390625, -7.022036075592041, -6.687474250793457, -6.352912902832031, -6.018351078033447, -5.683789253234863, -5.3492279052734375, -5.0146660804748535, -4.6801042556762695, -4.3455424308776855, -4.010980606079102, -3.676419258117676, -3.341857433319092, -3.007295608520508, -2.672734022140503, -2.338172435760498, -2.003610610961914, -1.6690489053726196, -1.3344871997833252, -0.9999254941940308, -0.6653637886047363, -0.3308020830154419, 0.003759622573852539, 0.3383212089538574, 0.6728830337524414, 1.0074447393417358, 1.3420064449310303, 1.6765681505203247, 2.011129856109619, 2.345691680908203, 2.680253267288208, 3.014814853668213, 3.349376678466797, 3.683938503265381, 4.018500328063965, 4.353061676025391, 4.687623500823975, 5.022185325622559, 5.356746673583984, 5.691308498382568, 6.025870323181152, 6.360432147979736, 6.69499397277832, 7.029555320739746, 7.36411714553833, 7.698678970336914, 8.03324031829834, 8.367801666259766, 8.702363967895508, 9.036925315856934, 9.371487617492676, 9.706048965454102, 10.040611267089844, 10.37517261505127, 10.709733963012695, 11.044296264648438, 11.378857612609863]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 6.0, 3.0, 11.0, 10.0, 22.0, 21.0, 27.0, 54.0, 62.0, 115.0, 196.0, 279.0, 466.0, 683.0, 1145.0, 1975.0, 3301.0, 5399.0, 9242.0, 15999.0, 26981.0, 45177.0, 73031.0, 110781.0, 147804.0, 163609.0, 147737.0, 110619.0, 72800.0, 44989.0, 26979.0, 15810.0, 9380.0, 5491.0, 3300.0, 1901.0, 1193.0, 728.0, 441.0, 289.0, 164.0, 117.0, 66.0, 54.0, 40.0, 16.0, 16.0, 8.0, 8.0, 5.0, 7.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.61328125, -6.4033203125, -6.193359375, -5.9833984375, -5.7734375, -5.5634765625, -5.353515625, -5.1435546875, -4.93359375, -4.7236328125, -4.513671875, -4.3037109375, -4.09375, -3.8837890625, -3.673828125, -3.4638671875, -3.25390625, -3.0439453125, -2.833984375, -2.6240234375, -2.4140625, -2.2041015625, -1.994140625, -1.7841796875, -1.57421875, -1.3642578125, -1.154296875, -0.9443359375, -0.734375, -0.5244140625, -0.314453125, -0.1044921875, 0.10546875, 0.3154296875, 0.525390625, 0.7353515625, 0.9453125, 1.1552734375, 1.365234375, 1.5751953125, 1.78515625, 1.9951171875, 2.205078125, 2.4150390625, 2.625, 2.8349609375, 3.044921875, 3.2548828125, 3.46484375, 3.6748046875, 3.884765625, 4.0947265625, 4.3046875, 4.5146484375, 4.724609375, 4.9345703125, 5.14453125, 5.3544921875, 5.564453125, 5.7744140625, 5.984375, 6.1943359375, 6.404296875, 6.6142578125, 6.82421875]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 8.0, 5.0, 9.0, 8.0, 4.0, 12.0, 16.0, 24.0, 13.0, 14.0, 16.0, 34.0, 27.0, 43.0, 43.0, 32.0, 40.0, 39.0, 43.0, 47.0, 53.0, 54.0, 35.0, 52.0, 43.0, 35.0, 28.0, 29.0, 29.0, 33.0, 17.0, 23.0, 24.0, 15.0, 19.0, 8.0, 10.0, 6.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-13.421875, -13.0181884765625, -12.614501953125, -12.2108154296875, -11.80712890625, -11.4034423828125, -10.999755859375, -10.5960693359375, -10.1923828125, -9.7886962890625, -9.385009765625, -8.9813232421875, -8.57763671875, -8.1739501953125, -7.770263671875, -7.3665771484375, -6.962890625, -6.5592041015625, -6.155517578125, -5.7518310546875, -5.34814453125, -4.9444580078125, -4.540771484375, -4.1370849609375, -3.7333984375, -3.3297119140625, -2.926025390625, -2.5223388671875, -2.11865234375, -1.7149658203125, -1.311279296875, -0.9075927734375, -0.50390625, -0.1002197265625, 0.303466796875, 0.7071533203125, 1.11083984375, 1.5145263671875, 1.918212890625, 2.3218994140625, 2.7255859375, 3.1292724609375, 3.532958984375, 3.9366455078125, 4.34033203125, 4.7440185546875, 5.147705078125, 5.5513916015625, 5.955078125, 6.3587646484375, 6.762451171875, 7.1661376953125, 7.56982421875, 7.9735107421875, 8.377197265625, 8.7808837890625, 9.1845703125, 9.5882568359375, 9.991943359375, 10.3956298828125, 10.79931640625, 11.2030029296875, 11.606689453125, 12.0103759765625, 12.4140625]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 2.0, 6.0, 13.0, 23.0, 18.0, 33.0, 46.0, 47.0, 83.0, 99.0, 147.0, 197.0, 278.0, 399.0, 572.0, 852.0, 1189.0, 1775.0, 2675.0, 4119.0, 6692.0, 11046.0, 19215.0, 34040.0, 62894.0, 114688.0, 190051.0, 224188.0, 162106.0, 92214.0, 50094.0, 27588.0, 15558.0, 9272.0, 5556.0, 3620.0, 2250.0, 1478.0, 1049.0, 672.0, 479.0, 370.0, 252.0, 169.0, 124.0, 100.0, 65.0, 41.0, 41.0, 27.0, 15.0, 10.0, 7.0, 10.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.3125, -9.00537109375, -8.6982421875, -8.39111328125, -8.083984375, -7.77685546875, -7.4697265625, -7.16259765625, -6.85546875, -6.54833984375, -6.2412109375, -5.93408203125, -5.626953125, -5.31982421875, -5.0126953125, -4.70556640625, -4.3984375, -4.09130859375, -3.7841796875, -3.47705078125, -3.169921875, -2.86279296875, -2.5556640625, -2.24853515625, -1.94140625, -1.63427734375, -1.3271484375, -1.02001953125, -0.712890625, -0.40576171875, -0.0986328125, 0.20849609375, 0.515625, 0.82275390625, 1.1298828125, 1.43701171875, 1.744140625, 2.05126953125, 2.3583984375, 2.66552734375, 2.97265625, 3.27978515625, 3.5869140625, 3.89404296875, 4.201171875, 4.50830078125, 4.8154296875, 5.12255859375, 5.4296875, 5.73681640625, 6.0439453125, 6.35107421875, 6.658203125, 6.96533203125, 7.2724609375, 7.57958984375, 7.88671875, 8.19384765625, 8.5009765625, 8.80810546875, 9.115234375, 9.42236328125, 9.7294921875, 10.03662109375, 10.34375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 5.0, 7.0, 5.0, 4.0, 12.0, 9.0, 10.0, 11.0, 15.0, 9.0, 23.0, 33.0, 33.0, 28.0, 27.0, 33.0, 32.0, 41.0, 35.0, 40.0, 44.0, 40.0, 65.0, 36.0, 39.0, 28.0, 36.0, 39.0, 28.0, 21.0, 25.0, 29.0, 22.0, 22.0, 18.0, 18.0, 28.0, 13.0, 12.0, 6.0, 4.0, 5.0, 4.0, 2.0, 2.0, 3.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.9921875, -6.7708740234375, -6.549560546875, -6.3282470703125, -6.10693359375, -5.8856201171875, -5.664306640625, -5.4429931640625, -5.2216796875, -5.0003662109375, -4.779052734375, -4.5577392578125, -4.33642578125, -4.1151123046875, -3.893798828125, -3.6724853515625, -3.451171875, -3.2298583984375, -3.008544921875, -2.7872314453125, -2.56591796875, -2.3446044921875, -2.123291015625, -1.9019775390625, -1.6806640625, -1.4593505859375, -1.238037109375, -1.0167236328125, -0.79541015625, -0.5740966796875, -0.352783203125, -0.1314697265625, 0.08984375, 0.3111572265625, 0.532470703125, 0.7537841796875, 0.97509765625, 1.1964111328125, 1.417724609375, 1.6390380859375, 1.8603515625, 2.0816650390625, 2.302978515625, 2.5242919921875, 2.74560546875, 2.9669189453125, 3.188232421875, 3.4095458984375, 3.630859375, 3.8521728515625, 4.073486328125, 4.2947998046875, 4.51611328125, 4.7374267578125, 4.958740234375, 5.1800537109375, 5.4013671875, 5.6226806640625, 5.843994140625, 6.0653076171875, 6.28662109375, 6.5079345703125, 6.729248046875, 6.9505615234375, 7.171875]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 10.0, 10.0, 9.0, 29.0, 34.0, 69.0, 83.0, 103.0, 193.0, 296.0, 445.0, 706.0, 1090.0, 1837.0, 2881.0, 4741.0, 7842.0, 13171.0, 22066.0, 36898.0, 62636.0, 104081.0, 158966.0, 195025.0, 163796.0, 108440.0, 65895.0, 39026.0, 23196.0, 13674.0, 8198.0, 4943.0, 2986.0, 1915.0, 1241.0, 775.0, 445.0, 284.0, 184.0, 138.0, 89.0, 38.0, 26.0, 17.0, 12.0, 9.0, 4.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.90234375, -3.77862548828125, -3.6549072265625, -3.53118896484375, -3.407470703125, -3.28375244140625, -3.1600341796875, -3.03631591796875, -2.91259765625, -2.78887939453125, -2.6651611328125, -2.54144287109375, -2.417724609375, -2.29400634765625, -2.1702880859375, -2.04656982421875, -1.9228515625, -1.79913330078125, -1.6754150390625, -1.55169677734375, -1.427978515625, -1.30426025390625, -1.1805419921875, -1.05682373046875, -0.93310546875, -0.80938720703125, -0.6856689453125, -0.56195068359375, -0.438232421875, -0.31451416015625, -0.1907958984375, -0.06707763671875, 0.056640625, 0.18035888671875, 0.3040771484375, 0.42779541015625, 0.551513671875, 0.67523193359375, 0.7989501953125, 0.92266845703125, 1.04638671875, 1.17010498046875, 1.2938232421875, 1.41754150390625, 1.541259765625, 1.66497802734375, 1.7886962890625, 1.91241455078125, 2.0361328125, 2.15985107421875, 2.2835693359375, 2.40728759765625, 2.531005859375, 2.65472412109375, 2.7784423828125, 2.90216064453125, 3.02587890625, 3.14959716796875, 3.2733154296875, 3.39703369140625, 3.520751953125, 3.64447021484375, 3.7681884765625, 3.89190673828125, 4.015625]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 1.0, 5.0, 6.0, 4.0, 9.0, 12.0, 9.0, 17.0, 18.0, 19.0, 27.0, 29.0, 28.0, 59.0, 52.0, 51.0, 64.0, 55.0, 54.0, 65.0, 56.0, 59.0, 46.0, 51.0, 41.0, 31.0, 30.0, 16.0, 23.0, 18.0, 17.0, 9.0, 5.0, 5.0, 5.0, 5.0, 1.0, 4.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00019788742065429688, -0.00019199401140213013, -0.00018610060214996338, -0.00018020719289779663, -0.00017431378364562988, -0.00016842037439346313, -0.0001625269651412964, -0.00015663355588912964, -0.0001507401466369629, -0.00014484673738479614, -0.0001389533281326294, -0.00013305991888046265, -0.0001271665096282959, -0.00012127310037612915, -0.0001153796911239624, -0.00010948628187179565, -0.0001035928726196289, -9.769946336746216e-05, -9.180605411529541e-05, -8.591264486312866e-05, -8.001923561096191e-05, -7.412582635879517e-05, -6.823241710662842e-05, -6.233900785446167e-05, -5.644559860229492e-05, -5.0552189350128174e-05, -4.4658780097961426e-05, -3.876537084579468e-05, -3.287196159362793e-05, -2.697855234146118e-05, -2.1085143089294434e-05, -1.5191733837127686e-05, -9.298324584960938e-06, -3.4049153327941895e-06, 2.4884939193725586e-06, 8.381903171539307e-06, 1.4275312423706055e-05, 2.0168721675872803e-05, 2.606213092803955e-05, 3.19555401802063e-05, 3.784894943237305e-05, 4.3742358684539795e-05, 4.963576793670654e-05, 5.552917718887329e-05, 6.142258644104004e-05, 6.731599569320679e-05, 7.320940494537354e-05, 7.910281419754028e-05, 8.499622344970703e-05, 9.088963270187378e-05, 9.678304195404053e-05, 0.00010267645120620728, 0.00010856986045837402, 0.00011446326971054077, 0.00012035667896270752, 0.00012625008821487427, 0.00013214349746704102, 0.00013803690671920776, 0.0001439303159713745, 0.00014982372522354126, 0.000155717134475708, 0.00016161054372787476, 0.0001675039529800415, 0.00017339736223220825, 0.000179290771484375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 6.0, 2.0, 6.0, 12.0, 23.0, 22.0, 56.0, 106.0, 163.0, 279.0, 433.0, 652.0, 1065.0, 1722.0, 2587.0, 4244.0, 6571.0, 10547.0, 16649.0, 25985.0, 40262.0, 61635.0, 89246.0, 118773.0, 140730.0, 140322.0, 119912.0, 90169.0, 62463.0, 41254.0, 26645.0, 16994.0, 10636.0, 6738.0, 4293.0, 2675.0, 1661.0, 1157.0, 709.0, 446.0, 299.0, 170.0, 92.0, 65.0, 32.0, 25.0, 15.0, 12.0, 3.0, 3.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.69140625, -3.579620361328125, -3.46783447265625, -3.356048583984375, -3.2442626953125, -3.132476806640625, -3.02069091796875, -2.908905029296875, -2.797119140625, -2.685333251953125, -2.57354736328125, -2.461761474609375, -2.3499755859375, -2.238189697265625, -2.12640380859375, -2.014617919921875, -1.90283203125, -1.791046142578125, -1.67926025390625, -1.567474365234375, -1.4556884765625, -1.343902587890625, -1.23211669921875, -1.120330810546875, -1.008544921875, -0.896759033203125, -0.78497314453125, -0.673187255859375, -0.5614013671875, -0.449615478515625, -0.33782958984375, -0.226043701171875, -0.1142578125, -0.002471923828125, 0.10931396484375, 0.221099853515625, 0.3328857421875, 0.444671630859375, 0.55645751953125, 0.668243408203125, 0.780029296875, 0.891815185546875, 1.00360107421875, 1.115386962890625, 1.2271728515625, 1.338958740234375, 1.45074462890625, 1.562530517578125, 1.67431640625, 1.786102294921875, 1.89788818359375, 2.009674072265625, 2.1214599609375, 2.233245849609375, 2.34503173828125, 2.456817626953125, 2.568603515625, 2.680389404296875, 2.79217529296875, 2.903961181640625, 3.0157470703125, 3.127532958984375, 3.23931884765625, 3.351104736328125, 3.462890625]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 1.0, 5.0, 3.0, 6.0, 6.0, 8.0, 5.0, 9.0, 17.0, 11.0, 15.0, 16.0, 19.0, 23.0, 33.0, 45.0, 27.0, 33.0, 43.0, 54.0, 56.0, 51.0, 54.0, 57.0, 45.0, 43.0, 47.0, 36.0, 43.0, 39.0, 30.0, 20.0, 21.0, 15.0, 13.0, 6.0, 12.0, 9.0, 4.0, 7.0, 7.0, 3.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0], "bins": [-1.458984375, -1.418792724609375, -1.37860107421875, -1.338409423828125, -1.2982177734375, -1.258026123046875, -1.21783447265625, -1.177642822265625, -1.137451171875, -1.097259521484375, -1.05706787109375, -1.016876220703125, -0.9766845703125, -0.936492919921875, -0.89630126953125, -0.856109619140625, -0.81591796875, -0.775726318359375, -0.73553466796875, -0.695343017578125, -0.6551513671875, -0.614959716796875, -0.57476806640625, -0.534576416015625, -0.494384765625, -0.454193115234375, -0.41400146484375, -0.373809814453125, -0.3336181640625, -0.293426513671875, -0.25323486328125, -0.213043212890625, -0.1728515625, -0.132659912109375, -0.09246826171875, -0.052276611328125, -0.0120849609375, 0.028106689453125, 0.06829833984375, 0.108489990234375, 0.148681640625, 0.188873291015625, 0.22906494140625, 0.269256591796875, 0.3094482421875, 0.349639892578125, 0.38983154296875, 0.430023193359375, 0.47021484375, 0.510406494140625, 0.55059814453125, 0.590789794921875, 0.6309814453125, 0.671173095703125, 0.71136474609375, 0.751556396484375, 0.791748046875, 0.831939697265625, 0.87213134765625, 0.912322998046875, 0.9525146484375, 0.992706298828125, 1.03289794921875, 1.073089599609375, 1.11328125]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 8.0, 4.0, 5.0, 11.0, 12.0, 14.0, 18.0, 30.0, 22.0, 36.0, 35.0, 33.0, 29.0, 50.0, 55.0, 58.0, 62.0, 59.0, 53.0, 54.0, 59.0, 51.0, 43.0, 34.0, 33.0, 33.0, 20.0, 13.0, 16.0, 16.0, 7.0, 4.0, 7.0, 4.0, 4.0, 9.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.750786781311035, -13.245479583740234, -12.740172386169434, -12.234865188598633, -11.729557991027832, -11.224250793457031, -10.71894359588623, -10.21363639831543, -9.708329200744629, -9.203022003173828, -8.697714805603027, -8.192407608032227, -7.687100410461426, -7.181793212890625, -6.676486015319824, -6.171178817749023, -5.665871620178223, -5.160564422607422, -4.655257225036621, -4.14995002746582, -3.6446428298950195, -3.1393356323242188, -2.634028434753418, -2.128721237182617, -1.6234140396118164, -1.1181068420410156, -0.6127996444702148, -0.10749244689941406, 0.3978147506713867, 0.9031219482421875, 1.4084291458129883, 1.913736343383789, 2.4190425872802734, 2.924349784851074, 3.429656982421875, 3.934964179992676, 4.440271377563477, 4.945578575134277, 5.450885772705078, 5.956192970275879, 6.46150016784668, 6.9668073654174805, 7.472114562988281, 7.977421760559082, 8.482728958129883, 8.988036155700684, 9.493343353271484, 9.998650550842285, 10.503957748413086, 11.009264945983887, 11.514572143554688, 12.019879341125488, 12.525186538696289, 13.03049373626709, 13.53580093383789, 14.041108131408691, 14.546415328979492, 15.051722526550293, 15.557029724121094, 16.062335968017578, 16.567644119262695, 17.072952270507812, 17.578258514404297, 18.08356475830078, 18.5888729095459]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 2.0, 9.0, 8.0, 5.0, 11.0, 11.0, 14.0, 14.0, 11.0, 20.0, 29.0, 23.0, 10.0, 32.0, 22.0, 28.0, 27.0, 38.0, 48.0, 36.0, 41.0, 36.0, 43.0, 46.0, 55.0, 37.0, 34.0, 39.0, 31.0, 27.0, 28.0, 19.0, 26.0, 20.0, 16.0, 15.0, 18.0, 17.0, 16.0, 9.0, 9.0, 5.0, 5.0, 5.0, 4.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-9.926182746887207, -9.598474502563477, -9.270766258239746, -8.943058013916016, -8.615350723266602, -8.287642478942871, -7.959934234619141, -7.63222599029541, -7.30451774597168, -6.976809501647949, -6.649101257324219, -6.3213934898376465, -5.993685245513916, -5.6659770011901855, -5.338269233703613, -5.010560989379883, -4.682852745056152, -4.355144500732422, -4.027436256408691, -3.699728488922119, -3.3720202445983887, -3.044312000274658, -2.716603994369507, -2.3888959884643555, -2.061187744140625, -1.733479619026184, -1.4057714939117432, -1.0780633687973022, -0.7503552436828613, -0.4226471185684204, -0.09493899345397949, 0.23276901245117188, 0.5604763031005859, 0.8881844282150269, 1.2158925533294678, 1.5436006784439087, 1.8713088035583496, 2.19901704788208, 2.5267250537872314, 2.854433059692383, 3.1821413040161133, 3.5098495483398438, 3.837557554244995, 4.1652655601501465, 4.492973804473877, 4.820682048797607, 5.14838981628418, 5.47609806060791, 5.803806304931641, 6.131514549255371, 6.459222793579102, 6.786930561065674, 7.114638805389404, 7.442347049713135, 7.770054817199707, 8.097763061523438, 8.425471305847168, 8.753179550170898, 9.080887794494629, 9.40859603881836, 9.736303329467773, 10.064011573791504, 10.391719818115234, 10.719428062438965, 11.047136306762695]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 7.0, 14.0, 18.0, 30.0, 29.0, 71.0, 79.0, 160.0, 196.0, 335.0, 515.0, 841.0, 1335.0, 2134.0, 3247.0, 5078.0, 8372.0, 12753.0, 20128.0, 30665.0, 45608.0, 65379.0, 87569.0, 109460.0, 123851.0, 124605.0, 111309.0, 90329.0, 66950.0, 47287.0, 31963.0, 21072.0, 13442.0, 8694.0, 5594.0, 3495.0, 2142.0, 1421.0, 868.0, 522.0, 382.0, 227.0, 139.0, 85.0, 54.0, 30.0, 27.0, 13.0, 17.0, 8.0, 5.0, 2.0, 1.0, 2.0, 2.0, 2.0], "bins": [-7.6015625, -7.37158203125, -7.1416015625, -6.91162109375, -6.681640625, -6.45166015625, -6.2216796875, -5.99169921875, -5.76171875, -5.53173828125, -5.3017578125, -5.07177734375, -4.841796875, -4.61181640625, -4.3818359375, -4.15185546875, -3.921875, -3.69189453125, -3.4619140625, -3.23193359375, -3.001953125, -2.77197265625, -2.5419921875, -2.31201171875, -2.08203125, -1.85205078125, -1.6220703125, -1.39208984375, -1.162109375, -0.93212890625, -0.7021484375, -0.47216796875, -0.2421875, -0.01220703125, 0.2177734375, 0.44775390625, 0.677734375, 0.90771484375, 1.1376953125, 1.36767578125, 1.59765625, 1.82763671875, 2.0576171875, 2.28759765625, 2.517578125, 2.74755859375, 2.9775390625, 3.20751953125, 3.4375, 3.66748046875, 3.8974609375, 4.12744140625, 4.357421875, 4.58740234375, 4.8173828125, 5.04736328125, 5.27734375, 5.50732421875, 5.7373046875, 5.96728515625, 6.197265625, 6.42724609375, 6.6572265625, 6.88720703125, 7.1171875]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 4.0, 2.0, 4.0, 2.0, 5.0, 11.0, 7.0, 7.0, 11.0, 6.0, 7.0, 17.0, 24.0, 14.0, 20.0, 26.0, 26.0, 22.0, 38.0, 36.0, 35.0, 35.0, 33.0, 42.0, 55.0, 36.0, 49.0, 46.0, 31.0, 33.0, 41.0, 35.0, 29.0, 31.0, 22.0, 17.0, 20.0, 13.0, 22.0, 20.0, 8.0, 22.0, 9.0, 10.0, 9.0, 4.0, 3.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.4765625, -10.1246337890625, -9.772705078125, -9.4207763671875, -9.06884765625, -8.7169189453125, -8.364990234375, -8.0130615234375, -7.6611328125, -7.3092041015625, -6.957275390625, -6.6053466796875, -6.25341796875, -5.9014892578125, -5.549560546875, -5.1976318359375, -4.845703125, -4.4937744140625, -4.141845703125, -3.7899169921875, -3.43798828125, -3.0860595703125, -2.734130859375, -2.3822021484375, -2.0302734375, -1.6783447265625, -1.326416015625, -0.9744873046875, -0.62255859375, -0.2706298828125, 0.081298828125, 0.4332275390625, 0.78515625, 1.1370849609375, 1.489013671875, 1.8409423828125, 2.19287109375, 2.5447998046875, 2.896728515625, 3.2486572265625, 3.6005859375, 3.9525146484375, 4.304443359375, 4.6563720703125, 5.00830078125, 5.3602294921875, 5.712158203125, 6.0640869140625, 6.416015625, 6.7679443359375, 7.119873046875, 7.4718017578125, 7.82373046875, 8.1756591796875, 8.527587890625, 8.8795166015625, 9.2314453125, 9.5833740234375, 9.935302734375, 10.2872314453125, 10.63916015625, 10.9910888671875, 11.343017578125, 11.6949462890625, 12.046875]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 3.0, 6.0, 0.0, 5.0, 8.0, 19.0, 21.0, 17.0, 40.0, 67.0, 93.0, 125.0, 185.0, 345.0, 439.0, 665.0, 1026.0, 1632.0, 2428.0, 3819.0, 5984.0, 9487.0, 15211.0, 23844.0, 36730.0, 55594.0, 79212.0, 104322.0, 124122.0, 131603.0, 123059.0, 101691.0, 76072.0, 53295.0, 35431.0, 22485.0, 14357.0, 9014.0, 5656.0, 3635.0, 2325.0, 1572.0, 992.0, 653.0, 410.0, 279.0, 178.0, 115.0, 95.0, 77.0, 46.0, 22.0, 25.0, 5.0, 15.0, 8.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-7.76171875, -7.50677490234375, -7.2518310546875, -6.99688720703125, -6.741943359375, -6.48699951171875, -6.2320556640625, -5.97711181640625, -5.72216796875, -5.46722412109375, -5.2122802734375, -4.95733642578125, -4.702392578125, -4.44744873046875, -4.1925048828125, -3.93756103515625, -3.6826171875, -3.42767333984375, -3.1727294921875, -2.91778564453125, -2.662841796875, -2.40789794921875, -2.1529541015625, -1.89801025390625, -1.64306640625, -1.38812255859375, -1.1331787109375, -0.87823486328125, -0.623291015625, -0.36834716796875, -0.1134033203125, 0.14154052734375, 0.396484375, 0.65142822265625, 0.9063720703125, 1.16131591796875, 1.416259765625, 1.67120361328125, 1.9261474609375, 2.18109130859375, 2.43603515625, 2.69097900390625, 2.9459228515625, 3.20086669921875, 3.455810546875, 3.71075439453125, 3.9656982421875, 4.22064208984375, 4.4755859375, 4.73052978515625, 4.9854736328125, 5.24041748046875, 5.495361328125, 5.75030517578125, 6.0052490234375, 6.26019287109375, 6.51513671875, 6.77008056640625, 7.0250244140625, 7.27996826171875, 7.534912109375, 7.78985595703125, 8.0447998046875, 8.29974365234375, 8.5546875]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 0.0, 3.0, 2.0, 7.0, 6.0, 4.0, 8.0, 8.0, 9.0, 8.0, 17.0, 10.0, 14.0, 18.0, 27.0, 35.0, 22.0, 28.0, 31.0, 35.0, 34.0, 36.0, 33.0, 41.0, 29.0, 45.0, 43.0, 47.0, 35.0, 48.0, 32.0, 31.0, 34.0, 21.0, 32.0, 28.0, 27.0, 17.0, 22.0, 16.0, 8.0, 9.0, 5.0, 7.0, 10.0, 5.0, 7.0, 1.0, 9.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.6953125, -6.47113037109375, -6.2469482421875, -6.02276611328125, -5.798583984375, -5.57440185546875, -5.3502197265625, -5.12603759765625, -4.90185546875, -4.67767333984375, -4.4534912109375, -4.22930908203125, -4.005126953125, -3.78094482421875, -3.5567626953125, -3.33258056640625, -3.1083984375, -2.88421630859375, -2.6600341796875, -2.43585205078125, -2.211669921875, -1.98748779296875, -1.7633056640625, -1.53912353515625, -1.31494140625, -1.09075927734375, -0.8665771484375, -0.64239501953125, -0.418212890625, -0.19403076171875, 0.0301513671875, 0.25433349609375, 0.478515625, 0.70269775390625, 0.9268798828125, 1.15106201171875, 1.375244140625, 1.59942626953125, 1.8236083984375, 2.04779052734375, 2.27197265625, 2.49615478515625, 2.7203369140625, 2.94451904296875, 3.168701171875, 3.39288330078125, 3.6170654296875, 3.84124755859375, 4.0654296875, 4.28961181640625, 4.5137939453125, 4.73797607421875, 4.962158203125, 5.18634033203125, 5.4105224609375, 5.63470458984375, 5.85888671875, 6.08306884765625, 6.3072509765625, 6.53143310546875, 6.755615234375, 6.97979736328125, 7.2039794921875, 7.42816162109375, 7.65234375]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 13.0, 19.0, 16.0, 27.0, 50.0, 50.0, 98.0, 148.0, 204.0, 279.0, 464.0, 695.0, 1141.0, 1926.0, 3066.0, 5182.0, 8403.0, 13677.0, 22276.0, 36146.0, 55638.0, 81327.0, 110863.0, 133339.0, 140396.0, 127781.0, 101678.0, 73655.0, 48776.0, 31377.0, 19456.0, 11686.0, 7189.0, 4329.0, 2666.0, 1567.0, 1023.0, 684.0, 437.0, 270.0, 190.0, 105.0, 79.0, 56.0, 29.0, 30.0, 13.0, 15.0, 5.0, 10.0, 3.0, 5.0, 2.0, 1.0], "bins": [-4.3125, -4.18695068359375, -4.0614013671875, -3.93585205078125, -3.810302734375, -3.68475341796875, -3.5592041015625, -3.43365478515625, -3.30810546875, -3.18255615234375, -3.0570068359375, -2.93145751953125, -2.805908203125, -2.68035888671875, -2.5548095703125, -2.42926025390625, -2.3037109375, -2.17816162109375, -2.0526123046875, -1.92706298828125, -1.801513671875, -1.67596435546875, -1.5504150390625, -1.42486572265625, -1.29931640625, -1.17376708984375, -1.0482177734375, -0.92266845703125, -0.797119140625, -0.67156982421875, -0.5460205078125, -0.42047119140625, -0.294921875, -0.16937255859375, -0.0438232421875, 0.08172607421875, 0.207275390625, 0.33282470703125, 0.4583740234375, 0.58392333984375, 0.70947265625, 0.83502197265625, 0.9605712890625, 1.08612060546875, 1.211669921875, 1.33721923828125, 1.4627685546875, 1.58831787109375, 1.7138671875, 1.83941650390625, 1.9649658203125, 2.09051513671875, 2.216064453125, 2.34161376953125, 2.4671630859375, 2.59271240234375, 2.71826171875, 2.84381103515625, 2.9693603515625, 3.09490966796875, 3.220458984375, 3.34600830078125, 3.4715576171875, 3.59710693359375, 3.72265625]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 3.0, 6.0, 5.0, 5.0, 5.0, 9.0, 9.0, 10.0, 10.0, 16.0, 22.0, 23.0, 25.0, 33.0, 34.0, 32.0, 42.0, 36.0, 50.0, 75.0, 47.0, 39.0, 37.0, 54.0, 52.0, 43.0, 42.0, 29.0, 17.0, 28.0, 30.0, 19.0, 26.0, 11.0, 13.0, 16.0, 12.0, 4.0, 5.0, 11.0, 2.0, 4.0, 3.0, 1.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0003695487976074219, -0.0003574453294277191, -0.00034534186124801636, -0.0003332383930683136, -0.00032113492488861084, -0.0003090314567089081, -0.0002969279885292053, -0.00028482452034950256, -0.0002727210521697998, -0.00026061758399009705, -0.0002485141158103943, -0.00023641064763069153, -0.00022430717945098877, -0.000212203711271286, -0.00020010024309158325, -0.0001879967749118805, -0.00017589330673217773, -0.00016378983855247498, -0.00015168637037277222, -0.00013958290219306946, -0.0001274794340133667, -0.00011537596583366394, -0.00010327249765396118, -9.116902947425842e-05, -7.906556129455566e-05, -6.69620931148529e-05, -5.4858624935150146e-05, -4.275515675544739e-05, -3.065168857574463e-05, -1.854822039604187e-05, -6.444752216339111e-06, 5.6587159633636475e-06, 1.7762184143066406e-05, 2.9865652322769165e-05, 4.1969120502471924e-05, 5.407258868217468e-05, 6.617605686187744e-05, 7.82795250415802e-05, 9.038299322128296e-05, 0.00010248646140098572, 0.00011458992958068848, 0.00012669339776039124, 0.000138796865940094, 0.00015090033411979675, 0.0001630038022994995, 0.00017510727047920227, 0.00018721073865890503, 0.0001993142068386078, 0.00021141767501831055, 0.0002235211431980133, 0.00023562461137771606, 0.0002477280795574188, 0.0002598315477371216, 0.00027193501591682434, 0.0002840384840965271, 0.00029614195227622986, 0.0003082454204559326, 0.0003203488886356354, 0.00033245235681533813, 0.0003445558249950409, 0.00035665929317474365, 0.0003687627613544464, 0.00038086622953414917, 0.00039296969771385193, 0.0004050731658935547]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 6.0, 16.0, 14.0, 19.0, 31.0, 40.0, 65.0, 116.0, 162.0, 285.0, 486.0, 888.0, 1601.0, 3271.0, 6011.0, 12230.0, 23540.0, 45461.0, 82261.0, 133540.0, 182031.0, 189725.0, 152432.0, 98138.0, 55738.0, 29322.0, 14934.0, 7601.0, 3945.0, 2024.0, 1107.0, 628.0, 349.0, 201.0, 115.0, 72.0, 47.0, 38.0, 20.0, 23.0, 5.0, 6.0, 7.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.70703125, -5.52960205078125, -5.3521728515625, -5.17474365234375, -4.997314453125, -4.81988525390625, -4.6424560546875, -4.46502685546875, -4.28759765625, -4.11016845703125, -3.9327392578125, -3.75531005859375, -3.577880859375, -3.40045166015625, -3.2230224609375, -3.04559326171875, -2.8681640625, -2.69073486328125, -2.5133056640625, -2.33587646484375, -2.158447265625, -1.98101806640625, -1.8035888671875, -1.62615966796875, -1.44873046875, -1.27130126953125, -1.0938720703125, -0.91644287109375, -0.739013671875, -0.56158447265625, -0.3841552734375, -0.20672607421875, -0.029296875, 0.14813232421875, 0.3255615234375, 0.50299072265625, 0.680419921875, 0.85784912109375, 1.0352783203125, 1.21270751953125, 1.39013671875, 1.56756591796875, 1.7449951171875, 1.92242431640625, 2.099853515625, 2.27728271484375, 2.4547119140625, 2.63214111328125, 2.8095703125, 2.98699951171875, 3.1644287109375, 3.34185791015625, 3.519287109375, 3.69671630859375, 3.8741455078125, 4.05157470703125, 4.22900390625, 4.40643310546875, 4.5838623046875, 4.76129150390625, 4.938720703125, 5.11614990234375, 5.2935791015625, 5.47100830078125, 5.6484375]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 4.0, 1.0, 6.0, 3.0, 4.0, 8.0, 8.0, 14.0, 13.0, 14.0, 22.0, 34.0, 27.0, 30.0, 41.0, 40.0, 56.0, 59.0, 57.0, 59.0, 64.0, 47.0, 58.0, 52.0, 61.0, 34.0, 32.0, 36.0, 17.0, 22.0, 14.0, 13.0, 18.0, 7.0, 8.0, 8.0, 1.0, 4.0, 3.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2099609375, -1.1640625, -1.1181640625, -1.072265625, -1.0263671875, -0.98046875, -0.9345703125, -0.888671875, -0.8427734375, -0.796875, -0.7509765625, -0.705078125, -0.6591796875, -0.61328125, -0.5673828125, -0.521484375, -0.4755859375, -0.4296875, -0.3837890625, -0.337890625, -0.2919921875, -0.24609375, -0.2001953125, -0.154296875, -0.1083984375, -0.0625, -0.0166015625, 0.029296875, 0.0751953125, 0.12109375, 0.1669921875, 0.212890625, 0.2587890625, 0.3046875, 0.3505859375, 0.396484375, 0.4423828125, 0.48828125, 0.5341796875, 0.580078125, 0.6259765625, 0.671875, 0.7177734375, 0.763671875, 0.8095703125, 0.85546875, 0.9013671875, 0.947265625, 0.9931640625, 1.0390625, 1.0849609375, 1.130859375, 1.1767578125, 1.22265625, 1.2685546875, 1.314453125, 1.3603515625, 1.40625, 1.4521484375, 1.498046875, 1.5439453125, 1.58984375, 1.6357421875, 1.681640625, 1.7275390625]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 5.0, 5.0, 11.0, 9.0, 10.0, 11.0, 10.0, 13.0, 14.0, 22.0, 32.0, 35.0, 28.0, 29.0, 37.0, 40.0, 39.0, 41.0, 49.0, 54.0, 48.0, 51.0, 58.0, 41.0, 43.0, 47.0, 31.0, 32.0, 30.0, 14.0, 19.0, 19.0, 12.0, 21.0, 6.0, 4.0, 10.0, 5.0, 5.0, 4.0, 3.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.616525650024414, -12.1820068359375, -11.747488021850586, -11.312968254089355, -10.878449440002441, -10.443930625915527, -10.009410858154297, -9.574892044067383, -9.140373229980469, -8.705854415893555, -8.27133560180664, -7.83681583404541, -7.402297019958496, -6.967778205871582, -6.53325891494751, -6.0987396240234375, -5.664220809936523, -5.229701995849609, -4.795182704925537, -4.360663414001465, -3.926144599914551, -3.4916255474090576, -3.0571064949035645, -2.6225874423980713, -2.188068389892578, -1.753549337387085, -1.3190302848815918, -0.8845112323760986, -0.44999217987060547, -0.015473127365112305, 0.41904592514038086, 0.853564977645874, 1.2880840301513672, 1.7226030826568604, 2.1571221351623535, 2.5916411876678467, 3.02616024017334, 3.460679292678833, 3.895198345184326, 4.329717636108398, 4.7642364501953125, 5.198755264282227, 5.633274555206299, 6.067793846130371, 6.502312660217285, 6.936831474304199, 7.3713507652282715, 7.805870056152344, 8.240388870239258, 8.674907684326172, 9.109426498413086, 9.543946266174316, 9.97846508026123, 10.412983894348145, 10.847503662109375, 11.282022476196289, 11.716541290283203, 12.151060104370117, 12.585578918457031, 13.020098686218262, 13.454617500305176, 13.88913631439209, 14.32365608215332, 14.758174896240234, 15.192693710327148]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 2.0, 6.0, 5.0, 8.0, 10.0, 11.0, 14.0, 16.0, 18.0, 28.0, 11.0, 26.0, 23.0, 26.0, 31.0, 34.0, 42.0, 37.0, 44.0, 48.0, 33.0, 41.0, 59.0, 37.0, 48.0, 37.0, 36.0, 38.0, 24.0, 34.0, 26.0, 30.0, 13.0, 14.0, 26.0, 17.0, 9.0, 13.0, 3.0, 7.0, 8.0, 6.0, 2.0, 0.0, 5.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-12.88176155090332, -12.493916511535645, -12.106071472167969, -11.718225479125977, -11.3303804397583, -10.942535400390625, -10.55469036102295, -10.166845321655273, -9.778999328613281, -9.391154289245605, -9.00330924987793, -8.615463256835938, -8.227618217468262, -7.839773178100586, -7.45192813873291, -7.064083099365234, -6.676238059997559, -6.288393020629883, -5.900547504425049, -5.512702465057373, -5.124856948852539, -4.737011909484863, -4.3491668701171875, -3.9613215923309326, -3.5734763145446777, -3.185631036758423, -2.797785758972168, -2.409940719604492, -2.0220954418182373, -1.6342501640319824, -1.2464051246643066, -0.8585598468780518, -0.4707155227661133, -0.08287030458450317, 0.30497491359710693, 0.6928200721740723, 1.0806653499603271, 1.468510627746582, 1.8563556671142578, 2.2442009449005127, 2.6320462226867676, 3.0198915004730225, 3.4077367782592773, 3.795581817626953, 4.183426856994629, 4.571272373199463, 4.959117412567139, 5.346962928771973, 5.734807968139648, 6.122653007507324, 6.510498523712158, 6.898343563079834, 7.286189079284668, 7.674034118652344, 8.06187915802002, 8.449724197387695, 8.837570190429688, 9.225415229797363, 9.613260269165039, 10.001106262207031, 10.388951301574707, 10.776796340942383, 11.164641380310059, 11.552486419677734, 11.94033145904541]}, "gradients/decoder.bert.encoder.layer.2.output.dense.weight": {"_type": "histogram", "values": [4.0, 4.0, 5.0, 9.0, 7.0, 5.0, 4.0, 13.0, 22.0, 31.0, 69.0, 91.0, 137.0, 210.0, 371.0, 560.0, 908.0, 1653.0, 2768.0, 4975.0, 9501.0, 17683.0, 35113.0, 70745.0, 143372.0, 288723.0, 543133.0, 838155.0, 889380.0, 636194.0, 353085.0, 179407.0, 88110.0, 42995.0, 21870.0, 11278.0, 5860.0, 3302.0, 1760.0, 1043.0, 598.0, 420.0, 239.0, 142.0, 102.0, 74.0, 46.0, 40.0, 27.0, 17.0, 13.0, 4.0, 8.0, 6.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-14.953125, -14.421875, -13.890625, -13.359375, -12.828125, -12.296875, -11.765625, -11.234375, -10.703125, -10.171875, -9.640625, -9.109375, -8.578125, -8.046875, -7.515625, -6.984375, -6.453125, -5.921875, -5.390625, -4.859375, -4.328125, -3.796875, -3.265625, -2.734375, -2.203125, -1.671875, -1.140625, -0.609375, -0.078125, 0.453125, 0.984375, 1.515625, 2.046875, 2.578125, 3.109375, 3.640625, 4.171875, 4.703125, 5.234375, 5.765625, 6.296875, 6.828125, 7.359375, 7.890625, 8.421875, 8.953125, 9.484375, 10.015625, 10.546875, 11.078125, 11.609375, 12.140625, 12.671875, 13.203125, 13.734375, 14.265625, 14.796875, 15.328125, 15.859375, 16.390625, 16.921875, 17.453125, 17.984375, 18.515625, 19.046875]}, "gradients/decoder.bert.encoder.layer.2.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 4.0, 7.0, 5.0, 4.0, 5.0, 17.0, 10.0, 12.0, 19.0, 15.0, 21.0, 26.0, 25.0, 23.0, 29.0, 35.0, 33.0, 42.0, 41.0, 43.0, 46.0, 38.0, 49.0, 42.0, 43.0, 51.0, 29.0, 43.0, 36.0, 26.0, 31.0, 22.0, 25.0, 21.0, 12.0, 15.0, 14.0, 7.0, 13.0, 0.0, 6.0, 5.0, 11.0, 2.0, 1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.0625, -9.74609375, -9.4296875, -9.11328125, -8.796875, -8.48046875, -8.1640625, -7.84765625, -7.53125, -7.21484375, -6.8984375, -6.58203125, -6.265625, -5.94921875, -5.6328125, -5.31640625, -5.0, -4.68359375, -4.3671875, -4.05078125, -3.734375, -3.41796875, -3.1015625, -2.78515625, -2.46875, -2.15234375, -1.8359375, -1.51953125, -1.203125, -0.88671875, -0.5703125, -0.25390625, 0.0625, 0.37890625, 0.6953125, 1.01171875, 1.328125, 1.64453125, 1.9609375, 2.27734375, 2.59375, 2.91015625, 3.2265625, 3.54296875, 3.859375, 4.17578125, 4.4921875, 4.80859375, 5.125, 5.44140625, 5.7578125, 6.07421875, 6.390625, 6.70703125, 7.0234375, 7.33984375, 7.65625, 7.97265625, 8.2890625, 8.60546875, 8.921875, 9.23828125, 9.5546875, 9.87109375, 10.1875]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 4.0, 1.0, 8.0, 14.0, 24.0, 27.0, 50.0, 72.0, 99.0, 217.0, 272.0, 482.0, 757.0, 1285.0, 2117.0, 3589.0, 6575.0, 11503.0, 21202.0, 39733.0, 74219.0, 135460.0, 242642.0, 403165.0, 595891.0, 723040.0, 682791.0, 509697.0, 325403.0, 187600.0, 103315.0, 55900.0, 29880.0, 16080.0, 9005.0, 5096.0, 2857.0, 1619.0, 952.0, 670.0, 358.0, 221.0, 147.0, 94.0, 59.0, 36.0, 23.0, 13.0, 11.0, 6.0, 5.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-15.890625, -15.35693359375, -14.8232421875, -14.28955078125, -13.755859375, -13.22216796875, -12.6884765625, -12.15478515625, -11.62109375, -11.08740234375, -10.5537109375, -10.02001953125, -9.486328125, -8.95263671875, -8.4189453125, -7.88525390625, -7.3515625, -6.81787109375, -6.2841796875, -5.75048828125, -5.216796875, -4.68310546875, -4.1494140625, -3.61572265625, -3.08203125, -2.54833984375, -2.0146484375, -1.48095703125, -0.947265625, -0.41357421875, 0.1201171875, 0.65380859375, 1.1875, 1.72119140625, 2.2548828125, 2.78857421875, 3.322265625, 3.85595703125, 4.3896484375, 4.92333984375, 5.45703125, 5.99072265625, 6.5244140625, 7.05810546875, 7.591796875, 8.12548828125, 8.6591796875, 9.19287109375, 9.7265625, 10.26025390625, 10.7939453125, 11.32763671875, 11.861328125, 12.39501953125, 12.9287109375, 13.46240234375, 13.99609375, 14.52978515625, 15.0634765625, 15.59716796875, 16.130859375, 16.66455078125, 17.1982421875, 17.73193359375, 18.265625]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 4.0, 2.0, 3.0, 6.0, 4.0, 7.0, 7.0, 11.0, 24.0, 14.0, 36.0, 23.0, 35.0, 47.0, 64.0, 70.0, 80.0, 109.0, 137.0, 156.0, 167.0, 183.0, 237.0, 218.0, 240.0, 244.0, 225.0, 238.0, 209.0, 203.0, 173.0, 157.0, 122.0, 121.0, 119.0, 76.0, 63.0, 53.0, 51.0, 33.0, 31.0, 23.0, 13.0, 13.0, 8.0, 4.0, 8.0, 3.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0], "bins": [-6.18359375, -6.009765625, -5.8359375, -5.662109375, -5.48828125, -5.314453125, -5.140625, -4.966796875, -4.79296875, -4.619140625, -4.4453125, -4.271484375, -4.09765625, -3.923828125, -3.75, -3.576171875, -3.40234375, -3.228515625, -3.0546875, -2.880859375, -2.70703125, -2.533203125, -2.359375, -2.185546875, -2.01171875, -1.837890625, -1.6640625, -1.490234375, -1.31640625, -1.142578125, -0.96875, -0.794921875, -0.62109375, -0.447265625, -0.2734375, -0.099609375, 0.07421875, 0.248046875, 0.421875, 0.595703125, 0.76953125, 0.943359375, 1.1171875, 1.291015625, 1.46484375, 1.638671875, 1.8125, 1.986328125, 2.16015625, 2.333984375, 2.5078125, 2.681640625, 2.85546875, 3.029296875, 3.203125, 3.376953125, 3.55078125, 3.724609375, 3.8984375, 4.072265625, 4.24609375, 4.419921875, 4.59375, 4.767578125, 4.94140625]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 9.0, 10.0, 10.0, 14.0, 21.0, 24.0, 26.0, 33.0, 26.0, 45.0, 36.0, 47.0, 49.0, 72.0, 73.0, 52.0, 64.0, 71.0, 47.0, 58.0, 32.0, 32.0, 32.0, 30.0, 23.0, 15.0, 12.0, 16.0, 14.0, 6.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.393949508666992, -18.704517364501953, -18.015085220336914, -17.325653076171875, -16.636220932006836, -15.946788787841797, -15.257355690002441, -14.567923545837402, -13.878491401672363, -13.189059257507324, -12.499627113342285, -11.81019401550293, -11.12076187133789, -10.431329727172852, -9.741897583007812, -9.052465438842773, -8.363033294677734, -7.673601150512695, -6.984169006347656, -6.294736385345459, -5.60530424118042, -4.915872097015381, -4.226439476013184, -3.5370073318481445, -2.8475751876831055, -2.1581430435180664, -1.4687106609344482, -0.7792782783508301, -0.08984613418579102, 0.599586009979248, 1.2890186309814453, 1.9784507751464844, 2.6678829193115234, 3.3573150634765625, 4.046747207641602, 4.736179828643799, 5.425611972808838, 6.115044116973877, 6.804476737976074, 7.493908882141113, 8.183341026306152, 8.872773170471191, 9.56220531463623, 10.251638412475586, 10.941070556640625, 11.630502700805664, 12.319934844970703, 13.009366989135742, 13.698799133300781, 14.38823127746582, 15.07766342163086, 15.767095565795898, 16.456527709960938, 17.145959854125977, 17.835391998291016, 18.524826049804688, 19.214256286621094, 19.903688430786133, 20.593120574951172, 21.28255271911621, 21.97198486328125, 22.66141700744629, 23.350849151611328, 24.040283203125, 24.72971534729004]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 6.0, 0.0, 4.0, 2.0, 9.0, 9.0, 10.0, 13.0, 21.0, 18.0, 16.0, 27.0, 29.0, 32.0, 30.0, 38.0, 30.0, 34.0, 42.0, 41.0, 48.0, 42.0, 50.0, 42.0, 58.0, 44.0, 35.0, 31.0, 35.0, 25.0, 29.0, 30.0, 15.0, 26.0, 15.0, 16.0, 7.0, 13.0, 14.0, 6.0, 5.0, 4.0, 6.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-14.413304328918457, -13.99051284790039, -13.567721366882324, -13.144929885864258, -12.722137451171875, -12.299345970153809, -11.876554489135742, -11.453763008117676, -11.03097152709961, -10.608180046081543, -10.185388565063477, -9.762596130371094, -9.339804649353027, -8.917013168334961, -8.494221687316895, -8.071430206298828, -7.648637771606445, -7.225846290588379, -6.803054332733154, -6.380262851715088, -5.957470893859863, -5.534679412841797, -5.1118879318237305, -4.689096450805664, -4.2663044929504395, -3.843512773513794, -3.4207210540771484, -2.997929573059082, -2.5751378536224365, -2.152346134185791, -1.7295546531677246, -1.306762933731079, -0.8839702606201172, -0.46117860078811646, -0.03838694095611572, 0.38440465927124023, 0.8071963787078857, 1.2299880981445312, 1.6527795791625977, 2.075571298599243, 2.4983630180358887, 2.921154737472534, 3.3439464569091797, 3.766737937927246, 4.1895294189453125, 4.612321376800537, 5.0351128578186035, 5.457904815673828, 5.8806962966918945, 6.303487777709961, 6.7262797355651855, 7.149071216583252, 7.571863174438477, 7.994654655456543, 8.41744613647461, 8.840237617492676, 9.263029098510742, 9.685820579528809, 10.108612060546875, 10.531404495239258, 10.954195976257324, 11.37698745727539, 11.799778938293457, 12.222570419311523, 12.645362854003906]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.weight": {"_type": "histogram", "values": [4.0, 2.0, 5.0, 8.0, 7.0, 12.0, 28.0, 42.0, 55.0, 71.0, 101.0, 154.0, 228.0, 323.0, 536.0, 758.0, 1074.0, 1682.0, 2405.0, 3744.0, 5804.0, 8694.0, 13652.0, 21008.0, 32204.0, 48192.0, 70765.0, 97883.0, 122745.0, 135973.0, 129946.0, 106802.0, 79903.0, 56031.0, 37504.0, 24436.0, 15662.0, 10224.0, 6756.0, 4437.0, 2831.0, 1899.0, 1330.0, 870.0, 585.0, 411.0, 278.0, 155.0, 111.0, 77.0, 50.0, 37.0, 28.0, 12.0, 15.0, 6.0, 4.0, 5.0, 3.0, 3.0, 0.0, 3.0, 2.0, 1.0], "bins": [-6.44140625, -6.224365234375, -6.00732421875, -5.790283203125, -5.5732421875, -5.356201171875, -5.13916015625, -4.922119140625, -4.705078125, -4.488037109375, -4.27099609375, -4.053955078125, -3.8369140625, -3.619873046875, -3.40283203125, -3.185791015625, -2.96875, -2.751708984375, -2.53466796875, -2.317626953125, -2.1005859375, -1.883544921875, -1.66650390625, -1.449462890625, -1.232421875, -1.015380859375, -0.79833984375, -0.581298828125, -0.3642578125, -0.147216796875, 0.06982421875, 0.286865234375, 0.50390625, 0.720947265625, 0.93798828125, 1.155029296875, 1.3720703125, 1.589111328125, 1.80615234375, 2.023193359375, 2.240234375, 2.457275390625, 2.67431640625, 2.891357421875, 3.1083984375, 3.325439453125, 3.54248046875, 3.759521484375, 3.9765625, 4.193603515625, 4.41064453125, 4.627685546875, 4.8447265625, 5.061767578125, 5.27880859375, 5.495849609375, 5.712890625, 5.929931640625, 6.14697265625, 6.364013671875, 6.5810546875, 6.798095703125, 7.01513671875, 7.232177734375, 7.44921875]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 9.0, 6.0, 16.0, 13.0, 15.0, 19.0, 14.0, 23.0, 29.0, 27.0, 28.0, 29.0, 37.0, 41.0, 31.0, 55.0, 29.0, 41.0, 54.0, 45.0, 45.0, 39.0, 39.0, 35.0, 36.0, 32.0, 27.0, 28.0, 24.0, 37.0, 24.0, 13.0, 7.0, 10.0, 13.0, 9.0, 6.0, 6.0, 4.0, 6.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-14.1328125, -13.6868896484375, -13.240966796875, -12.7950439453125, -12.34912109375, -11.9031982421875, -11.457275390625, -11.0113525390625, -10.5654296875, -10.1195068359375, -9.673583984375, -9.2276611328125, -8.78173828125, -8.3358154296875, -7.889892578125, -7.4439697265625, -6.998046875, -6.5521240234375, -6.106201171875, -5.6602783203125, -5.21435546875, -4.7684326171875, -4.322509765625, -3.8765869140625, -3.4306640625, -2.9847412109375, -2.538818359375, -2.0928955078125, -1.64697265625, -1.2010498046875, -0.755126953125, -0.3092041015625, 0.13671875, 0.5826416015625, 1.028564453125, 1.4744873046875, 1.92041015625, 2.3663330078125, 2.812255859375, 3.2581787109375, 3.7041015625, 4.1500244140625, 4.595947265625, 5.0418701171875, 5.48779296875, 5.9337158203125, 6.379638671875, 6.8255615234375, 7.271484375, 7.7174072265625, 8.163330078125, 8.6092529296875, 9.05517578125, 9.5010986328125, 9.947021484375, 10.3929443359375, 10.8388671875, 11.2847900390625, 11.730712890625, 12.1766357421875, 12.62255859375, 13.0684814453125, 13.514404296875, 13.9603271484375, 14.40625]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 2.0, 10.0, 10.0, 20.0, 16.0, 30.0, 40.0, 56.0, 72.0, 100.0, 168.0, 227.0, 311.0, 507.0, 776.0, 1285.0, 2228.0, 3947.0, 7345.0, 14991.0, 33546.0, 79150.0, 186002.0, 315896.0, 224339.0, 97957.0, 41260.0, 18364.0, 8780.0, 4618.0, 2494.0, 1393.0, 898.0, 550.0, 363.0, 250.0, 140.0, 112.0, 94.0, 63.0, 45.0, 38.0, 17.0, 14.0, 11.0, 5.0, 4.0, 3.0, 5.0, 3.0, 1.0, 1.0, 3.0, 1.0], "bins": [-18.125, -17.5859375, -17.046875, -16.5078125, -15.96875, -15.4296875, -14.890625, -14.3515625, -13.8125, -13.2734375, -12.734375, -12.1953125, -11.65625, -11.1171875, -10.578125, -10.0390625, -9.5, -8.9609375, -8.421875, -7.8828125, -7.34375, -6.8046875, -6.265625, -5.7265625, -5.1875, -4.6484375, -4.109375, -3.5703125, -3.03125, -2.4921875, -1.953125, -1.4140625, -0.875, -0.3359375, 0.203125, 0.7421875, 1.28125, 1.8203125, 2.359375, 2.8984375, 3.4375, 3.9765625, 4.515625, 5.0546875, 5.59375, 6.1328125, 6.671875, 7.2109375, 7.75, 8.2890625, 8.828125, 9.3671875, 9.90625, 10.4453125, 10.984375, 11.5234375, 12.0625, 12.6015625, 13.140625, 13.6796875, 14.21875, 14.7578125, 15.296875, 15.8359375, 16.375]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 6.0, 5.0, 1.0, 13.0, 4.0, 6.0, 11.0, 21.0, 20.0, 16.0, 22.0, 16.0, 30.0, 41.0, 39.0, 36.0, 49.0, 40.0, 35.0, 47.0, 57.0, 57.0, 48.0, 39.0, 51.0, 36.0, 42.0, 26.0, 31.0, 18.0, 13.0, 25.0, 28.0, 17.0, 11.0, 10.0, 10.0, 2.0, 5.0, 12.0, 2.0, 4.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.8125, -8.5382080078125, -8.263916015625, -7.9896240234375, -7.71533203125, -7.4410400390625, -7.166748046875, -6.8924560546875, -6.6181640625, -6.3438720703125, -6.069580078125, -5.7952880859375, -5.52099609375, -5.2467041015625, -4.972412109375, -4.6981201171875, -4.423828125, -4.1495361328125, -3.875244140625, -3.6009521484375, -3.32666015625, -3.0523681640625, -2.778076171875, -2.5037841796875, -2.2294921875, -1.9552001953125, -1.680908203125, -1.4066162109375, -1.13232421875, -0.8580322265625, -0.583740234375, -0.3094482421875, -0.03515625, 0.2391357421875, 0.513427734375, 0.7877197265625, 1.06201171875, 1.3363037109375, 1.610595703125, 1.8848876953125, 2.1591796875, 2.4334716796875, 2.707763671875, 2.9820556640625, 3.25634765625, 3.5306396484375, 3.804931640625, 4.0792236328125, 4.353515625, 4.6278076171875, 4.902099609375, 5.1763916015625, 5.45068359375, 5.7249755859375, 5.999267578125, 6.2735595703125, 6.5478515625, 6.8221435546875, 7.096435546875, 7.3707275390625, 7.64501953125, 7.9193115234375, 8.193603515625, 8.4678955078125, 8.7421875]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 5.0, 4.0, 4.0, 7.0, 10.0, 14.0, 29.0, 47.0, 46.0, 92.0, 134.0, 224.0, 367.0, 651.0, 1080.0, 2022.0, 4147.0, 8652.0, 18661.0, 43499.0, 104305.0, 231483.0, 312060.0, 181592.0, 78062.0, 33003.0, 14408.0, 6678.0, 3346.0, 1627.0, 953.0, 537.0, 290.0, 180.0, 122.0, 70.0, 55.0, 30.0, 19.0, 15.0, 8.0, 7.0, 3.0, 3.0, 1.0, 2.0, 3.0, 4.0, 3.0, 0.0, 2.0], "bins": [-9.2109375, -8.95025634765625, -8.6895751953125, -8.42889404296875, -8.168212890625, -7.90753173828125, -7.6468505859375, -7.38616943359375, -7.12548828125, -6.86480712890625, -6.6041259765625, -6.34344482421875, -6.082763671875, -5.82208251953125, -5.5614013671875, -5.30072021484375, -5.0400390625, -4.77935791015625, -4.5186767578125, -4.25799560546875, -3.997314453125, -3.73663330078125, -3.4759521484375, -3.21527099609375, -2.95458984375, -2.69390869140625, -2.4332275390625, -2.17254638671875, -1.911865234375, -1.65118408203125, -1.3905029296875, -1.12982177734375, -0.869140625, -0.60845947265625, -0.3477783203125, -0.08709716796875, 0.173583984375, 0.43426513671875, 0.6949462890625, 0.95562744140625, 1.21630859375, 1.47698974609375, 1.7376708984375, 1.99835205078125, 2.259033203125, 2.51971435546875, 2.7803955078125, 3.04107666015625, 3.3017578125, 3.56243896484375, 3.8231201171875, 4.08380126953125, 4.344482421875, 4.60516357421875, 4.8658447265625, 5.12652587890625, 5.38720703125, 5.64788818359375, 5.9085693359375, 6.16925048828125, 6.429931640625, 6.69061279296875, 6.9512939453125, 7.21197509765625, 7.47265625]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 0.0, 3.0, 2.0, 3.0, 4.0, 9.0, 18.0, 26.0, 40.0, 32.0, 44.0, 59.0, 86.0, 91.0, 86.0, 104.0, 77.0, 80.0, 70.0, 43.0, 34.0, 23.0, 27.0, 17.0, 10.0, 3.0, 5.0, 3.0, 7.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00025725364685058594, -0.00024600327014923096, -0.00023475289344787598, -0.000223502516746521, -0.00021225214004516602, -0.00020100176334381104, -0.00018975138664245605, -0.00017850100994110107, -0.0001672506332397461, -0.0001560002565383911, -0.00014474987983703613, -0.00013349950313568115, -0.00012224912643432617, -0.00011099874973297119, -9.974837303161621e-05, -8.849799633026123e-05, -7.724761962890625e-05, -6.599724292755127e-05, -5.474686622619629e-05, -4.349648952484131e-05, -3.224611282348633e-05, -2.0995736122131348e-05, -9.745359420776367e-06, 1.5050172805786133e-06, 1.2755393981933594e-05, 2.4005770683288574e-05, 3.5256147384643555e-05, 4.6506524085998535e-05, 5.7756900787353516e-05, 6.90072774887085e-05, 8.025765419006348e-05, 9.150803089141846e-05, 0.00010275840759277344, 0.00011400878429412842, 0.0001252591609954834, 0.00013650953769683838, 0.00014775991439819336, 0.00015901029109954834, 0.00017026066780090332, 0.0001815110445022583, 0.00019276142120361328, 0.00020401179790496826, 0.00021526217460632324, 0.00022651255130767822, 0.0002377629280090332, 0.0002490133047103882, 0.00026026368141174316, 0.00027151405811309814, 0.0002827644348144531, 0.0002940148115158081, 0.0003052651882171631, 0.00031651556491851807, 0.00032776594161987305, 0.00033901631832122803, 0.000350266695022583, 0.000361517071723938, 0.00037276744842529297, 0.00038401782512664795, 0.00039526820182800293, 0.0004065185785293579, 0.0004177689552307129, 0.00042901933193206787, 0.00044026970863342285, 0.00045152008533477783, 0.0004627704620361328]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 7.0, 8.0, 13.0, 12.0, 23.0, 28.0, 46.0, 69.0, 110.0, 159.0, 229.0, 417.0, 580.0, 957.0, 1598.0, 2669.0, 4507.0, 7868.0, 13435.0, 23550.0, 40633.0, 67744.0, 105759.0, 148062.0, 171329.0, 156566.0, 116137.0, 75469.0, 45992.0, 27303.0, 15374.0, 9058.0, 4945.0, 3071.0, 1834.0, 1128.0, 690.0, 430.0, 259.0, 175.0, 109.0, 67.0, 49.0, 34.0, 23.0, 17.0, 6.0, 9.0, 6.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.75390625, -5.5775146484375, -5.401123046875, -5.2247314453125, -5.04833984375, -4.8719482421875, -4.695556640625, -4.5191650390625, -4.3427734375, -4.1663818359375, -3.989990234375, -3.8135986328125, -3.63720703125, -3.4608154296875, -3.284423828125, -3.1080322265625, -2.931640625, -2.7552490234375, -2.578857421875, -2.4024658203125, -2.22607421875, -2.0496826171875, -1.873291015625, -1.6968994140625, -1.5205078125, -1.3441162109375, -1.167724609375, -0.9913330078125, -0.81494140625, -0.6385498046875, -0.462158203125, -0.2857666015625, -0.109375, 0.0670166015625, 0.243408203125, 0.4197998046875, 0.59619140625, 0.7725830078125, 0.948974609375, 1.1253662109375, 1.3017578125, 1.4781494140625, 1.654541015625, 1.8309326171875, 2.00732421875, 2.1837158203125, 2.360107421875, 2.5364990234375, 2.712890625, 2.8892822265625, 3.065673828125, 3.2420654296875, 3.41845703125, 3.5948486328125, 3.771240234375, 3.9476318359375, 4.1240234375, 4.3004150390625, 4.476806640625, 4.6531982421875, 4.82958984375, 5.0059814453125, 5.182373046875, 5.3587646484375, 5.53515625]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 5.0, 4.0, 10.0, 11.0, 6.0, 15.0, 20.0, 28.0, 29.0, 42.0, 39.0, 44.0, 50.0, 57.0, 69.0, 63.0, 88.0, 68.0, 66.0, 50.0, 37.0, 43.0, 36.0, 19.0, 25.0, 18.0, 18.0, 8.0, 13.0, 6.0, 5.0, 3.0, 7.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.34765625, -2.27862548828125, -2.2095947265625, -2.14056396484375, -2.071533203125, -2.00250244140625, -1.9334716796875, -1.86444091796875, -1.79541015625, -1.72637939453125, -1.6573486328125, -1.58831787109375, -1.519287109375, -1.45025634765625, -1.3812255859375, -1.31219482421875, -1.2431640625, -1.17413330078125, -1.1051025390625, -1.03607177734375, -0.967041015625, -0.89801025390625, -0.8289794921875, -0.75994873046875, -0.69091796875, -0.62188720703125, -0.5528564453125, -0.48382568359375, -0.414794921875, -0.34576416015625, -0.2767333984375, -0.20770263671875, -0.138671875, -0.06964111328125, -0.0006103515625, 0.06842041015625, 0.137451171875, 0.20648193359375, 0.2755126953125, 0.34454345703125, 0.41357421875, 0.48260498046875, 0.5516357421875, 0.62066650390625, 0.689697265625, 0.75872802734375, 0.8277587890625, 0.89678955078125, 0.9658203125, 1.03485107421875, 1.1038818359375, 1.17291259765625, 1.241943359375, 1.31097412109375, 1.3800048828125, 1.44903564453125, 1.51806640625, 1.58709716796875, 1.6561279296875, 1.72515869140625, 1.794189453125, 1.86322021484375, 1.9322509765625, 2.00128173828125, 2.0703125]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 12.0, 10.0, 14.0, 12.0, 18.0, 19.0, 23.0, 33.0, 40.0, 36.0, 36.0, 45.0, 54.0, 64.0, 67.0, 62.0, 63.0, 51.0, 58.0, 53.0, 38.0, 39.0, 28.0, 23.0, 22.0, 19.0, 18.0, 13.0, 15.0, 10.0, 6.0, 2.0, 0.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.2086238861084, -17.542585372924805, -16.87654685974121, -16.210508346557617, -15.544469833374023, -14.87843132019043, -14.212393760681152, -13.546355247497559, -12.880316734313965, -12.214278221130371, -11.548239707946777, -10.882201194763184, -10.216163635253906, -9.550125122070312, -8.884086608886719, -8.218048095703125, -7.552009582519531, -6.8859710693359375, -6.219932556152344, -5.553894519805908, -4.8878560066223145, -4.221817493438721, -3.555779218673706, -2.8897409439086914, -2.2237024307250977, -1.5576640367507935, -0.8916256427764893, -0.22558724880218506, 0.44045114517211914, 1.106489658355713, 1.7725279331207275, 2.438566207885742, 3.104602813720703, 3.770641326904297, 4.436679840087891, 5.102717876434326, 5.76875638961792, 6.434794902801514, 7.100832939147949, 7.766871452331543, 8.432909965515137, 9.09894847869873, 9.764986991882324, 10.431025505065918, 11.097063064575195, 11.763101577758789, 12.429140090942383, 13.095178604125977, 13.76121711730957, 14.427255630493164, 15.093294143676758, 15.759332656860352, 16.425371170043945, 17.09140968322754, 17.757448196411133, 18.423484802246094, 19.089523315429688, 19.75556182861328, 20.421600341796875, 21.08763885498047, 21.753677368164062, 22.419715881347656, 23.08575439453125, 23.751792907714844, 24.417831420898438]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 4.0, 5.0, 8.0, 8.0, 8.0, 15.0, 21.0, 16.0, 19.0, 18.0, 28.0, 31.0, 42.0, 32.0, 40.0, 28.0, 43.0, 43.0, 44.0, 36.0, 49.0, 52.0, 50.0, 45.0, 39.0, 38.0, 28.0, 22.0, 32.0, 29.0, 20.0, 21.0, 19.0, 12.0, 8.0, 18.0, 5.0, 11.0, 4.0, 6.0, 5.0, 1.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-14.421575546264648, -14.000016212463379, -13.57845687866211, -13.15689754486084, -12.73533821105957, -12.313777923583984, -11.892218589782715, -11.470659255981445, -11.049099922180176, -10.627540588378906, -10.205981254577637, -9.784421920776367, -9.362861633300781, -8.941303253173828, -8.519742965698242, -8.098183631896973, -7.676624298095703, -7.255064964294434, -6.833505630493164, -6.411945819854736, -5.990386486053467, -5.568827152252197, -5.1472673416137695, -4.7257080078125, -4.3041486740112305, -3.882589340209961, -3.4610297679901123, -3.0394701957702637, -2.617910861968994, -2.1963515281677246, -1.774791955947876, -1.3532323837280273, -0.9316720962524414, -0.5101126432418823, -0.08855319023132324, 0.33300626277923584, 0.7545657157897949, 1.1761250495910645, 1.597684621810913, 2.0192441940307617, 2.4408035278320312, 2.862362861633301, 3.2839224338531494, 3.705482006072998, 4.127041339874268, 4.548600673675537, 4.970160484313965, 5.391719818115234, 5.813279151916504, 6.234838485717773, 6.656397819519043, 7.077957630157471, 7.49951696395874, 7.92107629776001, 8.342636108398438, 8.764195442199707, 9.185754776000977, 9.607314109802246, 10.028873443603516, 10.450432777404785, 10.871992111206055, 11.29355239868164, 11.71511173248291, 12.13667106628418, 12.55823040008545]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 8.0, 4.0, 3.0, 9.0, 18.0, 32.0, 38.0, 42.0, 97.0, 114.0, 175.0, 281.0, 447.0, 721.0, 1054.0, 1615.0, 2625.0, 4214.0, 6750.0, 10061.0, 15996.0, 24552.0, 37102.0, 54470.0, 76297.0, 99314.0, 117226.0, 125344.0, 118914.0, 101661.0, 79429.0, 57020.0, 39215.0, 26326.0, 17329.0, 10738.0, 7058.0, 4462.0, 2810.0, 1839.0, 1097.0, 696.0, 505.0, 298.0, 194.0, 111.0, 67.0, 65.0, 36.0, 30.0, 11.0, 11.0, 11.0, 10.0, 4.0, 3.0, 4.0, 5.0], "bins": [-8.953125, -8.6864013671875, -8.419677734375, -8.1529541015625, -7.88623046875, -7.6195068359375, -7.352783203125, -7.0860595703125, -6.8193359375, -6.5526123046875, -6.285888671875, -6.0191650390625, -5.75244140625, -5.4857177734375, -5.218994140625, -4.9522705078125, -4.685546875, -4.4188232421875, -4.152099609375, -3.8853759765625, -3.61865234375, -3.3519287109375, -3.085205078125, -2.8184814453125, -2.5517578125, -2.2850341796875, -2.018310546875, -1.7515869140625, -1.48486328125, -1.2181396484375, -0.951416015625, -0.6846923828125, -0.41796875, -0.1512451171875, 0.115478515625, 0.3822021484375, 0.64892578125, 0.9156494140625, 1.182373046875, 1.4490966796875, 1.7158203125, 1.9825439453125, 2.249267578125, 2.5159912109375, 2.78271484375, 3.0494384765625, 3.316162109375, 3.5828857421875, 3.849609375, 4.1163330078125, 4.383056640625, 4.6497802734375, 4.91650390625, 5.1832275390625, 5.449951171875, 5.7166748046875, 5.9833984375, 6.2501220703125, 6.516845703125, 6.7835693359375, 7.05029296875, 7.3170166015625, 7.583740234375, 7.8504638671875, 8.1171875]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 5.0, 8.0, 10.0, 11.0, 15.0, 16.0, 24.0, 25.0, 20.0, 30.0, 31.0, 35.0, 26.0, 39.0, 39.0, 33.0, 35.0, 52.0, 44.0, 53.0, 34.0, 41.0, 43.0, 41.0, 43.0, 30.0, 25.0, 31.0, 22.0, 29.0, 23.0, 19.0, 12.0, 10.0, 11.0, 8.0, 6.0, 5.0, 3.0, 6.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-14.3046875, -13.85693359375, -13.4091796875, -12.96142578125, -12.513671875, -12.06591796875, -11.6181640625, -11.17041015625, -10.72265625, -10.27490234375, -9.8271484375, -9.37939453125, -8.931640625, -8.48388671875, -8.0361328125, -7.58837890625, -7.140625, -6.69287109375, -6.2451171875, -5.79736328125, -5.349609375, -4.90185546875, -4.4541015625, -4.00634765625, -3.55859375, -3.11083984375, -2.6630859375, -2.21533203125, -1.767578125, -1.31982421875, -0.8720703125, -0.42431640625, 0.0234375, 0.47119140625, 0.9189453125, 1.36669921875, 1.814453125, 2.26220703125, 2.7099609375, 3.15771484375, 3.60546875, 4.05322265625, 4.5009765625, 4.94873046875, 5.396484375, 5.84423828125, 6.2919921875, 6.73974609375, 7.1875, 7.63525390625, 8.0830078125, 8.53076171875, 8.978515625, 9.42626953125, 9.8740234375, 10.32177734375, 10.76953125, 11.21728515625, 11.6650390625, 12.11279296875, 12.560546875, 13.00830078125, 13.4560546875, 13.90380859375, 14.3515625]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 2.0, 7.0, 10.0, 10.0, 12.0, 19.0, 39.0, 68.0, 117.0, 179.0, 244.0, 374.0, 596.0, 887.0, 1393.0, 2170.0, 3185.0, 4891.0, 7272.0, 11108.0, 16541.0, 24065.0, 35886.0, 51589.0, 70161.0, 92255.0, 109613.0, 118387.0, 115536.0, 102151.0, 82317.0, 61531.0, 43772.0, 30510.0, 20846.0, 13880.0, 9115.0, 6117.0, 3889.0, 2732.0, 1747.0, 1175.0, 740.0, 496.0, 318.0, 218.0, 137.0, 91.0, 59.0, 45.0, 30.0, 10.0, 9.0, 4.0, 5.0, 4.0, 4.0, 0.0, 1.0, 1.0], "bins": [-8.421875, -8.1568603515625, -7.891845703125, -7.6268310546875, -7.36181640625, -7.0968017578125, -6.831787109375, -6.5667724609375, -6.3017578125, -6.0367431640625, -5.771728515625, -5.5067138671875, -5.24169921875, -4.9766845703125, -4.711669921875, -4.4466552734375, -4.181640625, -3.9166259765625, -3.651611328125, -3.3865966796875, -3.12158203125, -2.8565673828125, -2.591552734375, -2.3265380859375, -2.0615234375, -1.7965087890625, -1.531494140625, -1.2664794921875, -1.00146484375, -0.7364501953125, -0.471435546875, -0.2064208984375, 0.05859375, 0.3236083984375, 0.588623046875, 0.8536376953125, 1.11865234375, 1.3836669921875, 1.648681640625, 1.9136962890625, 2.1787109375, 2.4437255859375, 2.708740234375, 2.9737548828125, 3.23876953125, 3.5037841796875, 3.768798828125, 4.0338134765625, 4.298828125, 4.5638427734375, 4.828857421875, 5.0938720703125, 5.35888671875, 5.6239013671875, 5.888916015625, 6.1539306640625, 6.4189453125, 6.6839599609375, 6.948974609375, 7.2139892578125, 7.47900390625, 7.7440185546875, 8.009033203125, 8.2740478515625, 8.5390625]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 2.0, 10.0, 6.0, 7.0, 9.0, 13.0, 12.0, 11.0, 15.0, 21.0, 20.0, 18.0, 19.0, 27.0, 30.0, 22.0, 34.0, 33.0, 39.0, 39.0, 40.0, 33.0, 42.0, 39.0, 41.0, 30.0, 42.0, 44.0, 29.0, 27.0, 28.0, 35.0, 27.0, 19.0, 16.0, 21.0, 22.0, 12.0, 13.0, 11.0, 6.0, 12.0, 9.0, 4.0, 3.0, 3.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.38671875, -7.13177490234375, -6.8768310546875, -6.62188720703125, -6.366943359375, -6.11199951171875, -5.8570556640625, -5.60211181640625, -5.34716796875, -5.09222412109375, -4.8372802734375, -4.58233642578125, -4.327392578125, -4.07244873046875, -3.8175048828125, -3.56256103515625, -3.3076171875, -3.05267333984375, -2.7977294921875, -2.54278564453125, -2.287841796875, -2.03289794921875, -1.7779541015625, -1.52301025390625, -1.26806640625, -1.01312255859375, -0.7581787109375, -0.50323486328125, -0.248291015625, 0.00665283203125, 0.2615966796875, 0.51654052734375, 0.771484375, 1.02642822265625, 1.2813720703125, 1.53631591796875, 1.791259765625, 2.04620361328125, 2.3011474609375, 2.55609130859375, 2.81103515625, 3.06597900390625, 3.3209228515625, 3.57586669921875, 3.830810546875, 4.08575439453125, 4.3406982421875, 4.59564208984375, 4.8505859375, 5.10552978515625, 5.3604736328125, 5.61541748046875, 5.870361328125, 6.12530517578125, 6.3802490234375, 6.63519287109375, 6.89013671875, 7.14508056640625, 7.4000244140625, 7.65496826171875, 7.909912109375, 8.16485595703125, 8.4197998046875, 8.67474365234375, 8.9296875]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 10.0, 9.0, 15.0, 16.0, 30.0, 32.0, 40.0, 66.0, 139.0, 215.0, 369.0, 782.0, 1394.0, 2582.0, 5253.0, 10871.0, 22785.0, 46154.0, 89723.0, 154890.0, 208815.0, 201756.0, 142206.0, 80650.0, 40918.0, 19687.0, 9394.0, 4656.0, 2314.0, 1273.0, 644.0, 352.0, 194.0, 130.0, 53.0, 42.0, 21.0, 16.0, 12.0, 13.0, 12.0, 5.0, 9.0, 2.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-7.1953125, -6.9625244140625, -6.729736328125, -6.4969482421875, -6.26416015625, -6.0313720703125, -5.798583984375, -5.5657958984375, -5.3330078125, -5.1002197265625, -4.867431640625, -4.6346435546875, -4.40185546875, -4.1690673828125, -3.936279296875, -3.7034912109375, -3.470703125, -3.2379150390625, -3.005126953125, -2.7723388671875, -2.53955078125, -2.3067626953125, -2.073974609375, -1.8411865234375, -1.6083984375, -1.3756103515625, -1.142822265625, -0.9100341796875, -0.67724609375, -0.4444580078125, -0.211669921875, 0.0211181640625, 0.25390625, 0.4866943359375, 0.719482421875, 0.9522705078125, 1.18505859375, 1.4178466796875, 1.650634765625, 1.8834228515625, 2.1162109375, 2.3489990234375, 2.581787109375, 2.8145751953125, 3.04736328125, 3.2801513671875, 3.512939453125, 3.7457275390625, 3.978515625, 4.2113037109375, 4.444091796875, 4.6768798828125, 4.90966796875, 5.1424560546875, 5.375244140625, 5.6080322265625, 5.8408203125, 6.0736083984375, 6.306396484375, 6.5391845703125, 6.77197265625, 7.0047607421875, 7.237548828125, 7.4703369140625, 7.703125]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 1.0, 3.0, 2.0, 9.0, 12.0, 13.0, 20.0, 24.0, 33.0, 40.0, 54.0, 57.0, 63.0, 73.0, 75.0, 70.0, 65.0, 65.0, 60.0, 50.0, 51.0, 42.0, 29.0, 25.0, 17.0, 6.0, 10.0, 9.0, 3.0, 6.0, 2.0, 3.0, 1.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0008082389831542969, -0.0007845014333724976, -0.0007607638835906982, -0.0007370263338088989, -0.0007132887840270996, -0.0006895512342453003, -0.000665813684463501, -0.0006420761346817017, -0.0006183385848999023, -0.000594601035118103, -0.0005708634853363037, -0.0005471259355545044, -0.0005233883857727051, -0.0004996508359909058, -0.00047591328620910645, -0.00045217573642730713, -0.0004284381866455078, -0.0004047006368637085, -0.0003809630870819092, -0.00035722553730010986, -0.00033348798751831055, -0.00030975043773651123, -0.0002860128879547119, -0.0002622753381729126, -0.00023853778839111328, -0.00021480023860931396, -0.00019106268882751465, -0.00016732513904571533, -0.00014358758926391602, -0.0001198500394821167, -9.611248970031738e-05, -7.237493991851807e-05, -4.863739013671875e-05, -2.4899840354919434e-05, -1.1622905731201172e-06, 2.25752592086792e-05, 4.6312808990478516e-05, 7.005035877227783e-05, 9.378790855407715e-05, 0.00011752545833587646, 0.00014126300811767578, 0.0001650005578994751, 0.00018873810768127441, 0.00021247565746307373, 0.00023621320724487305, 0.00025995075702667236, 0.0002836883068084717, 0.000307425856590271, 0.0003311634063720703, 0.00035490095615386963, 0.00037863850593566895, 0.00040237605571746826, 0.0004261136054992676, 0.0004498511552810669, 0.0004735887050628662, 0.0004973262548446655, 0.0005210638046264648, 0.0005448013544082642, 0.0005685389041900635, 0.0005922764539718628, 0.0006160140037536621, 0.0006397515535354614, 0.0006634891033172607, 0.0006872266530990601, 0.0007109642028808594]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 8.0, 12.0, 19.0, 29.0, 30.0, 62.0, 93.0, 140.0, 257.0, 347.0, 566.0, 870.0, 1395.0, 2265.0, 3489.0, 5589.0, 9084.0, 14569.0, 23606.0, 37029.0, 57735.0, 84284.0, 114470.0, 137061.0, 142341.0, 126266.0, 97655.0, 67820.0, 45037.0, 28572.0, 18005.0, 11191.0, 6883.0, 4351.0, 2665.0, 1704.0, 1113.0, 710.0, 438.0, 258.0, 188.0, 117.0, 87.0, 55.0, 32.0, 23.0, 9.0, 12.0, 5.0, 5.0, 4.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.25, -5.0870361328125, -4.924072265625, -4.7611083984375, -4.59814453125, -4.4351806640625, -4.272216796875, -4.1092529296875, -3.9462890625, -3.7833251953125, -3.620361328125, -3.4573974609375, -3.29443359375, -3.1314697265625, -2.968505859375, -2.8055419921875, -2.642578125, -2.4796142578125, -2.316650390625, -2.1536865234375, -1.99072265625, -1.8277587890625, -1.664794921875, -1.5018310546875, -1.3388671875, -1.1759033203125, -1.012939453125, -0.8499755859375, -0.68701171875, -0.5240478515625, -0.361083984375, -0.1981201171875, -0.03515625, 0.1278076171875, 0.290771484375, 0.4537353515625, 0.61669921875, 0.7796630859375, 0.942626953125, 1.1055908203125, 1.2685546875, 1.4315185546875, 1.594482421875, 1.7574462890625, 1.92041015625, 2.0833740234375, 2.246337890625, 2.4093017578125, 2.572265625, 2.7352294921875, 2.898193359375, 3.0611572265625, 3.22412109375, 3.3870849609375, 3.550048828125, 3.7130126953125, 3.8759765625, 4.0389404296875, 4.201904296875, 4.3648681640625, 4.52783203125, 4.6907958984375, 4.853759765625, 5.0167236328125, 5.1796875]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 1.0, 3.0, 2.0, 3.0, 10.0, 7.0, 8.0, 7.0, 18.0, 17.0, 26.0, 28.0, 29.0, 37.0, 46.0, 40.0, 39.0, 41.0, 62.0, 54.0, 67.0, 53.0, 53.0, 47.0, 55.0, 47.0, 39.0, 21.0, 30.0, 22.0, 19.0, 16.0, 10.0, 10.0, 11.0, 8.0, 6.0, 4.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.75, -1.6938629150390625, -1.637725830078125, -1.5815887451171875, -1.52545166015625, -1.4693145751953125, -1.413177490234375, -1.3570404052734375, -1.3009033203125, -1.2447662353515625, -1.188629150390625, -1.1324920654296875, -1.07635498046875, -1.0202178955078125, -0.964080810546875, -0.9079437255859375, -0.851806640625, -0.7956695556640625, -0.739532470703125, -0.6833953857421875, -0.62725830078125, -0.5711212158203125, -0.514984130859375, -0.4588470458984375, -0.4027099609375, -0.3465728759765625, -0.290435791015625, -0.2342987060546875, -0.17816162109375, -0.1220245361328125, -0.065887451171875, -0.0097503662109375, 0.04638671875, 0.1025238037109375, 0.158660888671875, 0.2147979736328125, 0.27093505859375, 0.3270721435546875, 0.383209228515625, 0.4393463134765625, 0.4954833984375, 0.5516204833984375, 0.607757568359375, 0.6638946533203125, 0.72003173828125, 0.7761688232421875, 0.832305908203125, 0.8884429931640625, 0.944580078125, 1.0007171630859375, 1.056854248046875, 1.1129913330078125, 1.16912841796875, 1.2252655029296875, 1.281402587890625, 1.3375396728515625, 1.3936767578125, 1.4498138427734375, 1.505950927734375, 1.5620880126953125, 1.61822509765625, 1.6743621826171875, 1.730499267578125, 1.7866363525390625, 1.8427734375]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 3.0, 10.0, 11.0, 11.0, 10.0, 14.0, 17.0, 20.0, 25.0, 36.0, 37.0, 37.0, 49.0, 52.0, 41.0, 62.0, 55.0, 59.0, 61.0, 46.0, 57.0, 40.0, 47.0, 25.0, 31.0, 24.0, 21.0, 20.0, 15.0, 30.0, 14.0, 10.0, 2.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.08586883544922, -16.457021713256836, -15.82817268371582, -15.199324607849121, -14.570476531982422, -13.941629409790039, -13.31278133392334, -12.68393325805664, -12.055085182189941, -11.426237106323242, -10.797389030456543, -10.168540954589844, -9.539693832397461, -8.910844802856445, -8.281997680664062, -7.653149604797363, -7.024301528930664, -6.395453453063965, -5.766605377197266, -5.137757778167725, -4.508909702301025, -3.880061626434326, -3.251213788986206, -2.622365951538086, -1.9935178756713867, -1.364669919013977, -0.7358219623565674, -0.10697400569915771, 0.521873950958252, 1.1507220268249512, 1.7795698642730713, 2.4084177017211914, 3.0372657775878906, 3.66611385345459, 4.294961929321289, 4.92380952835083, 5.552657604217529, 6.1815056800842285, 6.8103532791137695, 7.439201354980469, 8.068049430847168, 8.696897506713867, 9.325745582580566, 9.954593658447266, 10.583440780639648, 11.212289810180664, 11.841136932373047, 12.469985008239746, 13.098833084106445, 13.727681159973145, 14.356529235839844, 14.985377311706543, 15.614225387573242, 16.243072509765625, 16.87192153930664, 17.500768661499023, 18.129615783691406, 18.75846290588379, 19.387311935424805, 20.016159057617188, 20.645008087158203, 21.273855209350586, 21.9027042388916, 22.531551361083984, 23.160400390625]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 6.0, 1.0, 8.0, 11.0, 10.0, 12.0, 15.0, 19.0, 16.0, 25.0, 17.0, 31.0, 31.0, 35.0, 30.0, 39.0, 56.0, 32.0, 46.0, 29.0, 44.0, 36.0, 39.0, 44.0, 41.0, 36.0, 32.0, 34.0, 23.0, 31.0, 22.0, 20.0, 31.0, 19.0, 19.0, 13.0, 14.0, 10.0, 7.0, 4.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-14.279146194458008, -13.843429565429688, -13.407712936401367, -12.971996307373047, -12.536279678344727, -12.100563049316406, -11.664847373962402, -11.229130744934082, -10.793414115905762, -10.357697486877441, -9.921980857849121, -9.4862642288208, -9.050548553466797, -8.614831924438477, -8.179115295410156, -7.743398666381836, -7.307682037353516, -6.871965408325195, -6.436248779296875, -6.000532627105713, -5.564815998077393, -5.129099369049072, -4.69338321685791, -4.25766658782959, -3.8219499588012695, -3.386233329772949, -2.950516939163208, -2.514800548553467, -2.0790839195251465, -1.6433672904968262, -1.207650899887085, -0.7719345092773438, -0.33621788024902344, 0.09949862957000732, 0.5352151393890381, 0.9709316492080688, 1.4066481590270996, 1.84236478805542, 2.278081178665161, 2.7137975692749023, 3.1495141983032227, 3.585230827331543, 4.020947456359863, 4.456663608551025, 4.892380237579346, 5.328096866607666, 5.763813018798828, 6.199529647827148, 6.635246276855469, 7.070962905883789, 7.506679534912109, 7.9423956871032715, 8.37811279296875, 8.81382942199707, 9.249545097351074, 9.685261726379395, 10.120978355407715, 10.556694984436035, 10.992411613464355, 11.428128242492676, 11.86384391784668, 12.299560546875, 12.73527717590332, 13.17099380493164, 13.606710433959961]}, "gradients/decoder.bert.encoder.layer.1.output.dense.weight": {"_type": "histogram", "values": [6.0, 7.0, 8.0, 20.0, 35.0, 60.0, 105.0, 144.0, 219.0, 316.0, 510.0, 859.0, 1267.0, 1923.0, 3000.0, 5134.0, 8234.0, 14017.0, 24932.0, 44688.0, 80545.0, 145907.0, 255239.0, 425376.0, 625798.0, 740709.0, 664830.0, 472216.0, 291869.0, 167302.0, 93693.0, 52571.0, 29680.0, 16835.0, 9816.0, 5872.0, 3710.0, 2283.0, 1466.0, 985.0, 637.0, 455.0, 290.0, 211.0, 152.0, 102.0, 66.0, 56.0, 36.0, 34.0, 20.0, 19.0, 8.0, 8.0, 5.0, 5.0, 2.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.71875, -13.183349609375, -12.64794921875, -12.112548828125, -11.5771484375, -11.041748046875, -10.50634765625, -9.970947265625, -9.435546875, -8.900146484375, -8.36474609375, -7.829345703125, -7.2939453125, -6.758544921875, -6.22314453125, -5.687744140625, -5.15234375, -4.616943359375, -4.08154296875, -3.546142578125, -3.0107421875, -2.475341796875, -1.93994140625, -1.404541015625, -0.869140625, -0.333740234375, 0.20166015625, 0.737060546875, 1.2724609375, 1.807861328125, 2.34326171875, 2.878662109375, 3.4140625, 3.949462890625, 4.48486328125, 5.020263671875, 5.5556640625, 6.091064453125, 6.62646484375, 7.161865234375, 7.697265625, 8.232666015625, 8.76806640625, 9.303466796875, 9.8388671875, 10.374267578125, 10.90966796875, 11.445068359375, 11.98046875, 12.515869140625, 13.05126953125, 13.586669921875, 14.1220703125, 14.657470703125, 15.19287109375, 15.728271484375, 16.263671875, 16.799072265625, 17.33447265625, 17.869873046875, 18.4052734375, 18.940673828125, 19.47607421875, 20.011474609375, 20.546875]}, "gradients/decoder.bert.encoder.layer.1.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 5.0, 5.0, 2.0, 9.0, 10.0, 12.0, 9.0, 9.0, 8.0, 22.0, 31.0, 21.0, 23.0, 27.0, 26.0, 26.0, 43.0, 34.0, 40.0, 45.0, 46.0, 53.0, 48.0, 42.0, 27.0, 31.0, 37.0, 36.0, 38.0, 36.0, 31.0, 26.0, 22.0, 16.0, 14.0, 17.0, 20.0, 10.0, 14.0, 11.0, 7.0, 4.0, 3.0, 4.0, 3.0, 2.0, 0.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.328125, -10.964111328125, -10.60009765625, -10.236083984375, -9.8720703125, -9.508056640625, -9.14404296875, -8.780029296875, -8.416015625, -8.052001953125, -7.68798828125, -7.323974609375, -6.9599609375, -6.595947265625, -6.23193359375, -5.867919921875, -5.50390625, -5.139892578125, -4.77587890625, -4.411865234375, -4.0478515625, -3.683837890625, -3.31982421875, -2.955810546875, -2.591796875, -2.227783203125, -1.86376953125, -1.499755859375, -1.1357421875, -0.771728515625, -0.40771484375, -0.043701171875, 0.3203125, 0.684326171875, 1.04833984375, 1.412353515625, 1.7763671875, 2.140380859375, 2.50439453125, 2.868408203125, 3.232421875, 3.596435546875, 3.96044921875, 4.324462890625, 4.6884765625, 5.052490234375, 5.41650390625, 5.780517578125, 6.14453125, 6.508544921875, 6.87255859375, 7.236572265625, 7.6005859375, 7.964599609375, 8.32861328125, 8.692626953125, 9.056640625, 9.420654296875, 9.78466796875, 10.148681640625, 10.5126953125, 10.876708984375, 11.24072265625, 11.604736328125, 11.96875]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 5.0, 4.0, 6.0, 14.0, 14.0, 32.0, 29.0, 50.0, 79.0, 118.0, 154.0, 245.0, 406.0, 623.0, 947.0, 1604.0, 2425.0, 3864.0, 6312.0, 9856.0, 15812.0, 26208.0, 42394.0, 69383.0, 111304.0, 176651.0, 268644.0, 383009.0, 499025.0, 568265.0, 555465.0, 464418.0, 346725.0, 236001.0, 152705.0, 96219.0, 59433.0, 36610.0, 22594.0, 13846.0, 8557.0, 5229.0, 3297.0, 2070.0, 1261.0, 830.0, 565.0, 333.0, 237.0, 136.0, 113.0, 48.0, 37.0, 31.0, 14.0, 17.0, 12.0, 8.0, 2.0, 2.0, 2.0], "bins": [-17.671875, -17.1337890625, -16.595703125, -16.0576171875, -15.51953125, -14.9814453125, -14.443359375, -13.9052734375, -13.3671875, -12.8291015625, -12.291015625, -11.7529296875, -11.21484375, -10.6767578125, -10.138671875, -9.6005859375, -9.0625, -8.5244140625, -7.986328125, -7.4482421875, -6.91015625, -6.3720703125, -5.833984375, -5.2958984375, -4.7578125, -4.2197265625, -3.681640625, -3.1435546875, -2.60546875, -2.0673828125, -1.529296875, -0.9912109375, -0.453125, 0.0849609375, 0.623046875, 1.1611328125, 1.69921875, 2.2373046875, 2.775390625, 3.3134765625, 3.8515625, 4.3896484375, 4.927734375, 5.4658203125, 6.00390625, 6.5419921875, 7.080078125, 7.6181640625, 8.15625, 8.6943359375, 9.232421875, 9.7705078125, 10.30859375, 10.8466796875, 11.384765625, 11.9228515625, 12.4609375, 12.9990234375, 13.537109375, 14.0751953125, 14.61328125, 15.1513671875, 15.689453125, 16.2275390625, 16.765625]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 6.0, 1.0, 4.0, 9.0, 10.0, 13.0, 19.0, 20.0, 31.0, 31.0, 54.0, 61.0, 59.0, 75.0, 102.0, 129.0, 136.0, 169.0, 161.0, 176.0, 188.0, 214.0, 250.0, 231.0, 224.0, 216.0, 188.0, 218.0, 187.0, 161.0, 140.0, 108.0, 100.0, 85.0, 64.0, 44.0, 33.0, 44.0, 31.0, 23.0, 22.0, 7.0, 10.0, 6.0, 6.0, 5.0, 1.0, 4.0, 3.0, 4.0, 2.0, 0.0, 2.0], "bins": [-7.2578125, -7.04803466796875, -6.8382568359375, -6.62847900390625, -6.418701171875, -6.20892333984375, -5.9991455078125, -5.78936767578125, -5.57958984375, -5.36981201171875, -5.1600341796875, -4.95025634765625, -4.740478515625, -4.53070068359375, -4.3209228515625, -4.11114501953125, -3.9013671875, -3.69158935546875, -3.4818115234375, -3.27203369140625, -3.062255859375, -2.85247802734375, -2.6427001953125, -2.43292236328125, -2.22314453125, -2.01336669921875, -1.8035888671875, -1.59381103515625, -1.384033203125, -1.17425537109375, -0.9644775390625, -0.75469970703125, -0.544921875, -0.33514404296875, -0.1253662109375, 0.08441162109375, 0.294189453125, 0.50396728515625, 0.7137451171875, 0.92352294921875, 1.13330078125, 1.34307861328125, 1.5528564453125, 1.76263427734375, 1.972412109375, 2.18218994140625, 2.3919677734375, 2.60174560546875, 2.8115234375, 3.02130126953125, 3.2310791015625, 3.44085693359375, 3.650634765625, 3.86041259765625, 4.0701904296875, 4.27996826171875, 4.48974609375, 4.69952392578125, 4.9093017578125, 5.11907958984375, 5.328857421875, 5.53863525390625, 5.7484130859375, 5.95819091796875, 6.16796875]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 4.0, 5.0, 6.0, 9.0, 12.0, 16.0, 25.0, 19.0, 21.0, 37.0, 48.0, 37.0, 44.0, 59.0, 63.0, 54.0, 65.0, 60.0, 56.0, 55.0, 51.0, 54.0, 43.0, 30.0, 26.0, 20.0, 30.0, 16.0, 5.0, 15.0, 8.0, 4.0, 2.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.70885467529297, -25.779415130615234, -24.849973678588867, -23.920534133911133, -22.991092681884766, -22.06165313720703, -21.132213592529297, -20.202774047851562, -19.273332595825195, -18.34389305114746, -17.414451599121094, -16.48501205444336, -15.555571556091309, -14.626131057739258, -13.696691513061523, -12.767251014709473, -11.837810516357422, -10.908370018005371, -9.97892951965332, -9.049489974975586, -8.120049476623535, -7.190608978271484, -6.261168956756592, -5.331728935241699, -4.402288436889648, -3.4728481769561768, -2.543407917022705, -1.6139676570892334, -0.6845273971557617, 0.24491310119628906, 1.1743531227111816, 2.103793144226074, 3.033233642578125, 3.9626739025115967, 4.892114162445068, 5.821554183959961, 6.750994682312012, 7.6804351806640625, 8.609874725341797, 9.539315223693848, 10.468755722045898, 11.39819622039795, 12.32763671875, 13.257076263427734, 14.186516761779785, 15.115957260131836, 16.04539680480957, 16.974838256835938, 17.904277801513672, 18.833717346191406, 19.763158798217773, 20.692598342895508, 21.622039794921875, 22.55147933959961, 23.480918884277344, 24.410358428955078, 25.339799880981445, 26.26923942565918, 27.198680877685547, 28.12812042236328, 29.057559967041016, 29.987001419067383, 30.916440963745117, 31.845882415771484, 32.77532196044922]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 6.0, 8.0, 6.0, 8.0, 13.0, 11.0, 18.0, 20.0, 20.0, 26.0, 23.0, 34.0, 26.0, 37.0, 31.0, 57.0, 44.0, 47.0, 47.0, 39.0, 39.0, 43.0, 50.0, 42.0, 35.0, 31.0, 33.0, 26.0, 18.0, 23.0, 24.0, 25.0, 12.0, 19.0, 17.0, 5.0, 8.0, 6.0, 4.0, 9.0, 6.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.36580467224121, -15.850807189941406, -15.335808753967285, -14.82081127166748, -14.30581283569336, -13.790815353393555, -13.27581787109375, -12.760820388793945, -12.245821952819824, -11.73082447052002, -11.215826034545898, -10.700828552246094, -10.185831069946289, -9.670832633972168, -9.155835151672363, -8.640836715698242, -8.125839233398438, -7.610841274261475, -7.095843315124512, -6.580845832824707, -6.065847873687744, -5.550849914550781, -5.035852432250977, -4.520854473114014, -4.005856513977051, -3.490858554840088, -2.975860834121704, -2.4608631134033203, -1.9458651542663574, -1.4308671951293945, -0.9158694744110107, -0.40087175369262695, 0.11412429809570312, 0.6291221380233765, 1.1441199779510498, 1.6591178178787231, 2.1741156578063965, 2.6891136169433594, 3.204111337661743, 3.719109058380127, 4.23410701751709, 4.749104976654053, 5.264102935791016, 5.77910041809082, 6.294098377227783, 6.809096336364746, 7.324093818664551, 7.839091777801514, 8.354089736938477, 8.869087219238281, 9.384085655212402, 9.899083137512207, 10.414081573486328, 10.929079055786133, 11.444076538085938, 11.959074020385742, 12.474072456359863, 12.989069938659668, 13.504068374633789, 14.019065856933594, 14.534063339233398, 15.04906177520752, 15.564059257507324, 16.079057693481445, 16.59405517578125]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 4.0, 1.0, 7.0, 7.0, 5.0, 9.0, 17.0, 21.0, 26.0, 38.0, 58.0, 85.0, 142.0, 273.0, 416.0, 686.0, 1201.0, 1955.0, 3485.0, 5924.0, 10164.0, 17237.0, 29093.0, 48625.0, 77216.0, 113620.0, 149031.0, 161507.0, 143423.0, 106130.0, 70073.0, 43898.0, 26519.0, 15722.0, 9013.0, 5355.0, 3153.0, 1808.0, 1029.0, 587.0, 377.0, 229.0, 130.0, 93.0, 65.0, 36.0, 18.0, 19.0, 11.0, 6.0, 5.0, 2.0, 4.0, 3.0, 2.0, 1.0], "bins": [-11.2265625, -10.909423828125, -10.59228515625, -10.275146484375, -9.9580078125, -9.640869140625, -9.32373046875, -9.006591796875, -8.689453125, -8.372314453125, -8.05517578125, -7.738037109375, -7.4208984375, -7.103759765625, -6.78662109375, -6.469482421875, -6.15234375, -5.835205078125, -5.51806640625, -5.200927734375, -4.8837890625, -4.566650390625, -4.24951171875, -3.932373046875, -3.615234375, -3.298095703125, -2.98095703125, -2.663818359375, -2.3466796875, -2.029541015625, -1.71240234375, -1.395263671875, -1.078125, -0.760986328125, -0.44384765625, -0.126708984375, 0.1904296875, 0.507568359375, 0.82470703125, 1.141845703125, 1.458984375, 1.776123046875, 2.09326171875, 2.410400390625, 2.7275390625, 3.044677734375, 3.36181640625, 3.678955078125, 3.99609375, 4.313232421875, 4.63037109375, 4.947509765625, 5.2646484375, 5.581787109375, 5.89892578125, 6.216064453125, 6.533203125, 6.850341796875, 7.16748046875, 7.484619140625, 7.8017578125, 8.118896484375, 8.43603515625, 8.753173828125, 9.0703125]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 4.0, 3.0, 10.0, 14.0, 14.0, 13.0, 25.0, 14.0, 17.0, 31.0, 23.0, 34.0, 27.0, 32.0, 39.0, 38.0, 51.0, 50.0, 37.0, 29.0, 46.0, 46.0, 43.0, 48.0, 34.0, 41.0, 32.0, 27.0, 30.0, 22.0, 16.0, 15.0, 18.0, 17.0, 12.0, 13.0, 6.0, 10.0, 10.0, 1.0, 3.0, 2.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.984375, -18.434814453125, -17.88525390625, -17.335693359375, -16.7861328125, -16.236572265625, -15.68701171875, -15.137451171875, -14.587890625, -14.038330078125, -13.48876953125, -12.939208984375, -12.3896484375, -11.840087890625, -11.29052734375, -10.740966796875, -10.19140625, -9.641845703125, -9.09228515625, -8.542724609375, -7.9931640625, -7.443603515625, -6.89404296875, -6.344482421875, -5.794921875, -5.245361328125, -4.69580078125, -4.146240234375, -3.5966796875, -3.047119140625, -2.49755859375, -1.947998046875, -1.3984375, -0.848876953125, -0.29931640625, 0.250244140625, 0.7998046875, 1.349365234375, 1.89892578125, 2.448486328125, 2.998046875, 3.547607421875, 4.09716796875, 4.646728515625, 5.1962890625, 5.745849609375, 6.29541015625, 6.844970703125, 7.39453125, 7.944091796875, 8.49365234375, 9.043212890625, 9.5927734375, 10.142333984375, 10.69189453125, 11.241455078125, 11.791015625, 12.340576171875, 12.89013671875, 13.439697265625, 13.9892578125, 14.538818359375, 15.08837890625, 15.637939453125, 16.1875]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 2.0, 4.0, 6.0, 14.0, 14.0, 29.0, 37.0, 54.0, 77.0, 147.0, 238.0, 355.0, 562.0, 1007.0, 1810.0, 3518.0, 6396.0, 13325.0, 28510.0, 64267.0, 144107.0, 267929.0, 262575.0, 138758.0, 61093.0, 27171.0, 12682.0, 6332.0, 3236.0, 1748.0, 953.0, 606.0, 386.0, 233.0, 146.0, 84.0, 54.0, 40.0, 15.0, 13.0, 15.0, 3.0, 2.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-21.796875, -21.173583984375, -20.55029296875, -19.927001953125, -19.3037109375, -18.680419921875, -18.05712890625, -17.433837890625, -16.810546875, -16.187255859375, -15.56396484375, -14.940673828125, -14.3173828125, -13.694091796875, -13.07080078125, -12.447509765625, -11.82421875, -11.200927734375, -10.57763671875, -9.954345703125, -9.3310546875, -8.707763671875, -8.08447265625, -7.461181640625, -6.837890625, -6.214599609375, -5.59130859375, -4.968017578125, -4.3447265625, -3.721435546875, -3.09814453125, -2.474853515625, -1.8515625, -1.228271484375, -0.60498046875, 0.018310546875, 0.6416015625, 1.264892578125, 1.88818359375, 2.511474609375, 3.134765625, 3.758056640625, 4.38134765625, 5.004638671875, 5.6279296875, 6.251220703125, 6.87451171875, 7.497802734375, 8.12109375, 8.744384765625, 9.36767578125, 9.990966796875, 10.6142578125, 11.237548828125, 11.86083984375, 12.484130859375, 13.107421875, 13.730712890625, 14.35400390625, 14.977294921875, 15.6005859375, 16.223876953125, 16.84716796875, 17.470458984375, 18.09375]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 7.0, 9.0, 11.0, 8.0, 14.0, 12.0, 11.0, 19.0, 22.0, 17.0, 29.0, 31.0, 39.0, 41.0, 34.0, 39.0, 39.0, 33.0, 37.0, 42.0, 40.0, 44.0, 31.0, 36.0, 30.0, 42.0, 31.0, 39.0, 27.0, 35.0, 20.0, 21.0, 28.0, 16.0, 8.0, 19.0, 11.0, 9.0, 4.0, 5.0, 9.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.9453125, -8.638916015625, -8.33251953125, -8.026123046875, -7.7197265625, -7.413330078125, -7.10693359375, -6.800537109375, -6.494140625, -6.187744140625, -5.88134765625, -5.574951171875, -5.2685546875, -4.962158203125, -4.65576171875, -4.349365234375, -4.04296875, -3.736572265625, -3.43017578125, -3.123779296875, -2.8173828125, -2.510986328125, -2.20458984375, -1.898193359375, -1.591796875, -1.285400390625, -0.97900390625, -0.672607421875, -0.3662109375, -0.059814453125, 0.24658203125, 0.552978515625, 0.859375, 1.165771484375, 1.47216796875, 1.778564453125, 2.0849609375, 2.391357421875, 2.69775390625, 3.004150390625, 3.310546875, 3.616943359375, 3.92333984375, 4.229736328125, 4.5361328125, 4.842529296875, 5.14892578125, 5.455322265625, 5.76171875, 6.068115234375, 6.37451171875, 6.680908203125, 6.9873046875, 7.293701171875, 7.60009765625, 7.906494140625, 8.212890625, 8.519287109375, 8.82568359375, 9.132080078125, 9.4384765625, 9.744873046875, 10.05126953125, 10.357666015625, 10.6640625]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 1.0, 2.0, 0.0, 1.0, 3.0, 5.0, 15.0, 19.0, 17.0, 20.0, 49.0, 52.0, 98.0, 135.0, 248.0, 363.0, 538.0, 957.0, 1539.0, 2606.0, 4657.0, 8216.0, 15740.0, 29870.0, 58283.0, 111421.0, 192413.0, 239284.0, 174667.0, 98269.0, 50995.0, 26415.0, 13756.0, 7621.0, 4219.0, 2401.0, 1365.0, 821.0, 542.0, 322.0, 211.0, 139.0, 94.0, 48.0, 32.0, 31.0, 22.0, 14.0, 8.0, 6.0, 4.0, 1.0, 3.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-7.91796875, -7.65753173828125, -7.3970947265625, -7.13665771484375, -6.876220703125, -6.61578369140625, -6.3553466796875, -6.09490966796875, -5.83447265625, -5.57403564453125, -5.3135986328125, -5.05316162109375, -4.792724609375, -4.53228759765625, -4.2718505859375, -4.01141357421875, -3.7509765625, -3.49053955078125, -3.2301025390625, -2.96966552734375, -2.709228515625, -2.44879150390625, -2.1883544921875, -1.92791748046875, -1.66748046875, -1.40704345703125, -1.1466064453125, -0.88616943359375, -0.625732421875, -0.36529541015625, -0.1048583984375, 0.15557861328125, 0.416015625, 0.67645263671875, 0.9368896484375, 1.19732666015625, 1.457763671875, 1.71820068359375, 1.9786376953125, 2.23907470703125, 2.49951171875, 2.75994873046875, 3.0203857421875, 3.28082275390625, 3.541259765625, 3.80169677734375, 4.0621337890625, 4.32257080078125, 4.5830078125, 4.84344482421875, 5.1038818359375, 5.36431884765625, 5.624755859375, 5.88519287109375, 6.1456298828125, 6.40606689453125, 6.66650390625, 6.92694091796875, 7.1873779296875, 7.44781494140625, 7.708251953125, 7.96868896484375, 8.2291259765625, 8.48956298828125, 8.75]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 6.0, 9.0, 8.0, 11.0, 11.0, 27.0, 26.0, 32.0, 42.0, 38.0, 41.0, 56.0, 58.0, 65.0, 70.0, 66.0, 69.0, 52.0, 47.0, 49.0, 36.0, 32.0, 23.0, 26.0, 20.0, 15.0, 16.0, 7.0, 3.0, 10.0, 6.0, 3.0, 2.0, 1.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00033926963806152344, -0.00032934918999671936, -0.0003194287419319153, -0.0003095082938671112, -0.00029958784580230713, -0.00028966739773750305, -0.000279746949672699, -0.0002698265016078949, -0.0002599060535430908, -0.00024998560547828674, -0.00024006515741348267, -0.0002301447093486786, -0.0002202242612838745, -0.00021030381321907043, -0.00020038336515426636, -0.00019046291708946228, -0.0001805424690246582, -0.00017062202095985413, -0.00016070157289505005, -0.00015078112483024597, -0.0001408606767654419, -0.00013094022870063782, -0.00012101978063583374, -0.00011109933257102966, -0.00010117888450622559, -9.125843644142151e-05, -8.133798837661743e-05, -7.141754031181335e-05, -6.149709224700928e-05, -5.15766441822052e-05, -4.165619611740112e-05, -3.1735748052597046e-05, -2.181529998779297e-05, -1.1894851922988892e-05, -1.9744038581848145e-06, 7.946044206619263e-06, 1.786649227142334e-05, 2.7786940336227417e-05, 3.7707388401031494e-05, 4.762783646583557e-05, 5.754828453063965e-05, 6.746873259544373e-05, 7.73891806602478e-05, 8.730962872505188e-05, 9.723007678985596e-05, 0.00010715052485466003, 0.00011707097291946411, 0.0001269914209842682, 0.00013691186904907227, 0.00014683231711387634, 0.00015675276517868042, 0.0001666732132434845, 0.00017659366130828857, 0.00018651410937309265, 0.00019643455743789673, 0.0002063550055027008, 0.00021627545356750488, 0.00022619590163230896, 0.00023611634969711304, 0.0002460367977619171, 0.0002559572458267212, 0.00026587769389152527, 0.00027579814195632935, 0.0002857185900211334, 0.0002956390380859375]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 5.0, 3.0, 4.0, 7.0, 13.0, 26.0, 42.0, 52.0, 83.0, 108.0, 181.0, 256.0, 393.0, 620.0, 1005.0, 1670.0, 2848.0, 5088.0, 9001.0, 16496.0, 29431.0, 52478.0, 89379.0, 137428.0, 176108.0, 175188.0, 137952.0, 90603.0, 53333.0, 30144.0, 16766.0, 9174.0, 5081.0, 2979.0, 1729.0, 1076.0, 641.0, 394.0, 236.0, 183.0, 108.0, 85.0, 53.0, 28.0, 21.0, 22.0, 11.0, 17.0, 5.0, 7.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.875, -8.61407470703125, -8.3531494140625, -8.09222412109375, -7.831298828125, -7.57037353515625, -7.3094482421875, -7.04852294921875, -6.78759765625, -6.52667236328125, -6.2657470703125, -6.00482177734375, -5.743896484375, -5.48297119140625, -5.2220458984375, -4.96112060546875, -4.7001953125, -4.43927001953125, -4.1783447265625, -3.91741943359375, -3.656494140625, -3.39556884765625, -3.1346435546875, -2.87371826171875, -2.61279296875, -2.35186767578125, -2.0909423828125, -1.83001708984375, -1.569091796875, -1.30816650390625, -1.0472412109375, -0.78631591796875, -0.525390625, -0.26446533203125, -0.0035400390625, 0.25738525390625, 0.518310546875, 0.77923583984375, 1.0401611328125, 1.30108642578125, 1.56201171875, 1.82293701171875, 2.0838623046875, 2.34478759765625, 2.605712890625, 2.86663818359375, 3.1275634765625, 3.38848876953125, 3.6494140625, 3.91033935546875, 4.1712646484375, 4.43218994140625, 4.693115234375, 4.95404052734375, 5.2149658203125, 5.47589111328125, 5.73681640625, 5.99774169921875, 6.2586669921875, 6.51959228515625, 6.780517578125, 7.04144287109375, 7.3023681640625, 7.56329345703125, 7.82421875]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 5.0, 7.0, 14.0, 8.0, 13.0, 13.0, 20.0, 24.0, 31.0, 51.0, 50.0, 41.0, 45.0, 44.0, 56.0, 79.0, 55.0, 57.0, 52.0, 55.0, 58.0, 37.0, 38.0, 24.0, 27.0, 29.0, 21.0, 9.0, 9.0, 5.0, 9.0, 1.0, 4.0, 1.0, 3.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.54296875, -2.468017578125, -2.39306640625, -2.318115234375, -2.2431640625, -2.168212890625, -2.09326171875, -2.018310546875, -1.943359375, -1.868408203125, -1.79345703125, -1.718505859375, -1.6435546875, -1.568603515625, -1.49365234375, -1.418701171875, -1.34375, -1.268798828125, -1.19384765625, -1.118896484375, -1.0439453125, -0.968994140625, -0.89404296875, -0.819091796875, -0.744140625, -0.669189453125, -0.59423828125, -0.519287109375, -0.4443359375, -0.369384765625, -0.29443359375, -0.219482421875, -0.14453125, -0.069580078125, 0.00537109375, 0.080322265625, 0.1552734375, 0.230224609375, 0.30517578125, 0.380126953125, 0.455078125, 0.530029296875, 0.60498046875, 0.679931640625, 0.7548828125, 0.829833984375, 0.90478515625, 0.979736328125, 1.0546875, 1.129638671875, 1.20458984375, 1.279541015625, 1.3544921875, 1.429443359375, 1.50439453125, 1.579345703125, 1.654296875, 1.729248046875, 1.80419921875, 1.879150390625, 1.9541015625, 2.029052734375, 2.10400390625, 2.178955078125, 2.25390625]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 7.0, 6.0, 17.0, 14.0, 21.0, 22.0, 25.0, 30.0, 47.0, 46.0, 55.0, 60.0, 66.0, 71.0, 65.0, 46.0, 65.0, 64.0, 49.0, 50.0, 35.0, 38.0, 20.0, 24.0, 20.0, 8.0, 11.0, 13.0, 3.0, 1.0, 2.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.314485549926758, -28.31688117980957, -27.319276809692383, -26.321674346923828, -25.32406997680664, -24.326465606689453, -23.328861236572266, -22.331256866455078, -21.33365249633789, -20.336048126220703, -19.338443756103516, -18.340839385986328, -17.343236923217773, -16.345632553100586, -15.348028182983398, -14.350423812866211, -13.352821350097656, -12.355216979980469, -11.357613563537598, -10.36000919342041, -9.362405776977539, -8.364801406860352, -7.367197036743164, -6.369593143463135, -5.3719892501831055, -4.374385356903076, -3.3767812252044678, -2.3791770935058594, -1.38157320022583, -0.3839693069458008, 0.6136350631713867, 1.611238956451416, 2.6088409423828125, 3.606444835662842, 4.604048728942871, 5.601653099060059, 6.599256992340088, 7.596860885620117, 8.594465255737305, 9.592069625854492, 10.589673042297363, 11.58727741241455, 12.584880828857422, 13.58248519897461, 14.580089569091797, 15.577692985534668, 16.575298309326172, 17.572900772094727, 18.570505142211914, 19.5681095123291, 20.56571388244629, 21.563316345214844, 22.56092071533203, 23.55852508544922, 24.556129455566406, 25.553733825683594, 26.55133819580078, 27.54894256591797, 28.546546936035156, 29.544151306152344, 30.5417537689209, 31.539358139038086, 32.536964416503906, 33.53456497192383, 34.532169342041016]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 5.0, 6.0, 7.0, 9.0, 12.0, 12.0, 18.0, 15.0, 16.0, 27.0, 23.0, 30.0, 38.0, 39.0, 31.0, 39.0, 50.0, 42.0, 52.0, 44.0, 38.0, 38.0, 46.0, 54.0, 29.0, 38.0, 29.0, 32.0, 23.0, 20.0, 19.0, 25.0, 10.0, 23.0, 17.0, 8.0, 7.0, 6.0, 7.0, 7.0, 6.0, 2.0, 3.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.50937271118164, -15.992749214172363, -15.476125717163086, -14.959502220153809, -14.442878723144531, -13.926255226135254, -13.409631729125977, -12.8930082321167, -12.376384735107422, -11.859761238098145, -11.343137741088867, -10.82651424407959, -10.309890747070312, -9.793267250061035, -9.276643753051758, -8.76002025604248, -8.243396759033203, -7.726773262023926, -7.210149765014648, -6.693526268005371, -6.176902770996094, -5.660279273986816, -5.143655776977539, -4.627032279968262, -4.110408782958984, -3.593785285949707, -3.0771617889404297, -2.5605382919311523, -2.043914794921875, -1.5272912979125977, -1.0106678009033203, -0.49404430389404297, 0.022579193115234375, 0.5392026901245117, 1.055826187133789, 1.5724496841430664, 2.0890731811523438, 2.605696678161621, 3.1223201751708984, 3.638943672180176, 4.155567169189453, 4.6721906661987305, 5.188814163208008, 5.705437660217285, 6.2220611572265625, 6.73868465423584, 7.255308151245117, 7.7719316482543945, 8.288555145263672, 8.80517864227295, 9.321802139282227, 9.838425636291504, 10.355049133300781, 10.871672630310059, 11.388296127319336, 11.904919624328613, 12.42154312133789, 12.938166618347168, 13.454790115356445, 13.971413612365723, 14.488037109375, 15.004660606384277, 15.521284103393555, 16.037906646728516, 16.55453109741211]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 13.0, 16.0, 14.0, 32.0, 53.0, 70.0, 98.0, 164.0, 216.0, 338.0, 502.0, 861.0, 1315.0, 2102.0, 3251.0, 5357.0, 8637.0, 14279.0, 23575.0, 37776.0, 60080.0, 89505.0, 121745.0, 144588.0, 145801.0, 125665.0, 94389.0, 63633.0, 40344.0, 24790.0, 15160.0, 9139.0, 5510.0, 3350.0, 2200.0, 1385.0, 925.0, 604.0, 358.0, 235.0, 158.0, 121.0, 83.0, 42.0, 35.0, 18.0, 10.0, 7.0, 5.0, 5.0, 1.0, 1.0, 1.0, 2.0], "bins": [-13.546875, -13.149169921875, -12.75146484375, -12.353759765625, -11.9560546875, -11.558349609375, -11.16064453125, -10.762939453125, -10.365234375, -9.967529296875, -9.56982421875, -9.172119140625, -8.7744140625, -8.376708984375, -7.97900390625, -7.581298828125, -7.18359375, -6.785888671875, -6.38818359375, -5.990478515625, -5.5927734375, -5.195068359375, -4.79736328125, -4.399658203125, -4.001953125, -3.604248046875, -3.20654296875, -2.808837890625, -2.4111328125, -2.013427734375, -1.61572265625, -1.218017578125, -0.8203125, -0.422607421875, -0.02490234375, 0.372802734375, 0.7705078125, 1.168212890625, 1.56591796875, 1.963623046875, 2.361328125, 2.759033203125, 3.15673828125, 3.554443359375, 3.9521484375, 4.349853515625, 4.74755859375, 5.145263671875, 5.54296875, 5.940673828125, 6.33837890625, 6.736083984375, 7.1337890625, 7.531494140625, 7.92919921875, 8.326904296875, 8.724609375, 9.122314453125, 9.52001953125, 9.917724609375, 10.3154296875, 10.713134765625, 11.11083984375, 11.508544921875, 11.90625]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 6.0, 7.0, 21.0, 9.0, 14.0, 18.0, 16.0, 25.0, 32.0, 27.0, 34.0, 44.0, 35.0, 46.0, 52.0, 43.0, 51.0, 48.0, 58.0, 58.0, 44.0, 41.0, 36.0, 35.0, 21.0, 25.0, 30.0, 22.0, 13.0, 21.0, 14.0, 11.0, 10.0, 8.0, 10.0, 3.0, 2.0, 4.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.28125, -17.674560546875, -17.06787109375, -16.461181640625, -15.8544921875, -15.247802734375, -14.64111328125, -14.034423828125, -13.427734375, -12.821044921875, -12.21435546875, -11.607666015625, -11.0009765625, -10.394287109375, -9.78759765625, -9.180908203125, -8.57421875, -7.967529296875, -7.36083984375, -6.754150390625, -6.1474609375, -5.540771484375, -4.93408203125, -4.327392578125, -3.720703125, -3.114013671875, -2.50732421875, -1.900634765625, -1.2939453125, -0.687255859375, -0.08056640625, 0.526123046875, 1.1328125, 1.739501953125, 2.34619140625, 2.952880859375, 3.5595703125, 4.166259765625, 4.77294921875, 5.379638671875, 5.986328125, 6.593017578125, 7.19970703125, 7.806396484375, 8.4130859375, 9.019775390625, 9.62646484375, 10.233154296875, 10.83984375, 11.446533203125, 12.05322265625, 12.659912109375, 13.2666015625, 13.873291015625, 14.47998046875, 15.086669921875, 15.693359375, 16.300048828125, 16.90673828125, 17.513427734375, 18.1201171875, 18.726806640625, 19.33349609375, 19.940185546875, 20.546875]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 0.0, 4.0, 6.0, 7.0, 7.0, 20.0, 37.0, 49.0, 74.0, 124.0, 165.0, 274.0, 425.0, 662.0, 1098.0, 1617.0, 2615.0, 4054.0, 6556.0, 10752.0, 17288.0, 28117.0, 45611.0, 70475.0, 102631.0, 133980.0, 149820.0, 141736.0, 113500.0, 79517.0, 51943.0, 32423.0, 20031.0, 12279.0, 7677.0, 4737.0, 2930.0, 1911.0, 1219.0, 764.0, 504.0, 347.0, 227.0, 124.0, 88.0, 66.0, 36.0, 14.0, 14.0, 6.0, 7.0, 0.0, 0.0, 1.0], "bins": [-16.5625, -16.110595703125, -15.65869140625, -15.206787109375, -14.7548828125, -14.302978515625, -13.85107421875, -13.399169921875, -12.947265625, -12.495361328125, -12.04345703125, -11.591552734375, -11.1396484375, -10.687744140625, -10.23583984375, -9.783935546875, -9.33203125, -8.880126953125, -8.42822265625, -7.976318359375, -7.5244140625, -7.072509765625, -6.62060546875, -6.168701171875, -5.716796875, -5.264892578125, -4.81298828125, -4.361083984375, -3.9091796875, -3.457275390625, -3.00537109375, -2.553466796875, -2.1015625, -1.649658203125, -1.19775390625, -0.745849609375, -0.2939453125, 0.157958984375, 0.60986328125, 1.061767578125, 1.513671875, 1.965576171875, 2.41748046875, 2.869384765625, 3.3212890625, 3.773193359375, 4.22509765625, 4.677001953125, 5.12890625, 5.580810546875, 6.03271484375, 6.484619140625, 6.9365234375, 7.388427734375, 7.84033203125, 8.292236328125, 8.744140625, 9.196044921875, 9.64794921875, 10.099853515625, 10.5517578125, 11.003662109375, 11.45556640625, 11.907470703125, 12.359375]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 1.0, 5.0, 7.0, 9.0, 9.0, 19.0, 12.0, 13.0, 12.0, 27.0, 26.0, 20.0, 22.0, 37.0, 36.0, 36.0, 33.0, 38.0, 32.0, 50.0, 41.0, 42.0, 45.0, 54.0, 32.0, 48.0, 32.0, 40.0, 35.0, 25.0, 25.0, 23.0, 25.0, 19.0, 15.0, 8.0, 14.0, 8.0, 6.0, 5.0, 6.0, 3.0, 2.0, 3.0, 2.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0], "bins": [-12.53125, -12.16748046875, -11.8037109375, -11.43994140625, -11.076171875, -10.71240234375, -10.3486328125, -9.98486328125, -9.62109375, -9.25732421875, -8.8935546875, -8.52978515625, -8.166015625, -7.80224609375, -7.4384765625, -7.07470703125, -6.7109375, -6.34716796875, -5.9833984375, -5.61962890625, -5.255859375, -4.89208984375, -4.5283203125, -4.16455078125, -3.80078125, -3.43701171875, -3.0732421875, -2.70947265625, -2.345703125, -1.98193359375, -1.6181640625, -1.25439453125, -0.890625, -0.52685546875, -0.1630859375, 0.20068359375, 0.564453125, 0.92822265625, 1.2919921875, 1.65576171875, 2.01953125, 2.38330078125, 2.7470703125, 3.11083984375, 3.474609375, 3.83837890625, 4.2021484375, 4.56591796875, 4.9296875, 5.29345703125, 5.6572265625, 6.02099609375, 6.384765625, 6.74853515625, 7.1123046875, 7.47607421875, 7.83984375, 8.20361328125, 8.5673828125, 8.93115234375, 9.294921875, 9.65869140625, 10.0224609375, 10.38623046875, 10.75]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 3.0, 8.0, 5.0, 10.0, 14.0, 14.0, 18.0, 26.0, 47.0, 54.0, 98.0, 119.0, 169.0, 236.0, 319.0, 491.0, 680.0, 961.0, 1311.0, 1928.0, 2623.0, 3968.0, 6651.0, 12999.0, 31713.0, 87819.0, 207406.0, 299906.0, 221901.0, 97150.0, 35042.0, 14213.0, 7026.0, 4162.0, 2754.0, 1957.0, 1387.0, 963.0, 727.0, 484.0, 321.0, 252.0, 193.0, 135.0, 83.0, 69.0, 42.0, 34.0, 28.0, 15.0, 7.0, 6.0, 6.0, 1.0, 5.0, 1.0, 4.0, 2.0], "bins": [-15.125, -14.6741943359375, -14.223388671875, -13.7725830078125, -13.32177734375, -12.8709716796875, -12.420166015625, -11.9693603515625, -11.5185546875, -11.0677490234375, -10.616943359375, -10.1661376953125, -9.71533203125, -9.2645263671875, -8.813720703125, -8.3629150390625, -7.912109375, -7.4613037109375, -7.010498046875, -6.5596923828125, -6.10888671875, -5.6580810546875, -5.207275390625, -4.7564697265625, -4.3056640625, -3.8548583984375, -3.404052734375, -2.9532470703125, -2.50244140625, -2.0516357421875, -1.600830078125, -1.1500244140625, -0.69921875, -0.2484130859375, 0.202392578125, 0.6531982421875, 1.10400390625, 1.5548095703125, 2.005615234375, 2.4564208984375, 2.9072265625, 3.3580322265625, 3.808837890625, 4.2596435546875, 4.71044921875, 5.1612548828125, 5.612060546875, 6.0628662109375, 6.513671875, 6.9644775390625, 7.415283203125, 7.8660888671875, 8.31689453125, 8.7677001953125, 9.218505859375, 9.6693115234375, 10.1201171875, 10.5709228515625, 11.021728515625, 11.4725341796875, 11.92333984375, 12.3741455078125, 12.824951171875, 13.2757568359375, 13.7265625]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 5.0, 4.0, 1.0, 5.0, 1.0, 5.0, 17.0, 19.0, 21.0, 45.0, 70.0, 104.0, 108.0, 89.0, 136.0, 107.0, 93.0, 67.0, 38.0, 18.0, 13.0, 10.0, 9.0, 8.0, 6.0, 5.0, 3.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0021572113037109375, -0.0021018385887145996, -0.0020464658737182617, -0.001991093158721924, -0.001935720443725586, -0.001880347728729248, -0.0018249750137329102, -0.0017696022987365723, -0.0017142295837402344, -0.0016588568687438965, -0.0016034841537475586, -0.0015481114387512207, -0.0014927387237548828, -0.001437366008758545, -0.001381993293762207, -0.0013266205787658691, -0.0012712478637695312, -0.0012158751487731934, -0.0011605024337768555, -0.0011051297187805176, -0.0010497570037841797, -0.0009943842887878418, -0.0009390115737915039, -0.000883638858795166, -0.0008282661437988281, -0.0007728934288024902, -0.0007175207138061523, -0.0006621479988098145, -0.0006067752838134766, -0.0005514025688171387, -0.0004960298538208008, -0.0004406571388244629, -0.000385284423828125, -0.0003299117088317871, -0.0002745389938354492, -0.00021916627883911133, -0.00016379356384277344, -0.00010842084884643555, -5.3048133850097656e-05, 2.3245811462402344e-06, 5.7697296142578125e-05, 0.00011307001113891602, 0.0001684427261352539, 0.0002238154411315918, 0.0002791881561279297, 0.0003345608711242676, 0.00038993358612060547, 0.00044530630111694336, 0.0005006790161132812, 0.0005560517311096191, 0.000611424446105957, 0.0006667971611022949, 0.0007221698760986328, 0.0007775425910949707, 0.0008329153060913086, 0.0008882880210876465, 0.0009436607360839844, 0.0009990334510803223, 0.0010544061660766602, 0.001109778881072998, 0.001165151596069336, 0.0012205243110656738, 0.0012758970260620117, 0.0013312697410583496, 0.0013866424560546875]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 4.0, 6.0, 9.0, 12.0, 17.0, 20.0, 34.0, 48.0, 77.0, 99.0, 108.0, 155.0, 168.0, 301.0, 369.0, 529.0, 696.0, 1032.0, 1465.0, 2050.0, 3090.0, 4740.0, 8351.0, 17274.0, 41785.0, 104275.0, 213966.0, 275872.0, 201064.0, 95053.0, 37931.0, 15661.0, 7949.0, 4503.0, 3020.0, 1991.0, 1325.0, 958.0, 664.0, 493.0, 388.0, 291.0, 203.0, 129.0, 111.0, 76.0, 67.0, 33.0, 27.0, 29.0, 14.0, 10.0, 7.0, 10.0, 3.0, 3.0, 4.0, 1.0, 0.0, 3.0], "bins": [-13.515625, -13.0858154296875, -12.656005859375, -12.2261962890625, -11.79638671875, -11.3665771484375, -10.936767578125, -10.5069580078125, -10.0771484375, -9.6473388671875, -9.217529296875, -8.7877197265625, -8.35791015625, -7.9281005859375, -7.498291015625, -7.0684814453125, -6.638671875, -6.2088623046875, -5.779052734375, -5.3492431640625, -4.91943359375, -4.4896240234375, -4.059814453125, -3.6300048828125, -3.2001953125, -2.7703857421875, -2.340576171875, -1.9107666015625, -1.48095703125, -1.0511474609375, -0.621337890625, -0.1915283203125, 0.23828125, 0.6680908203125, 1.097900390625, 1.5277099609375, 1.95751953125, 2.3873291015625, 2.817138671875, 3.2469482421875, 3.6767578125, 4.1065673828125, 4.536376953125, 4.9661865234375, 5.39599609375, 5.8258056640625, 6.255615234375, 6.6854248046875, 7.115234375, 7.5450439453125, 7.974853515625, 8.4046630859375, 8.83447265625, 9.2642822265625, 9.694091796875, 10.1239013671875, 10.5537109375, 10.9835205078125, 11.413330078125, 11.8431396484375, 12.27294921875, 12.7027587890625, 13.132568359375, 13.5623779296875, 13.9921875]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 8.0, 6.0, 1.0, 7.0, 4.0, 14.0, 21.0, 39.0, 45.0, 62.0, 69.0, 88.0, 95.0, 79.0, 93.0, 78.0, 80.0, 67.0, 49.0, 29.0, 20.0, 18.0, 10.0, 3.0, 7.0, 3.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.5546875, -3.4151611328125, -3.275634765625, -3.1361083984375, -2.99658203125, -2.8570556640625, -2.717529296875, -2.5780029296875, -2.4384765625, -2.2989501953125, -2.159423828125, -2.0198974609375, -1.88037109375, -1.7408447265625, -1.601318359375, -1.4617919921875, -1.322265625, -1.1827392578125, -1.043212890625, -0.9036865234375, -0.76416015625, -0.6246337890625, -0.485107421875, -0.3455810546875, -0.2060546875, -0.0665283203125, 0.072998046875, 0.2125244140625, 0.35205078125, 0.4915771484375, 0.631103515625, 0.7706298828125, 0.91015625, 1.0496826171875, 1.189208984375, 1.3287353515625, 1.46826171875, 1.6077880859375, 1.747314453125, 1.8868408203125, 2.0263671875, 2.1658935546875, 2.305419921875, 2.4449462890625, 2.58447265625, 2.7239990234375, 2.863525390625, 3.0030517578125, 3.142578125, 3.2821044921875, 3.421630859375, 3.5611572265625, 3.70068359375, 3.8402099609375, 3.979736328125, 4.1192626953125, 4.2587890625, 4.3983154296875, 4.537841796875, 4.6773681640625, 4.81689453125, 4.9564208984375, 5.095947265625, 5.2354736328125, 5.375]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 7.0, 9.0, 9.0, 22.0, 20.0, 24.0, 34.0, 33.0, 36.0, 41.0, 49.0, 57.0, 74.0, 58.0, 63.0, 53.0, 54.0, 64.0, 53.0, 46.0, 33.0, 35.0, 31.0, 27.0, 23.0, 11.0, 9.0, 9.0, 7.0, 5.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.120203018188477, -27.138328552246094, -26.156455993652344, -25.17458152770996, -24.19270896911621, -23.210834503173828, -22.228961944580078, -21.247087478637695, -20.265213012695312, -19.28333854675293, -18.30146598815918, -17.319591522216797, -16.337718963623047, -15.355844497680664, -14.373970985412598, -13.392097473144531, -12.410224914550781, -11.428351402282715, -10.446477890014648, -9.464603424072266, -8.482730865478516, -7.500856876373291, -6.518982887268066, -5.537109375, -4.555235862731934, -3.573362350463867, -2.5914885997772217, -1.6096148490905762, -0.6277413368225098, 0.35413217544555664, 1.3360061645507812, 2.3178796768188477, 3.2997512817382812, 4.281624794006348, 5.263498306274414, 6.245372295379639, 7.227245807647705, 8.20911979675293, 9.190993309020996, 10.172866821289062, 11.154740333557129, 12.136613845825195, 13.118487358093262, 14.100360870361328, 15.082235336303711, 16.06410789489746, 17.045982360839844, 18.027854919433594, 19.009729385375977, 19.99160385131836, 20.97347640991211, 21.955350875854492, 22.937223434448242, 23.919097900390625, 24.900970458984375, 25.882844924926758, 26.86471939086914, 27.846593856811523, 28.828466415405273, 29.810340881347656, 30.792213439941406, 31.77408790588379, 32.75596237182617, 33.73783493041992, 34.71970748901367]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 6.0, 4.0, 10.0, 4.0, 8.0, 6.0, 8.0, 13.0, 11.0, 24.0, 17.0, 22.0, 20.0, 35.0, 29.0, 27.0, 34.0, 33.0, 37.0, 49.0, 47.0, 35.0, 41.0, 40.0, 38.0, 45.0, 47.0, 29.0, 36.0, 33.0, 24.0, 37.0, 30.0, 16.0, 15.0, 19.0, 19.0, 8.0, 8.0, 12.0, 11.0, 7.0, 4.0, 3.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-19.892009735107422, -19.3161678314209, -18.740324020385742, -18.16448211669922, -17.588638305664062, -17.01279640197754, -16.436954498291016, -15.861111640930176, -15.285268783569336, -14.709425926208496, -14.133583068847656, -13.557741165161133, -12.981898307800293, -12.406055450439453, -11.83021354675293, -11.25437068939209, -10.67852783203125, -10.10268497467041, -9.52684211730957, -8.951000213623047, -8.375157356262207, -7.799314498901367, -7.2234721183776855, -6.647629737854004, -6.071786880493164, -5.495944023132324, -4.920101642608643, -4.344259262084961, -3.768416404724121, -3.1925737857818604, -2.6167311668395996, -2.040888786315918, -1.4650440216064453, -0.8892014026641846, -0.31335878372192383, 0.2624838352203369, 0.8383264541625977, 1.4141690731048584, 1.9900116920471191, 2.565854072570801, 3.1416969299316406, 3.7175395488739014, 4.293382167816162, 4.869224548339844, 5.445067405700684, 6.020910263061523, 6.596752643585205, 7.172595024108887, 7.748437881469727, 8.324280738830566, 8.900123596191406, 9.47596549987793, 10.05180835723877, 10.62765121459961, 11.203493118286133, 11.779335975646973, 12.355178833007812, 12.931021690368652, 13.506864547729492, 14.082706451416016, 14.658549308776855, 15.234392166137695, 15.810234069824219, 16.386077880859375, 16.9619197845459]}, "gradients/decoder.bert.encoder.layer.0.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 4.0, 14.0, 22.0, 25.0, 34.0, 54.0, 93.0, 132.0, 175.0, 300.0, 473.0, 750.0, 1085.0, 1796.0, 2921.0, 4981.0, 8333.0, 14678.0, 25585.0, 44968.0, 79107.0, 142620.0, 253124.0, 431048.0, 649695.0, 773362.0, 676688.0, 458896.0, 270579.0, 154154.0, 85023.0, 47644.0, 26992.0, 15527.0, 9187.0, 5340.0, 3292.0, 1983.0, 1230.0, 851.0, 507.0, 335.0, 218.0, 140.0, 96.0, 72.0, 42.0, 38.0, 24.0, 20.0, 16.0, 4.0, 4.0, 3.0, 3.0, 1.0, 2.0], "bins": [-24.03125, -23.29345703125, -22.5556640625, -21.81787109375, -21.080078125, -20.34228515625, -19.6044921875, -18.86669921875, -18.12890625, -17.39111328125, -16.6533203125, -15.91552734375, -15.177734375, -14.43994140625, -13.7021484375, -12.96435546875, -12.2265625, -11.48876953125, -10.7509765625, -10.01318359375, -9.275390625, -8.53759765625, -7.7998046875, -7.06201171875, -6.32421875, -5.58642578125, -4.8486328125, -4.11083984375, -3.373046875, -2.63525390625, -1.8974609375, -1.15966796875, -0.421875, 0.31591796875, 1.0537109375, 1.79150390625, 2.529296875, 3.26708984375, 4.0048828125, 4.74267578125, 5.48046875, 6.21826171875, 6.9560546875, 7.69384765625, 8.431640625, 9.16943359375, 9.9072265625, 10.64501953125, 11.3828125, 12.12060546875, 12.8583984375, 13.59619140625, 14.333984375, 15.07177734375, 15.8095703125, 16.54736328125, 17.28515625, 18.02294921875, 18.7607421875, 19.49853515625, 20.236328125, 20.97412109375, 21.7119140625, 22.44970703125, 23.1875]}, "gradients/decoder.bert.encoder.layer.0.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 4.0, 7.0, 9.0, 10.0, 12.0, 7.0, 17.0, 26.0, 23.0, 26.0, 21.0, 34.0, 27.0, 41.0, 32.0, 48.0, 45.0, 36.0, 36.0, 44.0, 41.0, 53.0, 49.0, 39.0, 34.0, 34.0, 35.0, 27.0, 28.0, 24.0, 18.0, 17.0, 22.0, 8.0, 6.0, 12.0, 9.0, 9.0, 8.0, 4.0, 4.0, 5.0, 3.0, 0.0, 2.0, 1.0, 2.0], "bins": [-20.859375, -20.2884521484375, -19.717529296875, -19.1466064453125, -18.57568359375, -18.0047607421875, -17.433837890625, -16.8629150390625, -16.2919921875, -15.7210693359375, -15.150146484375, -14.5792236328125, -14.00830078125, -13.4373779296875, -12.866455078125, -12.2955322265625, -11.724609375, -11.1536865234375, -10.582763671875, -10.0118408203125, -9.44091796875, -8.8699951171875, -8.299072265625, -7.7281494140625, -7.1572265625, -6.5863037109375, -6.015380859375, -5.4444580078125, -4.87353515625, -4.3026123046875, -3.731689453125, -3.1607666015625, -2.58984375, -2.0189208984375, -1.447998046875, -0.8770751953125, -0.30615234375, 0.2647705078125, 0.835693359375, 1.4066162109375, 1.9775390625, 2.5484619140625, 3.119384765625, 3.6903076171875, 4.26123046875, 4.8321533203125, 5.403076171875, 5.9739990234375, 6.544921875, 7.1158447265625, 7.686767578125, 8.2576904296875, 8.82861328125, 9.3995361328125, 9.970458984375, 10.5413818359375, 11.1123046875, 11.6832275390625, 12.254150390625, 12.8250732421875, 13.39599609375, 13.9669189453125, 14.537841796875, 15.1087646484375, 15.6796875]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 4.0, 10.0, 12.0, 14.0, 39.0, 56.0, 92.0, 137.0, 212.0, 340.0, 491.0, 822.0, 1349.0, 2092.0, 3409.0, 5595.0, 9365.0, 15537.0, 26171.0, 44380.0, 76616.0, 131107.0, 217769.0, 351520.0, 519152.0, 659546.0, 667008.0, 534506.0, 365359.0, 228197.0, 137040.0, 80013.0, 47046.0, 28050.0, 16329.0, 9520.0, 5848.0, 3609.0, 2245.0, 1305.0, 904.0, 560.0, 333.0, 200.0, 136.0, 93.0, 57.0, 38.0, 22.0, 15.0, 11.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0], "bins": [-30.625, -29.6982421875, -28.771484375, -27.8447265625, -26.91796875, -25.9912109375, -25.064453125, -24.1376953125, -23.2109375, -22.2841796875, -21.357421875, -20.4306640625, -19.50390625, -18.5771484375, -17.650390625, -16.7236328125, -15.796875, -14.8701171875, -13.943359375, -13.0166015625, -12.08984375, -11.1630859375, -10.236328125, -9.3095703125, -8.3828125, -7.4560546875, -6.529296875, -5.6025390625, -4.67578125, -3.7490234375, -2.822265625, -1.8955078125, -0.96875, -0.0419921875, 0.884765625, 1.8115234375, 2.73828125, 3.6650390625, 4.591796875, 5.5185546875, 6.4453125, 7.3720703125, 8.298828125, 9.2255859375, 10.15234375, 11.0791015625, 12.005859375, 12.9326171875, 13.859375, 14.7861328125, 15.712890625, 16.6396484375, 17.56640625, 18.4931640625, 19.419921875, 20.3466796875, 21.2734375, 22.2001953125, 23.126953125, 24.0537109375, 24.98046875, 25.9072265625, 26.833984375, 27.7607421875, 28.6875]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 1.0, 5.0, 1.0, 5.0, 3.0, 14.0, 11.0, 18.0, 14.0, 21.0, 28.0, 47.0, 47.0, 51.0, 58.0, 97.0, 99.0, 115.0, 148.0, 173.0, 188.0, 205.0, 209.0, 216.0, 240.0, 241.0, 229.0, 239.0, 220.0, 198.0, 151.0, 152.0, 117.0, 92.0, 93.0, 69.0, 46.0, 57.0, 39.0, 28.0, 28.0, 17.0, 17.0, 10.0, 7.0, 4.0, 2.0, 2.0, 3.0, 2.0, 4.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.1875, -8.8555908203125, -8.523681640625, -8.1917724609375, -7.85986328125, -7.5279541015625, -7.196044921875, -6.8641357421875, -6.5322265625, -6.2003173828125, -5.868408203125, -5.5364990234375, -5.20458984375, -4.8726806640625, -4.540771484375, -4.2088623046875, -3.876953125, -3.5450439453125, -3.213134765625, -2.8812255859375, -2.54931640625, -2.2174072265625, -1.885498046875, -1.5535888671875, -1.2216796875, -0.8897705078125, -0.557861328125, -0.2259521484375, 0.10595703125, 0.4378662109375, 0.769775390625, 1.1016845703125, 1.43359375, 1.7655029296875, 2.097412109375, 2.4293212890625, 2.76123046875, 3.0931396484375, 3.425048828125, 3.7569580078125, 4.0888671875, 4.4207763671875, 4.752685546875, 5.0845947265625, 5.41650390625, 5.7484130859375, 6.080322265625, 6.4122314453125, 6.744140625, 7.0760498046875, 7.407958984375, 7.7398681640625, 8.07177734375, 8.4036865234375, 8.735595703125, 9.0675048828125, 9.3994140625, 9.7313232421875, 10.063232421875, 10.3951416015625, 10.72705078125, 11.0589599609375, 11.390869140625, 11.7227783203125, 12.0546875]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 1.0, 3.0, 3.0, 8.0, 7.0, 12.0, 9.0, 19.0, 13.0, 14.0, 19.0, 24.0, 20.0, 51.0, 41.0, 41.0, 59.0, 53.0, 58.0, 60.0, 57.0, 34.0, 66.0, 46.0, 44.0, 47.0, 35.0, 30.0, 26.0, 18.0, 16.0, 16.0, 11.0, 12.0, 15.0, 4.0, 7.0, 0.0, 3.0, 1.0, 1.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-44.5002326965332, -43.10509490966797, -41.709957122802734, -40.3148193359375, -38.91968536376953, -37.5245475769043, -36.12940979003906, -34.73427200317383, -33.339134216308594, -31.94399642944336, -30.548860549926758, -29.153722763061523, -27.758586883544922, -26.363449096679688, -24.968311309814453, -23.57317352294922, -22.17803955078125, -20.782901763916016, -19.387765884399414, -17.99262809753418, -16.597492218017578, -15.202354431152344, -13.80721664428711, -12.412079811096191, -11.016942977905273, -9.621806144714355, -8.226669311523438, -6.831531524658203, -5.436394691467285, -4.041257858276367, -2.646120071411133, -1.2509832382202148, 0.14415740966796875, 1.5392944812774658, 2.934431552886963, 4.329568862915039, 5.724705696105957, 7.119842529296875, 8.51498031616211, 9.910117149353027, 11.305253982543945, 12.700390815734863, 14.095527648925781, 15.490665435791016, 16.88580322265625, 18.28093910217285, 19.676076889038086, 21.071212768554688, 22.466350555419922, 23.861488342285156, 25.256624221801758, 26.651762008666992, 28.046897888183594, 29.442035675048828, 30.837173461914062, 32.2323112487793, 33.62744903564453, 35.022586822509766, 36.417724609375, 37.81285858154297, 39.2079963684082, 40.60313415527344, 41.99827194213867, 43.393409729003906, 44.788543701171875]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 1.0, 2.0, 2.0, 6.0, 7.0, 7.0, 4.0, 3.0, 8.0, 10.0, 12.0, 9.0, 16.0, 13.0, 20.0, 12.0, 23.0, 23.0, 26.0, 33.0, 29.0, 33.0, 30.0, 42.0, 32.0, 38.0, 29.0, 42.0, 38.0, 34.0, 31.0, 39.0, 46.0, 28.0, 17.0, 23.0, 32.0, 28.0, 21.0, 22.0, 18.0, 17.0, 18.0, 14.0, 16.0, 8.0, 5.0, 8.0, 8.0, 5.0, 5.0, 5.0, 2.0, 7.0, 0.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-21.947113037109375, -21.238201141357422, -20.52928924560547, -19.820377349853516, -19.11146354675293, -18.402551651000977, -17.693639755249023, -16.98472785949707, -16.275814056396484, -15.566902160644531, -14.857989311218262, -14.149077415466309, -13.440164566040039, -12.731252670288086, -12.022340774536133, -11.31342887878418, -10.604516983032227, -9.895605087280273, -9.186692237854004, -8.47778034210205, -7.7688679695129395, -7.059955596923828, -6.351043701171875, -5.642131328582764, -4.933218955993652, -4.224306583404541, -3.515394449234009, -2.8064823150634766, -2.0975699424743652, -1.388657569885254, -0.6797456741333008, 0.029166698455810547, 0.7380809783935547, 1.4469932317733765, 2.1559054851531982, 2.8648176193237305, 3.573729991912842, 4.282642364501953, 4.991554260253906, 5.700466632843018, 6.409379005432129, 7.11829137802124, 7.827203750610352, 8.536115646362305, 9.245027542114258, 9.953940391540527, 10.66285228729248, 11.37176513671875, 12.080677032470703, 12.789588928222656, 13.498501777648926, 14.207413673400879, 14.916326522827148, 15.625238418579102, 16.334150314331055, 17.043062210083008, 17.751976013183594, 18.460887908935547, 19.1697998046875, 19.878711700439453, 20.58762550354004, 21.296537399291992, 22.005449295043945, 22.7143611907959, 23.42327308654785]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 4.0, 7.0, 10.0, 20.0, 32.0, 60.0, 89.0, 110.0, 217.0, 276.0, 438.0, 680.0, 1031.0, 1629.0, 2412.0, 3859.0, 6062.0, 9391.0, 14667.0, 22967.0, 35206.0, 53781.0, 78153.0, 108209.0, 132939.0, 141856.0, 127577.0, 99553.0, 71312.0, 48164.0, 31148.0, 20451.0, 13026.0, 8293.0, 5492.0, 3319.0, 2124.0, 1356.0, 921.0, 624.0, 382.0, 257.0, 155.0, 99.0, 78.0, 48.0, 24.0, 21.0, 10.0, 8.0, 7.0, 3.0, 4.0, 2.0, 2.0], "bins": [-13.75, -13.349853515625, -12.94970703125, -12.549560546875, -12.1494140625, -11.749267578125, -11.34912109375, -10.948974609375, -10.548828125, -10.148681640625, -9.74853515625, -9.348388671875, -8.9482421875, -8.548095703125, -8.14794921875, -7.747802734375, -7.34765625, -6.947509765625, -6.54736328125, -6.147216796875, -5.7470703125, -5.346923828125, -4.94677734375, -4.546630859375, -4.146484375, -3.746337890625, -3.34619140625, -2.946044921875, -2.5458984375, -2.145751953125, -1.74560546875, -1.345458984375, -0.9453125, -0.545166015625, -0.14501953125, 0.255126953125, 0.6552734375, 1.055419921875, 1.45556640625, 1.855712890625, 2.255859375, 2.656005859375, 3.05615234375, 3.456298828125, 3.8564453125, 4.256591796875, 4.65673828125, 5.056884765625, 5.45703125, 5.857177734375, 6.25732421875, 6.657470703125, 7.0576171875, 7.457763671875, 7.85791015625, 8.258056640625, 8.658203125, 9.058349609375, 9.45849609375, 9.858642578125, 10.2587890625, 10.658935546875, 11.05908203125, 11.459228515625, 11.859375]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 9.0, 7.0, 6.0, 9.0, 8.0, 14.0, 14.0, 14.0, 23.0, 18.0, 26.0, 24.0, 25.0, 34.0, 27.0, 42.0, 38.0, 48.0, 37.0, 49.0, 34.0, 36.0, 37.0, 38.0, 35.0, 40.0, 40.0, 30.0, 29.0, 26.0, 25.0, 14.0, 28.0, 19.0, 13.0, 17.0, 15.0, 12.0, 10.0, 9.0, 4.0, 2.0, 4.0, 3.0, 3.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.078125, -27.189208984375, -26.30029296875, -25.411376953125, -24.5224609375, -23.633544921875, -22.74462890625, -21.855712890625, -20.966796875, -20.077880859375, -19.18896484375, -18.300048828125, -17.4111328125, -16.522216796875, -15.63330078125, -14.744384765625, -13.85546875, -12.966552734375, -12.07763671875, -11.188720703125, -10.2998046875, -9.410888671875, -8.52197265625, -7.633056640625, -6.744140625, -5.855224609375, -4.96630859375, -4.077392578125, -3.1884765625, -2.299560546875, -1.41064453125, -0.521728515625, 0.3671875, 1.256103515625, 2.14501953125, 3.033935546875, 3.9228515625, 4.811767578125, 5.70068359375, 6.589599609375, 7.478515625, 8.367431640625, 9.25634765625, 10.145263671875, 11.0341796875, 11.923095703125, 12.81201171875, 13.700927734375, 14.58984375, 15.478759765625, 16.36767578125, 17.256591796875, 18.1455078125, 19.034423828125, 19.92333984375, 20.812255859375, 21.701171875, 22.590087890625, 23.47900390625, 24.367919921875, 25.2568359375, 26.145751953125, 27.03466796875, 27.923583984375, 28.8125]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 6.0, 9.0, 9.0, 15.0, 34.0, 36.0, 37.0, 68.0, 83.0, 118.0, 198.0, 337.0, 496.0, 700.0, 1187.0, 1832.0, 3139.0, 5023.0, 8383.0, 14419.0, 25380.0, 44703.0, 77640.0, 129263.0, 188783.0, 196365.0, 142533.0, 87350.0, 50370.0, 28884.0, 16454.0, 9538.0, 5737.0, 3524.0, 2076.0, 1301.0, 859.0, 556.0, 372.0, 258.0, 137.0, 123.0, 66.0, 54.0, 20.0, 31.0, 18.0, 8.0, 12.0, 4.0, 5.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-18.828125, -18.24169921875, -17.6552734375, -17.06884765625, -16.482421875, -15.89599609375, -15.3095703125, -14.72314453125, -14.13671875, -13.55029296875, -12.9638671875, -12.37744140625, -11.791015625, -11.20458984375, -10.6181640625, -10.03173828125, -9.4453125, -8.85888671875, -8.2724609375, -7.68603515625, -7.099609375, -6.51318359375, -5.9267578125, -5.34033203125, -4.75390625, -4.16748046875, -3.5810546875, -2.99462890625, -2.408203125, -1.82177734375, -1.2353515625, -0.64892578125, -0.0625, 0.52392578125, 1.1103515625, 1.69677734375, 2.283203125, 2.86962890625, 3.4560546875, 4.04248046875, 4.62890625, 5.21533203125, 5.8017578125, 6.38818359375, 6.974609375, 7.56103515625, 8.1474609375, 8.73388671875, 9.3203125, 9.90673828125, 10.4931640625, 11.07958984375, 11.666015625, 12.25244140625, 12.8388671875, 13.42529296875, 14.01171875, 14.59814453125, 15.1845703125, 15.77099609375, 16.357421875, 16.94384765625, 17.5302734375, 18.11669921875, 18.703125]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 12.0, 3.0, 1.0, 6.0, 8.0, 8.0, 14.0, 19.0, 17.0, 26.0, 36.0, 26.0, 41.0, 32.0, 40.0, 44.0, 50.0, 50.0, 51.0, 53.0, 51.0, 41.0, 40.0, 37.0, 41.0, 39.0, 37.0, 30.0, 26.0, 19.0, 16.0, 20.0, 20.0, 14.0, 5.0, 9.0, 6.0, 4.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-20.953125, -20.38818359375, -19.8232421875, -19.25830078125, -18.693359375, -18.12841796875, -17.5634765625, -16.99853515625, -16.43359375, -15.86865234375, -15.3037109375, -14.73876953125, -14.173828125, -13.60888671875, -13.0439453125, -12.47900390625, -11.9140625, -11.34912109375, -10.7841796875, -10.21923828125, -9.654296875, -9.08935546875, -8.5244140625, -7.95947265625, -7.39453125, -6.82958984375, -6.2646484375, -5.69970703125, -5.134765625, -4.56982421875, -4.0048828125, -3.43994140625, -2.875, -2.31005859375, -1.7451171875, -1.18017578125, -0.615234375, -0.05029296875, 0.5146484375, 1.07958984375, 1.64453125, 2.20947265625, 2.7744140625, 3.33935546875, 3.904296875, 4.46923828125, 5.0341796875, 5.59912109375, 6.1640625, 6.72900390625, 7.2939453125, 7.85888671875, 8.423828125, 8.98876953125, 9.5537109375, 10.11865234375, 10.68359375, 11.24853515625, 11.8134765625, 12.37841796875, 12.943359375, 13.50830078125, 14.0732421875, 14.63818359375, 15.203125]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 1.0, 1.0, 10.0, 8.0, 17.0, 13.0, 36.0, 55.0, 99.0, 146.0, 267.0, 478.0, 813.0, 1397.0, 2505.0, 4637.0, 8409.0, 16384.0, 31971.0, 63006.0, 121931.0, 207762.0, 240689.0, 164281.0, 88940.0, 45719.0, 23095.0, 11940.0, 6143.0, 3342.0, 1895.0, 1070.0, 630.0, 359.0, 198.0, 128.0, 73.0, 38.0, 30.0, 14.0, 12.0, 8.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 5.0], "bins": [-13.5625, -13.198486328125, -12.83447265625, -12.470458984375, -12.1064453125, -11.742431640625, -11.37841796875, -11.014404296875, -10.650390625, -10.286376953125, -9.92236328125, -9.558349609375, -9.1943359375, -8.830322265625, -8.46630859375, -8.102294921875, -7.73828125, -7.374267578125, -7.01025390625, -6.646240234375, -6.2822265625, -5.918212890625, -5.55419921875, -5.190185546875, -4.826171875, -4.462158203125, -4.09814453125, -3.734130859375, -3.3701171875, -3.006103515625, -2.64208984375, -2.278076171875, -1.9140625, -1.550048828125, -1.18603515625, -0.822021484375, -0.4580078125, -0.093994140625, 0.27001953125, 0.634033203125, 0.998046875, 1.362060546875, 1.72607421875, 2.090087890625, 2.4541015625, 2.818115234375, 3.18212890625, 3.546142578125, 3.91015625, 4.274169921875, 4.63818359375, 5.002197265625, 5.3662109375, 5.730224609375, 6.09423828125, 6.458251953125, 6.822265625, 7.186279296875, 7.55029296875, 7.914306640625, 8.2783203125, 8.642333984375, 9.00634765625, 9.370361328125, 9.734375]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 5.0, 4.0, 8.0, 7.0, 5.0, 14.0, 13.0, 16.0, 17.0, 22.0, 29.0, 27.0, 36.0, 37.0, 36.0, 56.0, 62.0, 49.0, 52.0, 51.0, 63.0, 58.0, 53.0, 47.0, 38.0, 40.0, 23.0, 29.0, 15.0, 22.0, 14.0, 12.0, 8.0, 8.0, 4.0, 6.0, 5.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0005345344543457031, -0.0005201771855354309, -0.0005058199167251587, -0.0004914626479148865, -0.00047710537910461426, -0.00046274811029434204, -0.0004483908414840698, -0.0004340335726737976, -0.0004196763038635254, -0.0004053190350532532, -0.00039096176624298096, -0.00037660449743270874, -0.0003622472286224365, -0.0003478899598121643, -0.0003335326910018921, -0.0003191754221916199, -0.00030481815338134766, -0.00029046088457107544, -0.0002761036157608032, -0.000261746346950531, -0.0002473890781402588, -0.00023303180932998657, -0.00021867454051971436, -0.00020431727170944214, -0.00018996000289916992, -0.0001756027340888977, -0.0001612454652786255, -0.00014688819646835327, -0.00013253092765808105, -0.00011817365884780884, -0.00010381639003753662, -8.94591212272644e-05, -7.510185241699219e-05, -6.074458360671997e-05, -4.6387314796447754e-05, -3.203004598617554e-05, -1.767277717590332e-05, -3.3155083656311035e-06, 1.1041760444641113e-05, 2.539902925491333e-05, 3.975629806518555e-05, 5.4113566875457764e-05, 6.847083568572998e-05, 8.28281044960022e-05, 9.718537330627441e-05, 0.00011154264211654663, 0.00012589991092681885, 0.00014025717973709106, 0.00015461444854736328, 0.0001689717173576355, 0.00018332898616790771, 0.00019768625497817993, 0.00021204352378845215, 0.00022640079259872437, 0.00024075806140899658, 0.0002551153302192688, 0.000269472599029541, 0.00028382986783981323, 0.00029818713665008545, 0.00031254440546035767, 0.0003269016742706299, 0.0003412589430809021, 0.0003556162118911743, 0.00036997348070144653, 0.00038433074951171875]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 8.0, 5.0, 7.0, 15.0, 17.0, 15.0, 30.0, 60.0, 79.0, 103.0, 156.0, 196.0, 320.0, 481.0, 718.0, 1118.0, 1641.0, 2393.0, 3731.0, 5715.0, 8798.0, 13772.0, 20733.0, 31910.0, 48398.0, 71544.0, 98666.0, 125228.0, 137471.0, 129927.0, 107710.0, 78863.0, 54411.0, 36403.0, 23497.0, 15290.0, 10032.0, 6487.0, 4287.0, 2756.0, 1810.0, 1223.0, 830.0, 551.0, 361.0, 244.0, 178.0, 118.0, 73.0, 68.0, 42.0, 21.0, 18.0, 15.0, 5.0, 9.0, 6.0, 3.0, 2.0, 1.0, 1.0], "bins": [-8.0390625, -7.7850341796875, -7.531005859375, -7.2769775390625, -7.02294921875, -6.7689208984375, -6.514892578125, -6.2608642578125, -6.0068359375, -5.7528076171875, -5.498779296875, -5.2447509765625, -4.99072265625, -4.7366943359375, -4.482666015625, -4.2286376953125, -3.974609375, -3.7205810546875, -3.466552734375, -3.2125244140625, -2.95849609375, -2.7044677734375, -2.450439453125, -2.1964111328125, -1.9423828125, -1.6883544921875, -1.434326171875, -1.1802978515625, -0.92626953125, -0.6722412109375, -0.418212890625, -0.1641845703125, 0.08984375, 0.3438720703125, 0.597900390625, 0.8519287109375, 1.10595703125, 1.3599853515625, 1.614013671875, 1.8680419921875, 2.1220703125, 2.3760986328125, 2.630126953125, 2.8841552734375, 3.13818359375, 3.3922119140625, 3.646240234375, 3.9002685546875, 4.154296875, 4.4083251953125, 4.662353515625, 4.9163818359375, 5.17041015625, 5.4244384765625, 5.678466796875, 5.9324951171875, 6.1865234375, 6.4405517578125, 6.694580078125, 6.9486083984375, 7.20263671875, 7.4566650390625, 7.710693359375, 7.9647216796875, 8.21875]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 5.0, 6.0, 3.0, 10.0, 10.0, 6.0, 20.0, 15.0, 19.0, 21.0, 31.0, 26.0, 44.0, 42.0, 52.0, 53.0, 42.0, 61.0, 76.0, 59.0, 59.0, 62.0, 54.0, 32.0, 34.0, 29.0, 27.0, 31.0, 14.0, 21.0, 6.0, 8.0, 6.0, 2.0, 3.0, 3.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.44140625, -3.339935302734375, -3.23846435546875, -3.136993408203125, -3.0355224609375, -2.934051513671875, -2.83258056640625, -2.731109619140625, -2.629638671875, -2.528167724609375, -2.42669677734375, -2.325225830078125, -2.2237548828125, -2.122283935546875, -2.02081298828125, -1.919342041015625, -1.81787109375, -1.716400146484375, -1.61492919921875, -1.513458251953125, -1.4119873046875, -1.310516357421875, -1.20904541015625, -1.107574462890625, -1.006103515625, -0.904632568359375, -0.80316162109375, -0.701690673828125, -0.6002197265625, -0.498748779296875, -0.39727783203125, -0.295806884765625, -0.1943359375, -0.092864990234375, 0.00860595703125, 0.110076904296875, 0.2115478515625, 0.313018798828125, 0.41448974609375, 0.515960693359375, 0.617431640625, 0.718902587890625, 0.82037353515625, 0.921844482421875, 1.0233154296875, 1.124786376953125, 1.22625732421875, 1.327728271484375, 1.42919921875, 1.530670166015625, 1.63214111328125, 1.733612060546875, 1.8350830078125, 1.936553955078125, 2.03802490234375, 2.139495849609375, 2.240966796875, 2.342437744140625, 2.44390869140625, 2.545379638671875, 2.6468505859375, 2.748321533203125, 2.84979248046875, 2.951263427734375, 3.052734375]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 5.0, 1.0, 6.0, 6.0, 11.0, 10.0, 9.0, 13.0, 15.0, 20.0, 21.0, 21.0, 26.0, 51.0, 30.0, 42.0, 61.0, 53.0, 53.0, 65.0, 46.0, 43.0, 60.0, 47.0, 41.0, 43.0, 39.0, 33.0, 23.0, 18.0, 18.0, 12.0, 17.0, 13.0, 14.0, 4.0, 8.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-45.09272766113281, -43.728179931640625, -42.36363220214844, -40.99908447265625, -39.63453674316406, -38.269989013671875, -36.90544128417969, -35.5408935546875, -34.17634582519531, -32.811798095703125, -31.447250366210938, -30.08270263671875, -28.718154907226562, -27.353607177734375, -25.989059448242188, -24.62451171875, -23.259963989257812, -21.895416259765625, -20.530868530273438, -19.16632080078125, -17.801773071289062, -16.437225341796875, -15.072677612304688, -13.7081298828125, -12.343582153320312, -10.979034423828125, -9.614486694335938, -8.24993896484375, -6.8853912353515625, -5.520843505859375, -4.1562957763671875, -2.791748046875, -1.4271965026855469, -0.06264877319335938, 1.3018989562988281, 2.6664466857910156, 4.030994415283203, 5.395542144775391, 6.760089874267578, 8.124637603759766, 9.489185333251953, 10.85373306274414, 12.218280792236328, 13.582828521728516, 14.947376251220703, 16.31192398071289, 17.676471710205078, 19.041019439697266, 20.405567169189453, 21.77011489868164, 23.134662628173828, 24.499210357666016, 25.863758087158203, 27.22830581665039, 28.592853546142578, 29.957401275634766, 31.321949005126953, 32.68649673461914, 34.05104446411133, 35.415592193603516, 36.7801399230957, 38.14468765258789, 39.50923538208008, 40.873783111572266, 42.23833084106445]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 4.0, 5.0, 4.0, 4.0, 7.0, 5.0, 6.0, 8.0, 7.0, 11.0, 13.0, 11.0, 13.0, 19.0, 21.0, 22.0, 22.0, 29.0, 32.0, 27.0, 28.0, 44.0, 31.0, 31.0, 33.0, 44.0, 35.0, 34.0, 38.0, 33.0, 40.0, 34.0, 35.0, 20.0, 18.0, 26.0, 31.0, 30.0, 23.0, 17.0, 11.0, 17.0, 17.0, 16.0, 6.0, 11.0, 3.0, 7.0, 7.0, 4.0, 4.0, 5.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-22.469125747680664, -21.740489959716797, -21.01185417175293, -20.283218383789062, -19.554582595825195, -18.825946807861328, -18.09731101989746, -17.368675231933594, -16.640039443969727, -15.91140365600586, -15.182767868041992, -14.454132080078125, -13.725496292114258, -12.99686050415039, -12.268224716186523, -11.539588928222656, -10.810953140258789, -10.082317352294922, -9.353681564331055, -8.625045776367188, -7.89640998840332, -7.167774200439453, -6.439138412475586, -5.710502624511719, -4.981866836547852, -4.253231048583984, -3.524595260620117, -2.79595947265625, -2.067323684692383, -1.3386878967285156, -0.6100521087646484, 0.11858367919921875, 0.8472194671630859, 1.5758552551269531, 2.3044910430908203, 3.0331268310546875, 3.7617626190185547, 4.490398406982422, 5.219034194946289, 5.947669982910156, 6.676305770874023, 7.404941558837891, 8.133577346801758, 8.862213134765625, 9.590848922729492, 10.31948471069336, 11.048120498657227, 11.776756286621094, 12.505392074584961, 13.234027862548828, 13.962663650512695, 14.691299438476562, 15.41993522644043, 16.148571014404297, 16.877206802368164, 17.60584259033203, 18.3344783782959, 19.063114166259766, 19.791749954223633, 20.5203857421875, 21.249021530151367, 21.977657318115234, 22.7062931060791, 23.43492889404297, 24.163564682006836]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 8.0, 8.0, 4.0, 17.0, 16.0, 35.0, 33.0, 60.0, 66.0, 106.0, 165.0, 231.0, 306.0, 497.0, 739.0, 1106.0, 1791.0, 3141.0, 5483.0, 10086.0, 19540.0, 37937.0, 73149.0, 129167.0, 189448.0, 205758.0, 160201.0, 97747.0, 52340.0, 27055.0, 14126.0, 7479.0, 4146.0, 2354.0, 1476.0, 924.0, 532.0, 405.0, 269.0, 162.0, 136.0, 86.0, 62.0, 52.0, 36.0, 20.0, 13.0, 15.0, 10.0, 7.0, 8.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-26.859375, -25.999755859375, -25.14013671875, -24.280517578125, -23.4208984375, -22.561279296875, -21.70166015625, -20.842041015625, -19.982421875, -19.122802734375, -18.26318359375, -17.403564453125, -16.5439453125, -15.684326171875, -14.82470703125, -13.965087890625, -13.10546875, -12.245849609375, -11.38623046875, -10.526611328125, -9.6669921875, -8.807373046875, -7.94775390625, -7.088134765625, -6.228515625, -5.368896484375, -4.50927734375, -3.649658203125, -2.7900390625, -1.930419921875, -1.07080078125, -0.211181640625, 0.6484375, 1.508056640625, 2.36767578125, 3.227294921875, 4.0869140625, 4.946533203125, 5.80615234375, 6.665771484375, 7.525390625, 8.385009765625, 9.24462890625, 10.104248046875, 10.9638671875, 11.823486328125, 12.68310546875, 13.542724609375, 14.40234375, 15.261962890625, 16.12158203125, 16.981201171875, 17.8408203125, 18.700439453125, 19.56005859375, 20.419677734375, 21.279296875, 22.138916015625, 22.99853515625, 23.858154296875, 24.7177734375, 25.577392578125, 26.43701171875, 27.296630859375, 28.15625]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 4.0, 2.0, 1.0, 2.0, 3.0, 6.0, 3.0, 9.0, 6.0, 11.0, 13.0, 12.0, 32.0, 21.0, 27.0, 18.0, 22.0, 39.0, 34.0, 31.0, 35.0, 44.0, 55.0, 46.0, 50.0, 49.0, 59.0, 47.0, 38.0, 41.0, 37.0, 22.0, 29.0, 23.0, 23.0, 18.0, 21.0, 15.0, 11.0, 9.0, 13.0, 10.0, 6.0, 7.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.65625, -28.71923828125, -27.7822265625, -26.84521484375, -25.908203125, -24.97119140625, -24.0341796875, -23.09716796875, -22.16015625, -21.22314453125, -20.2861328125, -19.34912109375, -18.412109375, -17.47509765625, -16.5380859375, -15.60107421875, -14.6640625, -13.72705078125, -12.7900390625, -11.85302734375, -10.916015625, -9.97900390625, -9.0419921875, -8.10498046875, -7.16796875, -6.23095703125, -5.2939453125, -4.35693359375, -3.419921875, -2.48291015625, -1.5458984375, -0.60888671875, 0.328125, 1.26513671875, 2.2021484375, 3.13916015625, 4.076171875, 5.01318359375, 5.9501953125, 6.88720703125, 7.82421875, 8.76123046875, 9.6982421875, 10.63525390625, 11.572265625, 12.50927734375, 13.4462890625, 14.38330078125, 15.3203125, 16.25732421875, 17.1943359375, 18.13134765625, 19.068359375, 20.00537109375, 20.9423828125, 21.87939453125, 22.81640625, 23.75341796875, 24.6904296875, 25.62744140625, 26.564453125, 27.50146484375, 28.4384765625, 29.37548828125, 30.3125]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 4.0, 7.0, 6.0, 11.0, 15.0, 17.0, 21.0, 26.0, 49.0, 66.0, 102.0, 128.0, 180.0, 247.0, 377.0, 586.0, 858.0, 1323.0, 2198.0, 3613.0, 6166.0, 11256.0, 20854.0, 41768.0, 86713.0, 175337.0, 258739.0, 211824.0, 113217.0, 53872.0, 26185.0, 13646.0, 7479.0, 4410.0, 2593.0, 1637.0, 1016.0, 651.0, 417.0, 284.0, 198.0, 131.0, 99.0, 61.0, 59.0, 39.0, 29.0, 13.0, 18.0, 6.0, 7.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-48.8125, -47.22119140625, -45.6298828125, -44.03857421875, -42.447265625, -40.85595703125, -39.2646484375, -37.67333984375, -36.08203125, -34.49072265625, -32.8994140625, -31.30810546875, -29.716796875, -28.12548828125, -26.5341796875, -24.94287109375, -23.3515625, -21.76025390625, -20.1689453125, -18.57763671875, -16.986328125, -15.39501953125, -13.8037109375, -12.21240234375, -10.62109375, -9.02978515625, -7.4384765625, -5.84716796875, -4.255859375, -2.66455078125, -1.0732421875, 0.51806640625, 2.109375, 3.70068359375, 5.2919921875, 6.88330078125, 8.474609375, 10.06591796875, 11.6572265625, 13.24853515625, 14.83984375, 16.43115234375, 18.0224609375, 19.61376953125, 21.205078125, 22.79638671875, 24.3876953125, 25.97900390625, 27.5703125, 29.16162109375, 30.7529296875, 32.34423828125, 33.935546875, 35.52685546875, 37.1181640625, 38.70947265625, 40.30078125, 41.89208984375, 43.4833984375, 45.07470703125, 46.666015625, 48.25732421875, 49.8486328125, 51.43994140625, 53.03125]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 5.0, 6.0, 5.0, 6.0, 9.0, 18.0, 11.0, 22.0, 14.0, 23.0, 30.0, 24.0, 29.0, 30.0, 34.0, 38.0, 39.0, 38.0, 41.0, 51.0, 33.0, 46.0, 42.0, 41.0, 27.0, 42.0, 35.0, 36.0, 32.0, 44.0, 22.0, 15.0, 22.0, 19.0, 13.0, 16.0, 10.0, 8.0, 4.0, 5.0, 2.0, 4.0, 3.0, 1.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.234375, -17.656005859375, -17.07763671875, -16.499267578125, -15.9208984375, -15.342529296875, -14.76416015625, -14.185791015625, -13.607421875, -13.029052734375, -12.45068359375, -11.872314453125, -11.2939453125, -10.715576171875, -10.13720703125, -9.558837890625, -8.98046875, -8.402099609375, -7.82373046875, -7.245361328125, -6.6669921875, -6.088623046875, -5.51025390625, -4.931884765625, -4.353515625, -3.775146484375, -3.19677734375, -2.618408203125, -2.0400390625, -1.461669921875, -0.88330078125, -0.304931640625, 0.2734375, 0.851806640625, 1.43017578125, 2.008544921875, 2.5869140625, 3.165283203125, 3.74365234375, 4.322021484375, 4.900390625, 5.478759765625, 6.05712890625, 6.635498046875, 7.2138671875, 7.792236328125, 8.37060546875, 8.948974609375, 9.52734375, 10.105712890625, 10.68408203125, 11.262451171875, 11.8408203125, 12.419189453125, 12.99755859375, 13.575927734375, 14.154296875, 14.732666015625, 15.31103515625, 15.889404296875, 16.4677734375, 17.046142578125, 17.62451171875, 18.202880859375, 18.78125]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 4.0, 3.0, 7.0, 9.0, 21.0, 24.0, 37.0, 52.0, 87.0, 102.0, 169.0, 247.0, 421.0, 684.0, 1248.0, 2331.0, 4623.0, 10486.0, 28531.0, 86053.0, 234733.0, 349843.0, 210549.0, 74970.0, 24708.0, 9405.0, 4130.0, 2120.0, 1169.0, 711.0, 358.0, 246.0, 171.0, 95.0, 55.0, 40.0, 24.0, 25.0, 21.0, 14.0, 8.0, 12.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-33.09375, -32.041015625, -30.98828125, -29.935546875, -28.8828125, -27.830078125, -26.77734375, -25.724609375, -24.671875, -23.619140625, -22.56640625, -21.513671875, -20.4609375, -19.408203125, -18.35546875, -17.302734375, -16.25, -15.197265625, -14.14453125, -13.091796875, -12.0390625, -10.986328125, -9.93359375, -8.880859375, -7.828125, -6.775390625, -5.72265625, -4.669921875, -3.6171875, -2.564453125, -1.51171875, -0.458984375, 0.59375, 1.646484375, 2.69921875, 3.751953125, 4.8046875, 5.857421875, 6.91015625, 7.962890625, 9.015625, 10.068359375, 11.12109375, 12.173828125, 13.2265625, 14.279296875, 15.33203125, 16.384765625, 17.4375, 18.490234375, 19.54296875, 20.595703125, 21.6484375, 22.701171875, 23.75390625, 24.806640625, 25.859375, 26.912109375, 27.96484375, 29.017578125, 30.0703125, 31.123046875, 32.17578125, 33.228515625, 34.28125]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 9.0, 11.0, 9.0, 11.0, 30.0, 31.0, 41.0, 45.0, 74.0, 87.0, 92.0, 77.0, 95.0, 79.0, 83.0, 71.0, 37.0, 31.0, 29.0, 14.0, 11.0, 12.0, 5.0, 7.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0031871795654296875, -0.0030979812145233154, -0.0030087828636169434, -0.0029195845127105713, -0.0028303861618041992, -0.002741187810897827, -0.002651989459991455, -0.002562791109085083, -0.002473592758178711, -0.002384394407272339, -0.002295196056365967, -0.0022059977054595947, -0.0021167993545532227, -0.0020276010036468506, -0.0019384026527404785, -0.0018492043018341064, -0.0017600059509277344, -0.0016708076000213623, -0.0015816092491149902, -0.0014924108982086182, -0.001403212547302246, -0.001314014196395874, -0.001224815845489502, -0.0011356174945831299, -0.0010464191436767578, -0.0009572207927703857, -0.0008680224418640137, -0.0007788240909576416, -0.0006896257400512695, -0.0006004273891448975, -0.0005112290382385254, -0.0004220306873321533, -0.00033283233642578125, -0.00024363398551940918, -0.0001544356346130371, -6.523728370666504e-05, 2.396106719970703e-05, 0.0001131594181060791, 0.00020235776901245117, 0.00029155611991882324, 0.0003807544708251953, 0.0004699528217315674, 0.0005591511726379395, 0.0006483495235443115, 0.0007375478744506836, 0.0008267462253570557, 0.0009159445762634277, 0.0010051429271697998, 0.0010943412780761719, 0.001183539628982544, 0.001272737979888916, 0.001361936330795288, 0.0014511346817016602, 0.0015403330326080322, 0.0016295313835144043, 0.0017187297344207764, 0.0018079280853271484, 0.0018971264362335205, 0.0019863247871398926, 0.0020755231380462646, 0.0021647214889526367, 0.002253919839859009, 0.002343118190765381, 0.002432316541671753, 0.002521514892578125]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 16.0, 11.0, 23.0, 23.0, 32.0, 54.0, 92.0, 79.0, 152.0, 185.0, 284.0, 386.0, 669.0, 929.0, 1570.0, 2648.0, 4852.0, 8971.0, 18292.0, 39285.0, 84889.0, 163114.0, 235459.0, 218962.0, 136952.0, 67551.0, 30952.0, 14488.0, 7394.0, 4009.0, 2227.0, 1386.0, 862.0, 554.0, 335.0, 283.0, 195.0, 130.0, 78.0, 56.0, 29.0, 26.0, 22.0, 16.0, 11.0, 6.0, 6.0, 9.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-21.3125, -20.62158203125, -19.9306640625, -19.23974609375, -18.548828125, -17.85791015625, -17.1669921875, -16.47607421875, -15.78515625, -15.09423828125, -14.4033203125, -13.71240234375, -13.021484375, -12.33056640625, -11.6396484375, -10.94873046875, -10.2578125, -9.56689453125, -8.8759765625, -8.18505859375, -7.494140625, -6.80322265625, -6.1123046875, -5.42138671875, -4.73046875, -4.03955078125, -3.3486328125, -2.65771484375, -1.966796875, -1.27587890625, -0.5849609375, 0.10595703125, 0.796875, 1.48779296875, 2.1787109375, 2.86962890625, 3.560546875, 4.25146484375, 4.9423828125, 5.63330078125, 6.32421875, 7.01513671875, 7.7060546875, 8.39697265625, 9.087890625, 9.77880859375, 10.4697265625, 11.16064453125, 11.8515625, 12.54248046875, 13.2333984375, 13.92431640625, 14.615234375, 15.30615234375, 15.9970703125, 16.68798828125, 17.37890625, 18.06982421875, 18.7607421875, 19.45166015625, 20.142578125, 20.83349609375, 21.5244140625, 22.21533203125, 22.90625]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 1.0, 2.0, 8.0, 18.0, 21.0, 24.0, 36.0, 58.0, 56.0, 81.0, 80.0, 78.0, 79.0, 88.0, 74.0, 62.0, 54.0, 47.0, 27.0, 32.0, 20.0, 15.0, 6.0, 6.0, 7.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.1171875, -5.894775390625, -5.67236328125, -5.449951171875, -5.2275390625, -5.005126953125, -4.78271484375, -4.560302734375, -4.337890625, -4.115478515625, -3.89306640625, -3.670654296875, -3.4482421875, -3.225830078125, -3.00341796875, -2.781005859375, -2.55859375, -2.336181640625, -2.11376953125, -1.891357421875, -1.6689453125, -1.446533203125, -1.22412109375, -1.001708984375, -0.779296875, -0.556884765625, -0.33447265625, -0.112060546875, 0.1103515625, 0.332763671875, 0.55517578125, 0.777587890625, 1.0, 1.222412109375, 1.44482421875, 1.667236328125, 1.8896484375, 2.112060546875, 2.33447265625, 2.556884765625, 2.779296875, 3.001708984375, 3.22412109375, 3.446533203125, 3.6689453125, 3.891357421875, 4.11376953125, 4.336181640625, 4.55859375, 4.781005859375, 5.00341796875, 5.225830078125, 5.4482421875, 5.670654296875, 5.89306640625, 6.115478515625, 6.337890625, 6.560302734375, 6.78271484375, 7.005126953125, 7.2275390625, 7.449951171875, 7.67236328125, 7.894775390625, 8.1171875]}, "gradients/decoder.bert.embeddings.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 5.0, 4.0, 5.0, 11.0, 9.0, 9.0, 17.0, 13.0, 24.0, 16.0, 29.0, 43.0, 45.0, 43.0, 38.0, 51.0, 65.0, 59.0, 62.0, 58.0, 51.0, 49.0, 53.0, 53.0, 32.0, 29.0, 24.0, 21.0, 24.0, 13.0, 11.0, 11.0, 4.0, 12.0, 5.0, 4.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.61028289794922, -52.007198333740234, -50.404109954833984, -48.801025390625, -47.197940826416016, -45.59485626220703, -43.99176788330078, -42.3886833190918, -40.78559875488281, -39.18251419067383, -37.57942581176758, -35.976341247558594, -34.37325668334961, -32.770172119140625, -31.167083740234375, -29.56399917602539, -27.96091079711914, -26.357824325561523, -24.75473976135254, -23.151653289794922, -21.548568725585938, -19.94548225402832, -18.342395782470703, -16.73931121826172, -15.136224746704102, -13.5331392288208, -11.9300537109375, -10.326967239379883, -8.723881721496582, -7.120796203613281, -5.517709732055664, -3.9146242141723633, -2.311542510986328, -0.7084567546844482, 0.8946290016174316, 2.4977149963378906, 4.100800514221191, 5.703886032104492, 7.306972503662109, 8.91005802154541, 10.513143539428711, 12.116229057312012, 13.719314575195312, 15.32240104675293, 16.925487518310547, 18.52857208251953, 20.13165855407715, 21.734745025634766, 23.33782958984375, 24.940916061401367, 26.54400062561035, 28.14708709716797, 29.750171661376953, 31.35325813293457, 32.95634460449219, 34.55942916870117, 36.162513732910156, 37.76559829711914, 39.36868667602539, 40.971771240234375, 42.57485580444336, 44.177940368652344, 45.781028747558594, 47.38411331176758, 48.98720169067383]}, "gradients/decoder.bert.embeddings.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 6.0, 7.0, 8.0, 7.0, 9.0, 17.0, 13.0, 11.0, 17.0, 16.0, 25.0, 22.0, 31.0, 23.0, 39.0, 26.0, 35.0, 40.0, 39.0, 36.0, 37.0, 52.0, 41.0, 48.0, 34.0, 43.0, 39.0, 39.0, 37.0, 29.0, 24.0, 14.0, 17.0, 25.0, 17.0, 18.0, 16.0, 11.0, 7.0, 7.0, 3.0, 2.0, 7.0, 1.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-36.49057388305664, -35.39398193359375, -34.29738998413086, -33.20079803466797, -32.10420608520508, -31.007614135742188, -29.911022186279297, -28.814430236816406, -27.717838287353516, -26.621246337890625, -25.524654388427734, -24.428062438964844, -23.331470489501953, -22.234878540039062, -21.138286590576172, -20.04169464111328, -18.945104598999023, -17.848512649536133, -16.751920700073242, -15.655328750610352, -14.558736801147461, -13.46214485168457, -12.365553855895996, -11.268961906433105, -10.172369956970215, -9.075778007507324, -7.979186058044434, -6.882594585418701, -5.7860026359558105, -4.68941068649292, -3.5928192138671875, -2.496227264404297, -1.3996353149414062, -0.3030434846878052, 0.7935483455657959, 1.8901400566101074, 2.986732006072998, 4.083323955535889, 5.179915428161621, 6.276507377624512, 7.373099327087402, 8.469691276550293, 9.566283226013184, 10.662874221801758, 11.759466171264648, 12.856058120727539, 13.95265007019043, 15.04924201965332, 16.14583396911621, 17.2424259185791, 18.339017868041992, 19.435609817504883, 20.532201766967773, 21.628793716430664, 22.725383758544922, 23.821975708007812, 24.918567657470703, 26.015159606933594, 27.111751556396484, 28.208343505859375, 29.304935455322266, 30.401527404785156, 31.498119354248047, 32.59471130371094, 33.69130325317383]}, "gradients/decoder.bert.embeddings.position_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 2.0, 1.0, 7.0, 9.0, 15.0, 18.0, 35.0, 36.0, 45.0, 87.0, 75.0, 146.0, 189.0, 280.0, 418.0, 696.0, 997.0, 1699.0, 2935.0, 5517.0, 14314.0, 483151.0, 5715.0, 3030.0, 1705.0, 1073.0, 667.0, 416.0, 279.0, 207.0, 152.0, 101.0, 78.0, 56.0, 37.0, 27.0, 23.0, 8.0, 10.0, 2.0, 8.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-612.1024169921875, -593.5662841796875, -575.0301513671875, -556.4940185546875, -537.9578857421875, -519.4216918945312, -500.88555908203125, -482.34942626953125, -463.81329345703125, -445.27716064453125, -426.74102783203125, -408.2048645019531, -389.6687316894531, -371.1325988769531, -352.596435546875, -334.060302734375, -315.524169921875, -296.988037109375, -278.451904296875, -259.9157409667969, -241.37960815429688, -222.84347534179688, -204.3073272705078, -185.77117919921875, -167.23504638671875, -148.69891357421875, -130.1627655029297, -111.62662506103516, -93.09048461914062, -74.5543441772461, -56.01820373535156, -37.4820556640625, -18.9459228515625, -0.40978240966796875, 18.126358032226562, 36.662498474121094, 55.198638916015625, 73.73477935791016, 92.27091979980469, 110.80706787109375, 129.34320068359375, 147.87933349609375, 166.4154815673828, 184.95162963867188, 203.48776245117188, 222.02389526367188, 240.56004333496094, 259.09619140625, 277.63232421875, 296.16845703125, 314.70458984375, 333.2407531738281, 351.7768859863281, 370.3130187988281, 388.84918212890625, 407.38531494140625, 425.92144775390625, 444.45758056640625, 462.99371337890625, 481.5298767089844, 500.0660095214844, 518.6021728515625, 537.1383056640625, 555.6744384765625, 574.2105712890625]}, "gradients/decoder.bert.embeddings.token_type_embeddings.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 8.0, 5.0, 7.0, 8.0, 11.0, 13.0, 16.0, 10.0, 12.0, 21.0, 23.0, 19.0, 32.0, 22.0, 29.0, 36.0, 30.0, 35.0, 37.0, 39.0, 41.0, 1068.0, 51.0, 35.0, 43.0, 43.0, 35.0, 39.0, 42.0, 30.0, 26.0, 18.0, 14.0, 23.0, 19.0, 19.0, 15.0, 12.0, 10.0, 7.0, 4.0, 3.0, 5.0, 6.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1139.9310302734375, -1105.94970703125, -1071.9683837890625, -1037.987060546875, -1004.0057373046875, -970.0244140625, -936.0431518554688, -902.0618286132812, -868.0805053710938, -834.0991821289062, -800.1178588867188, -766.1365356445312, -732.1552734375, -698.1739501953125, -664.192626953125, -630.2113037109375, -596.22998046875, -562.2486572265625, -528.267333984375, -494.2860412597656, -460.3047180175781, -426.3233947753906, -392.34210205078125, -358.36077880859375, -324.37945556640625, -290.39813232421875, -256.41680908203125, -222.43551635742188, -188.45419311523438, -154.47286987304688, -120.49156188964844, -86.51025390625, -52.529052734375, -18.54773712158203, 15.433578491210938, 49.414894104003906, 83.39620971679688, 117.37753295898438, 151.3588409423828, 185.34014892578125, 219.32147216796875, 253.30279541015625, 287.28411865234375, 321.2654113769531, 355.2467346191406, 389.2280578613281, 423.2093505859375, 457.190673828125, 491.1719970703125, 525.1533203125, 559.1346435546875, 593.115966796875, 627.0972900390625, 661.07861328125, 695.0598754882812, 729.0411987304688, 763.0225219726562, 797.0038452148438, 830.9851684570312, 864.9664916992188, 898.94775390625, 932.9290771484375, 966.910400390625, 1000.8917236328125, 1034.873046875]}, "gradients/decoder.bert.embeddings.word_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 2.0, 4.0, 4.0, 8.0, 16.0, 21.0, 14.0, 22.0, 38.0, 43.0, 77.0, 132.0, 197.0, 278.0, 421.0, 632.0, 766.0, 1042.0, 1441.0, 1714.0, 2189.0, 2628.0, 3067.0, 3797.0, 4859.0, 5892.0, 7586.0, 12197.0, 209721.0, 30919324.0, 20959.0, 13903.0, 15488.0, 15881.0, 5207.0, 1853.0, 1124.0, 659.0, 456.0, 276.0, 183.0, 123.0, 89.0, 52.0, 47.0, 36.0, 20.0, 13.0, 5.0, 4.0, 1.0, 3.0, 0.0, 4.0, 0.0, 1.0, 1.0], "bins": [-750.5015258789062, -729.7124633789062, -708.9234008789062, -688.1343383789062, -667.3452758789062, -646.5562133789062, -625.7671508789062, -604.9780883789062, -584.1890258789062, -563.3999633789062, -542.6109008789062, -521.8218383789062, -501.03277587890625, -480.24371337890625, -459.45465087890625, -438.66558837890625, -417.87652587890625, -397.08746337890625, -376.29840087890625, -355.50933837890625, -334.72027587890625, -313.93121337890625, -293.14215087890625, -272.35308837890625, -251.56402587890625, -230.77496337890625, -209.98590087890625, -189.19683837890625, -168.40777587890625, -147.61871337890625, -126.82965087890625, -106.04058837890625, -85.2515869140625, -64.4625244140625, -43.6734619140625, -22.8843994140625, -2.0953369140625, 18.6937255859375, 39.4827880859375, 60.2718505859375, 81.0609130859375, 101.8499755859375, 122.6390380859375, 143.4281005859375, 164.2171630859375, 185.0062255859375, 205.7952880859375, 226.5843505859375, 247.3734130859375, 268.1624755859375, 288.9515380859375, 309.7406005859375, 330.5296630859375, 351.3187255859375, 372.1077880859375, 392.8968505859375, 413.6859130859375, 434.4749755859375, 455.2640380859375, 476.0531005859375, 496.8421630859375, 517.6312255859375, 538.4202880859375, 559.2093505859375, 579.9984130859375]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 3.0, 4.0, 3.0, 8.0, 7.0, 16.0, 18.0, 28.0, 52.0, 71.0, 118.0, 194.0, 269.0, 483.0, 783.0, 1441.0, 2604.0, 5017.0, 9728.0, 20067.0, 43914.0, 100178.0, 241347.0, 638248.0, 1962484.0, 2119080.0, 687280.0, 259615.0, 107149.0, 46974.0, 21675.0, 10525.0, 5323.0, 2831.0, 1560.0, 914.0, 601.0, 296.0, 201.0, 94.0, 80.0, 49.0, 42.0, 20.0, 15.0, 11.0, 16.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-141.125, -135.705078125, -130.28515625, -124.865234375, -119.4453125, -114.025390625, -108.60546875, -103.185546875, -97.765625, -92.345703125, -86.92578125, -81.505859375, -76.0859375, -70.666015625, -65.24609375, -59.826171875, -54.40625, -48.986328125, -43.56640625, -38.146484375, -32.7265625, -27.306640625, -21.88671875, -16.466796875, -11.046875, -5.626953125, -0.20703125, 5.212890625, 10.6328125, 16.052734375, 21.47265625, 26.892578125, 32.3125, 37.732421875, 43.15234375, 48.572265625, 53.9921875, 59.412109375, 64.83203125, 70.251953125, 75.671875, 81.091796875, 86.51171875, 91.931640625, 97.3515625, 102.771484375, 108.19140625, 113.611328125, 119.03125, 124.451171875, 129.87109375, 135.291015625, 140.7109375, 146.130859375, 151.55078125, 156.970703125, 162.390625, 167.810546875, 173.23046875, 178.650390625, 184.0703125, 189.490234375, 194.91015625, 200.330078125, 205.75]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 6.0, 7.0, 11.0, 11.0, 21.0, 21.0, 13.0, 28.0, 44.0, 41.0, 54.0, 67.0, 85.0, 101.0, 133.0, 171.0, 205.0, 206.0, 160.0, 145.0, 94.0, 91.0, 54.0, 54.0, 43.0, 32.0, 30.0, 26.0, 18.0, 8.0, 6.0, 7.0, 10.0, 5.0, 3.0, 8.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-55.625, -53.92529296875, -52.2255859375, -50.52587890625, -48.826171875, -47.12646484375, -45.4267578125, -43.72705078125, -42.02734375, -40.32763671875, -38.6279296875, -36.92822265625, -35.228515625, -33.52880859375, -31.8291015625, -30.12939453125, -28.4296875, -26.72998046875, -25.0302734375, -23.33056640625, -21.630859375, -19.93115234375, -18.2314453125, -16.53173828125, -14.83203125, -13.13232421875, -11.4326171875, -9.73291015625, -8.033203125, -6.33349609375, -4.6337890625, -2.93408203125, -1.234375, 0.46533203125, 2.1650390625, 3.86474609375, 5.564453125, 7.26416015625, 8.9638671875, 10.66357421875, 12.36328125, 14.06298828125, 15.7626953125, 17.46240234375, 19.162109375, 20.86181640625, 22.5615234375, 24.26123046875, 25.9609375, 27.66064453125, 29.3603515625, 31.06005859375, 32.759765625, 34.45947265625, 36.1591796875, 37.85888671875, 39.55859375, 41.25830078125, 42.9580078125, 44.65771484375, 46.357421875, 48.05712890625, 49.7568359375, 51.45654296875, 53.15625]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 8.0, 12.0, 14.0, 16.0, 45.0, 59.0, 83.0, 105.0, 172.0, 225.0, 394.0, 689.0, 1024.0, 1571.0, 2621.0, 3897.0, 6289.0, 9876.0, 15718.0, 24680.0, 38929.0, 62252.0, 100162.0, 162907.0, 272335.0, 485602.0, 972947.0, 1635250.0, 1139621.0, 566405.0, 307788.0, 181437.0, 111054.0, 69064.0, 43369.0, 27607.0, 17338.0, 10903.0, 6818.0, 4320.0, 2823.0, 1773.0, 1151.0, 736.0, 461.0, 319.0, 196.0, 120.0, 112.0, 48.0, 36.0, 26.0, 15.0, 8.0, 5.0, 3.0, 7.0, 3.0, 1.0, 1.0], "bins": [-54.0625, -52.3525390625, -50.642578125, -48.9326171875, -47.22265625, -45.5126953125, -43.802734375, -42.0927734375, -40.3828125, -38.6728515625, -36.962890625, -35.2529296875, -33.54296875, -31.8330078125, -30.123046875, -28.4130859375, -26.703125, -24.9931640625, -23.283203125, -21.5732421875, -19.86328125, -18.1533203125, -16.443359375, -14.7333984375, -13.0234375, -11.3134765625, -9.603515625, -7.8935546875, -6.18359375, -4.4736328125, -2.763671875, -1.0537109375, 0.65625, 2.3662109375, 4.076171875, 5.7861328125, 7.49609375, 9.2060546875, 10.916015625, 12.6259765625, 14.3359375, 16.0458984375, 17.755859375, 19.4658203125, 21.17578125, 22.8857421875, 24.595703125, 26.3056640625, 28.015625, 29.7255859375, 31.435546875, 33.1455078125, 34.85546875, 36.5654296875, 38.275390625, 39.9853515625, 41.6953125, 43.4052734375, 45.115234375, 46.8251953125, 48.53515625, 50.2451171875, 51.955078125, 53.6650390625, 55.375]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 6.0, 8.0, 6.0, 14.0, 12.0, 19.0, 19.0, 12.0, 20.0, 25.0, 44.0, 43.0, 59.0, 98.0, 128.0, 182.0, 215.0, 247.0, 222.0, 174.0, 116.0, 75.0, 56.0, 53.0, 49.0, 19.0, 23.0, 15.0, 14.0, 12.0, 11.0, 9.0, 4.0, 5.0, 4.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-85.8125, -83.2900390625, -80.767578125, -78.2451171875, -75.72265625, -73.2001953125, -70.677734375, -68.1552734375, -65.6328125, -63.1103515625, -60.587890625, -58.0654296875, -55.54296875, -53.0205078125, -50.498046875, -47.9755859375, -45.453125, -42.9306640625, -40.408203125, -37.8857421875, -35.36328125, -32.8408203125, -30.318359375, -27.7958984375, -25.2734375, -22.7509765625, -20.228515625, -17.7060546875, -15.18359375, -12.6611328125, -10.138671875, -7.6162109375, -5.09375, -2.5712890625, -0.048828125, 2.4736328125, 4.99609375, 7.5185546875, 10.041015625, 12.5634765625, 15.0859375, 17.6083984375, 20.130859375, 22.6533203125, 25.17578125, 27.6982421875, 30.220703125, 32.7431640625, 35.265625, 37.7880859375, 40.310546875, 42.8330078125, 45.35546875, 47.8779296875, 50.400390625, 52.9228515625, 55.4453125, 57.9677734375, 60.490234375, 63.0126953125, 65.53515625, 68.0576171875, 70.580078125, 73.1025390625, 75.625]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 5.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 14.0, 12.0, 7.0, 28.0, 29.0, 34.0, 55.0, 110.0, 177.0, 194.0, 318.0, 533.0, 997.0, 1583.0, 2824.0, 5285.0, 11007.0, 24701.0, 61328.0, 234189.0, 5724178.0, 139140.0, 46409.0, 19217.0, 8819.0, 4495.0, 2379.0, 1207.0, 743.0, 489.0, 292.0, 198.0, 127.0, 90.0, 46.0, 51.0, 26.0, 25.0, 18.0, 16.0, 11.0, 12.0, 3.0, 11.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-301.5, -292.970703125, -284.44140625, -275.912109375, -267.3828125, -258.853515625, -250.32421875, -241.794921875, -233.265625, -224.736328125, -216.20703125, -207.677734375, -199.1484375, -190.619140625, -182.08984375, -173.560546875, -165.03125, -156.501953125, -147.97265625, -139.443359375, -130.9140625, -122.384765625, -113.85546875, -105.326171875, -96.796875, -88.267578125, -79.73828125, -71.208984375, -62.6796875, -54.150390625, -45.62109375, -37.091796875, -28.5625, -20.033203125, -11.50390625, -2.974609375, 5.5546875, 14.083984375, 22.61328125, 31.142578125, 39.671875, 48.201171875, 56.73046875, 65.259765625, 73.7890625, 82.318359375, 90.84765625, 99.376953125, 107.90625, 116.435546875, 124.96484375, 133.494140625, 142.0234375, 150.552734375, 159.08203125, 167.611328125, 176.140625, 184.669921875, 193.19921875, 201.728515625, 210.2578125, 218.787109375, 227.31640625, 235.845703125, 244.375]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 9.0, 8.0, 11.0, 5.0, 11.0, 14.0, 15.0, 28.0, 28.0, 47.0, 41.0, 82.0, 92.0, 201.0, 434.0, 431.0, 188.0, 93.0, 60.0, 57.0, 34.0, 46.0, 24.0, 17.0, 12.0, 10.0, 7.0, 8.0, 1.0, 9.0, 5.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-146.0, -140.12109375, -134.2421875, -128.36328125, -122.484375, -116.60546875, -110.7265625, -104.84765625, -98.96875, -93.08984375, -87.2109375, -81.33203125, -75.453125, -69.57421875, -63.6953125, -57.81640625, -51.9375, -46.05859375, -40.1796875, -34.30078125, -28.421875, -22.54296875, -16.6640625, -10.78515625, -4.90625, 0.97265625, 6.8515625, 12.73046875, 18.609375, 24.48828125, 30.3671875, 36.24609375, 42.125, 48.00390625, 53.8828125, 59.76171875, 65.640625, 71.51953125, 77.3984375, 83.27734375, 89.15625, 95.03515625, 100.9140625, 106.79296875, 112.671875, 118.55078125, 124.4296875, 130.30859375, 136.1875, 142.06640625, 147.9453125, 153.82421875, 159.703125, 165.58203125, 171.4609375, 177.33984375, 183.21875, 189.09765625, 194.9765625, 200.85546875, 206.734375, 212.61328125, 218.4921875, 224.37109375, 230.25]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 12.0, 5.0, 13.0, 20.0, 27.0, 40.0, 68.0, 110.0, 318.0, 177.0, 86.0, 52.0, 33.0, 20.0, 12.0, 11.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5123.6796875, -4864.41015625, -4605.140625, -4345.87060546875, -4086.60107421875, -3827.33154296875, -3568.061767578125, -3308.7919921875, -3049.5224609375, -2790.2529296875, -2530.983154296875, -2271.71337890625, -2012.44384765625, -1753.1741943359375, -1493.904541015625, -1234.6348876953125, -975.365234375, -716.0955810546875, -456.825927734375, -197.5562744140625, 61.71337890625, 320.9830322265625, 580.252685546875, 839.5223388671875, 1098.7919921875, 1358.0616455078125, 1617.331298828125, 1876.6009521484375, 2135.87060546875, 2395.14013671875, 2654.409912109375, 2913.6796875, 3172.9482421875, 3432.2177734375, 3691.487548828125, 3950.75732421875, 4210.02685546875, 4469.29638671875, 4728.56640625, 4987.8359375, 5247.10546875, 5506.375, 5765.64453125, 6024.91455078125, 6284.18408203125, 6543.45361328125, 6802.7236328125, 7061.9931640625, 7321.2626953125, 7580.5322265625, 7839.8017578125, 8099.07177734375, 8358.341796875, 8617.611328125, 8876.880859375, 9136.150390625, 9395.419921875, 9654.689453125, 9913.958984375, 10173.228515625, 10432.498046875, 10691.7685546875, 10951.0380859375, 11210.3076171875, 11469.5771484375]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 4.0, 2.0, 1.0, 6.0, 5.0, 8.0, 7.0, 3.0, 10.0, 9.0, 14.0, 13.0, 14.0, 21.0, 13.0, 26.0, 24.0, 20.0, 36.0, 50.0, 63.0, 165.0, 161.0, 82.0, 40.0, 33.0, 14.0, 21.0, 15.0, 24.0, 19.0, 17.0, 17.0, 4.0, 9.0, 6.0, 7.0, 8.0, 8.0, 3.0, 4.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5073.2099609375, -4932.59716796875, -4791.984375, -4651.37158203125, -4510.7587890625, -4370.1455078125, -4229.53271484375, -4088.919921875, -3948.30712890625, -3807.6943359375, -3667.08154296875, -3526.468505859375, -3385.855712890625, -3245.242919921875, -3104.6298828125, -2964.01708984375, -2823.404296875, -2682.79150390625, -2542.1787109375, -2401.565673828125, -2260.952880859375, -2120.340087890625, -1979.7271728515625, -1839.1142578125, -1698.50146484375, -1557.888671875, -1417.2757568359375, -1276.662841796875, -1136.050048828125, -995.4371948242188, -854.8243408203125, -714.2114868164062, -573.5986328125, -432.98577880859375, -292.3729248046875, -151.76007080078125, -11.147216796875, 129.46563720703125, 270.0784912109375, 410.69134521484375, 551.30419921875, 691.9170532226562, 832.5299072265625, 973.1427612304688, 1113.755615234375, 1254.368408203125, 1394.9813232421875, 1535.59423828125, 1676.20703125, 1816.81982421875, 1957.4327392578125, 2098.045654296875, 2238.658447265625, 2379.271240234375, 2519.88427734375, 2660.4970703125, 2801.10986328125, 2941.72265625, 3082.33544921875, 3222.948486328125, 3363.561279296875, 3504.174072265625, 3644.787109375, 3785.39990234375, 3926.0126953125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 12.0, 6.0, 22.0, 21.0, 35.0, 43.0, 47.0, 95.0, 122.0, 156.0, 225.0, 304.0, 407.0, 592.0, 864.0, 1186.0, 1716.0, 2475.0, 3778.0, 5744.0, 9231.0, 15546.0, 29199.0, 63338.0, 189407.0, 2546570.0, 1071157.0, 148331.0, 49683.0, 22412.0, 11725.0, 6916.0, 4276.0, 2827.0, 1796.0, 1292.0, 887.0, 593.0, 409.0, 256.0, 174.0, 134.0, 88.0, 56.0, 48.0, 30.0, 21.0, 6.0, 11.0, 7.0, 3.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-36.5, -35.39013671875, -34.2802734375, -33.17041015625, -32.060546875, -30.95068359375, -29.8408203125, -28.73095703125, -27.62109375, -26.51123046875, -25.4013671875, -24.29150390625, -23.181640625, -22.07177734375, -20.9619140625, -19.85205078125, -18.7421875, -17.63232421875, -16.5224609375, -15.41259765625, -14.302734375, -13.19287109375, -12.0830078125, -10.97314453125, -9.86328125, -8.75341796875, -7.6435546875, -6.53369140625, -5.423828125, -4.31396484375, -3.2041015625, -2.09423828125, -0.984375, 0.12548828125, 1.2353515625, 2.34521484375, 3.455078125, 4.56494140625, 5.6748046875, 6.78466796875, 7.89453125, 9.00439453125, 10.1142578125, 11.22412109375, 12.333984375, 13.44384765625, 14.5537109375, 15.66357421875, 16.7734375, 17.88330078125, 18.9931640625, 20.10302734375, 21.212890625, 22.32275390625, 23.4326171875, 24.54248046875, 25.65234375, 26.76220703125, 27.8720703125, 28.98193359375, 30.091796875, 31.20166015625, 32.3115234375, 33.42138671875, 34.53125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 5.0, 2.0, 6.0, 2.0, 6.0, 3.0, 3.0, 12.0, 11.0, 11.0, 14.0, 24.0, 32.0, 34.0, 54.0, 90.0, 159.0, 179.0, 114.0, 62.0, 49.0, 29.0, 26.0, 17.0, 10.0, 10.0, 3.0, 4.0, 6.0, 3.0, 4.0, 6.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-4.2578125, -4.1358642578125, -4.013916015625, -3.8919677734375, -3.77001953125, -3.6480712890625, -3.526123046875, -3.4041748046875, -3.2822265625, -3.1602783203125, -3.038330078125, -2.9163818359375, -2.79443359375, -2.6724853515625, -2.550537109375, -2.4285888671875, -2.306640625, -2.1846923828125, -2.062744140625, -1.9407958984375, -1.81884765625, -1.6968994140625, -1.574951171875, -1.4530029296875, -1.3310546875, -1.2091064453125, -1.087158203125, -0.9652099609375, -0.84326171875, -0.7213134765625, -0.599365234375, -0.4774169921875, -0.35546875, -0.2335205078125, -0.111572265625, 0.0103759765625, 0.13232421875, 0.2542724609375, 0.376220703125, 0.4981689453125, 0.6201171875, 0.7420654296875, 0.864013671875, 0.9859619140625, 1.10791015625, 1.2298583984375, 1.351806640625, 1.4737548828125, 1.595703125, 1.7176513671875, 1.839599609375, 1.9615478515625, 2.08349609375, 2.2054443359375, 2.327392578125, 2.4493408203125, 2.5712890625, 2.6932373046875, 2.815185546875, 2.9371337890625, 3.05908203125, 3.1810302734375, 3.302978515625, 3.4249267578125, 3.546875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 5.0, 4.0, 6.0, 8.0, 13.0, 15.0, 23.0, 33.0, 36.0, 62.0, 78.0, 134.0, 199.0, 326.0, 477.0, 819.0, 1511.0, 3073.0, 6990.0, 18029.0, 58138.0, 251452.0, 1750099.0, 1760413.0, 251177.0, 58457.0, 18160.0, 7199.0, 3179.0, 1677.0, 909.0, 543.0, 349.0, 208.0, 157.0, 103.0, 69.0, 52.0, 29.0, 25.0, 23.0, 9.0, 4.0, 6.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-48.0625, -46.64892578125, -45.2353515625, -43.82177734375, -42.408203125, -40.99462890625, -39.5810546875, -38.16748046875, -36.75390625, -35.34033203125, -33.9267578125, -32.51318359375, -31.099609375, -29.68603515625, -28.2724609375, -26.85888671875, -25.4453125, -24.03173828125, -22.6181640625, -21.20458984375, -19.791015625, -18.37744140625, -16.9638671875, -15.55029296875, -14.13671875, -12.72314453125, -11.3095703125, -9.89599609375, -8.482421875, -7.06884765625, -5.6552734375, -4.24169921875, -2.828125, -1.41455078125, -0.0009765625, 1.41259765625, 2.826171875, 4.23974609375, 5.6533203125, 7.06689453125, 8.48046875, 9.89404296875, 11.3076171875, 12.72119140625, 14.134765625, 15.54833984375, 16.9619140625, 18.37548828125, 19.7890625, 21.20263671875, 22.6162109375, 24.02978515625, 25.443359375, 26.85693359375, 28.2705078125, 29.68408203125, 31.09765625, 32.51123046875, 33.9248046875, 35.33837890625, 36.751953125, 38.16552734375, 39.5791015625, 40.99267578125, 42.40625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 5.0, 9.0, 3.0, 9.0, 21.0, 27.0, 26.0, 27.0, 48.0, 65.0, 54.0, 95.0, 104.0, 120.0, 194.0, 269.0, 373.0, 630.0, 590.0, 352.0, 260.0, 170.0, 136.0, 114.0, 72.0, 66.0, 44.0, 49.0, 43.0, 19.0, 23.0, 12.0, 11.0, 12.0, 4.0, 6.0, 3.0, 6.0, 0.0, 4.0, 1.0, 3.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.640625, -10.2459716796875, -9.851318359375, -9.4566650390625, -9.06201171875, -8.6673583984375, -8.272705078125, -7.8780517578125, -7.4833984375, -7.0887451171875, -6.694091796875, -6.2994384765625, -5.90478515625, -5.5101318359375, -5.115478515625, -4.7208251953125, -4.326171875, -3.9315185546875, -3.536865234375, -3.1422119140625, -2.74755859375, -2.3529052734375, -1.958251953125, -1.5635986328125, -1.1689453125, -0.7742919921875, -0.379638671875, 0.0150146484375, 0.40966796875, 0.8043212890625, 1.198974609375, 1.5936279296875, 1.98828125, 2.3829345703125, 2.777587890625, 3.1722412109375, 3.56689453125, 3.9615478515625, 4.356201171875, 4.7508544921875, 5.1455078125, 5.5401611328125, 5.934814453125, 6.3294677734375, 6.72412109375, 7.1187744140625, 7.513427734375, 7.9080810546875, 8.302734375, 8.6973876953125, 9.092041015625, 9.4866943359375, 9.88134765625, 10.2760009765625, 10.670654296875, 11.0653076171875, 11.4599609375, 11.8546142578125, 12.249267578125, 12.6439208984375, 13.03857421875, 13.4332275390625, 13.827880859375, 14.2225341796875, 14.6171875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 7.0, 5.0, 4.0, 16.0, 18.0, 25.0, 34.0, 43.0, 60.0, 87.0, 108.0, 109.0, 115.0, 76.0, 76.0, 58.0, 53.0, 33.0, 13.0, 16.0, 11.0, 13.0, 3.0, 5.0, 8.0, 0.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-157.7928466796875, -153.80645751953125, -149.82005310058594, -145.8336639404297, -141.84727478027344, -137.86087036132812, -133.87448120117188, -129.88809204101562, -125.90169525146484, -121.91529846191406, -117.92890930175781, -113.94251251220703, -109.95611572265625, -105.9697265625, -101.98332977294922, -97.99693298339844, -94.01054382324219, -90.0241470336914, -86.03775787353516, -82.05136108398438, -78.0649642944336, -74.07857513427734, -70.09217834472656, -66.10578918457031, -62.119384765625, -58.132991790771484, -54.1465950012207, -50.16020202636719, -46.17380905151367, -42.187416076660156, -38.201019287109375, -34.21462631225586, -30.228233337402344, -26.241838455200195, -22.25544548034668, -18.26905059814453, -14.2826566696167, -10.296262741088867, -6.309867858886719, -2.323474884033203, 1.6629199981689453, 5.649313926696777, 9.63570785522461, 13.622102737426758, 17.608497619628906, 21.594890594482422, 25.58128547668457, 29.567678451538086, 33.554073333740234, 37.54046630859375, 41.52686309814453, 45.51325607299805, 49.49964904785156, 53.486045837402344, 57.47243881225586, 61.458831787109375, 65.44522857666016, 69.43162536621094, 73.41801452636719, 77.40441131591797, 81.39080810546875, 85.377197265625, 89.36359405517578, 93.34999084472656, 97.33638000488281]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 0.0, 5.0, 10.0, 8.0, 15.0, 22.0, 20.0, 26.0, 20.0, 36.0, 41.0, 43.0, 33.0, 49.0, 44.0, 53.0, 55.0, 56.0, 49.0, 58.0, 48.0, 38.0, 53.0, 37.0, 40.0, 25.0, 26.0, 24.0, 17.0, 9.0, 15.0, 12.0, 1.0, 5.0, 5.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-90.92772674560547, -87.76943969726562, -84.61116027832031, -81.45287322998047, -78.29458618164062, -75.13629913330078, -71.97801208496094, -68.81973266601562, -65.66144561767578, -62.50315856933594, -59.34487533569336, -56.18659210205078, -53.02830505371094, -49.870018005371094, -46.711734771728516, -43.55345153808594, -40.395164489746094, -37.23687744140625, -34.07859420776367, -30.92030906677246, -27.76202392578125, -24.60373878479004, -21.445453643798828, -18.287168502807617, -15.128883361816406, -11.970598220825195, -8.812313079833984, -5.654027938842773, -2.4957427978515625, 0.6625423431396484, 3.8208274841308594, 6.97911262512207, 10.13739013671875, 13.295675277709961, 16.453960418701172, 19.612245559692383, 22.770530700683594, 25.928815841674805, 29.087100982666016, 32.245384216308594, 35.40367126464844, 38.56195831298828, 41.72024154663086, 44.87852478027344, 48.03681182861328, 51.195098876953125, 54.3533821105957, 57.51166534423828, 60.669952392578125, 63.82823944091797, 66.98652648925781, 70.14480590820312, 73.30309295654297, 76.46138000488281, 79.61965942382812, 82.77794647216797, 85.93623352050781, 89.09452056884766, 92.2528076171875, 95.41108703613281, 98.56937408447266, 101.7276611328125, 104.88594055175781, 108.04422760009766, 111.2025146484375]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 2.0, 7.0, 6.0, 9.0, 7.0, 15.0, 23.0, 40.0, 53.0, 66.0, 101.0, 160.0, 202.0, 296.0, 444.0, 657.0, 1022.0, 1545.0, 2488.0, 4178.0, 7320.0, 14153.0, 30010.0, 75875.0, 271210.0, 437781.0, 117765.0, 41972.0, 18420.0, 9199.0, 4974.0, 3063.0, 1896.0, 1196.0, 765.0, 497.0, 343.0, 248.0, 148.0, 124.0, 74.0, 61.0, 40.0, 27.0, 19.0, 19.0, 11.0, 6.0, 8.0, 5.0, 6.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-23.65625, -22.92138671875, -22.1865234375, -21.45166015625, -20.716796875, -19.98193359375, -19.2470703125, -18.51220703125, -17.77734375, -17.04248046875, -16.3076171875, -15.57275390625, -14.837890625, -14.10302734375, -13.3681640625, -12.63330078125, -11.8984375, -11.16357421875, -10.4287109375, -9.69384765625, -8.958984375, -8.22412109375, -7.4892578125, -6.75439453125, -6.01953125, -5.28466796875, -4.5498046875, -3.81494140625, -3.080078125, -2.34521484375, -1.6103515625, -0.87548828125, -0.140625, 0.59423828125, 1.3291015625, 2.06396484375, 2.798828125, 3.53369140625, 4.2685546875, 5.00341796875, 5.73828125, 6.47314453125, 7.2080078125, 7.94287109375, 8.677734375, 9.41259765625, 10.1474609375, 10.88232421875, 11.6171875, 12.35205078125, 13.0869140625, 13.82177734375, 14.556640625, 15.29150390625, 16.0263671875, 16.76123046875, 17.49609375, 18.23095703125, 18.9658203125, 19.70068359375, 20.435546875, 21.17041015625, 21.9052734375, 22.64013671875, 23.375]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 10.0, 2.0, 6.0, 5.0, 10.0, 15.0, 14.0, 27.0, 23.0, 36.0, 35.0, 42.0, 65.0, 63.0, 58.0, 73.0, 95.0, 83.0, 67.0, 61.0, 51.0, 36.0, 21.0, 22.0, 15.0, 13.0, 8.0, 8.0, 6.0, 3.0, 7.0, 2.0, 4.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.375, -4.2412109375, -4.107421875, -3.9736328125, -3.83984375, -3.7060546875, -3.572265625, -3.4384765625, -3.3046875, -3.1708984375, -3.037109375, -2.9033203125, -2.76953125, -2.6357421875, -2.501953125, -2.3681640625, -2.234375, -2.1005859375, -1.966796875, -1.8330078125, -1.69921875, -1.5654296875, -1.431640625, -1.2978515625, -1.1640625, -1.0302734375, -0.896484375, -0.7626953125, -0.62890625, -0.4951171875, -0.361328125, -0.2275390625, -0.09375, 0.0400390625, 0.173828125, 0.3076171875, 0.44140625, 0.5751953125, 0.708984375, 0.8427734375, 0.9765625, 1.1103515625, 1.244140625, 1.3779296875, 1.51171875, 1.6455078125, 1.779296875, 1.9130859375, 2.046875, 2.1806640625, 2.314453125, 2.4482421875, 2.58203125, 2.7158203125, 2.849609375, 2.9833984375, 3.1171875, 3.2509765625, 3.384765625, 3.5185546875, 3.65234375, 3.7861328125, 3.919921875, 4.0537109375, 4.1875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 4.0, 11.0, 21.0, 30.0, 31.0, 40.0, 68.0, 84.0, 151.0, 183.0, 315.0, 475.0, 731.0, 1251.0, 2127.0, 3935.0, 7450.0, 15220.0, 35389.0, 96594.0, 340693.0, 369565.0, 103375.0, 37222.0, 16092.0, 7653.0, 4057.0, 2261.0, 1293.0, 798.0, 518.0, 278.0, 191.0, 135.0, 105.0, 75.0, 41.0, 36.0, 17.0, 12.0, 12.0, 8.0, 7.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-21.046875, -20.40966796875, -19.7724609375, -19.13525390625, -18.498046875, -17.86083984375, -17.2236328125, -16.58642578125, -15.94921875, -15.31201171875, -14.6748046875, -14.03759765625, -13.400390625, -12.76318359375, -12.1259765625, -11.48876953125, -10.8515625, -10.21435546875, -9.5771484375, -8.93994140625, -8.302734375, -7.66552734375, -7.0283203125, -6.39111328125, -5.75390625, -5.11669921875, -4.4794921875, -3.84228515625, -3.205078125, -2.56787109375, -1.9306640625, -1.29345703125, -0.65625, -0.01904296875, 0.6181640625, 1.25537109375, 1.892578125, 2.52978515625, 3.1669921875, 3.80419921875, 4.44140625, 5.07861328125, 5.7158203125, 6.35302734375, 6.990234375, 7.62744140625, 8.2646484375, 8.90185546875, 9.5390625, 10.17626953125, 10.8134765625, 11.45068359375, 12.087890625, 12.72509765625, 13.3623046875, 13.99951171875, 14.63671875, 15.27392578125, 15.9111328125, 16.54833984375, 17.185546875, 17.82275390625, 18.4599609375, 19.09716796875, 19.734375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 2.0, 6.0, 2.0, 6.0, 4.0, 9.0, 10.0, 8.0, 11.0, 14.0, 30.0, 25.0, 29.0, 26.0, 23.0, 34.0, 32.0, 48.0, 37.0, 38.0, 42.0, 39.0, 30.0, 38.0, 35.0, 43.0, 30.0, 38.0, 45.0, 33.0, 36.0, 24.0, 19.0, 19.0, 30.0, 19.0, 12.0, 14.0, 8.0, 15.0, 7.0, 7.0, 9.0, 8.0, 0.0, 2.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-17.453125, -16.874755859375, -16.29638671875, -15.718017578125, -15.1396484375, -14.561279296875, -13.98291015625, -13.404541015625, -12.826171875, -12.247802734375, -11.66943359375, -11.091064453125, -10.5126953125, -9.934326171875, -9.35595703125, -8.777587890625, -8.19921875, -7.620849609375, -7.04248046875, -6.464111328125, -5.8857421875, -5.307373046875, -4.72900390625, -4.150634765625, -3.572265625, -2.993896484375, -2.41552734375, -1.837158203125, -1.2587890625, -0.680419921875, -0.10205078125, 0.476318359375, 1.0546875, 1.633056640625, 2.21142578125, 2.789794921875, 3.3681640625, 3.946533203125, 4.52490234375, 5.103271484375, 5.681640625, 6.260009765625, 6.83837890625, 7.416748046875, 7.9951171875, 8.573486328125, 9.15185546875, 9.730224609375, 10.30859375, 10.886962890625, 11.46533203125, 12.043701171875, 12.6220703125, 13.200439453125, 13.77880859375, 14.357177734375, 14.935546875, 15.513916015625, 16.09228515625, 16.670654296875, 17.2490234375, 17.827392578125, 18.40576171875, 18.984130859375, 19.5625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 6.0, 5.0, 5.0, 12.0, 15.0, 30.0, 33.0, 49.0, 92.0, 161.0, 243.0, 492.0, 877.0, 2052.0, 4695.0, 13506.0, 55588.0, 379313.0, 491883.0, 72837.0, 16513.0, 5610.0, 2250.0, 1054.0, 506.0, 281.0, 154.0, 98.0, 65.0, 43.0, 23.0, 19.0, 13.0, 9.0, 11.0, 5.0, 4.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.0, -20.3837890625, -19.767578125, -19.1513671875, -18.53515625, -17.9189453125, -17.302734375, -16.6865234375, -16.0703125, -15.4541015625, -14.837890625, -14.2216796875, -13.60546875, -12.9892578125, -12.373046875, -11.7568359375, -11.140625, -10.5244140625, -9.908203125, -9.2919921875, -8.67578125, -8.0595703125, -7.443359375, -6.8271484375, -6.2109375, -5.5947265625, -4.978515625, -4.3623046875, -3.74609375, -3.1298828125, -2.513671875, -1.8974609375, -1.28125, -0.6650390625, -0.048828125, 0.5673828125, 1.18359375, 1.7998046875, 2.416015625, 3.0322265625, 3.6484375, 4.2646484375, 4.880859375, 5.4970703125, 6.11328125, 6.7294921875, 7.345703125, 7.9619140625, 8.578125, 9.1943359375, 9.810546875, 10.4267578125, 11.04296875, 11.6591796875, 12.275390625, 12.8916015625, 13.5078125, 14.1240234375, 14.740234375, 15.3564453125, 15.97265625, 16.5888671875, 17.205078125, 17.8212890625, 18.4375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 8.0, 5.0, 11.0, 13.0, 23.0, 28.0, 51.0, 58.0, 76.0, 110.0, 98.0, 109.0, 95.0, 78.0, 62.0, 48.0, 40.0, 29.0, 18.0, 15.0, 10.0, 7.0, 7.0, 5.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003840923309326172, -0.00036393478512763977, -0.00034377723932266235, -0.00032361969351768494, -0.0003034621477127075, -0.0002833046019077301, -0.0002631470561027527, -0.00024298951029777527, -0.00022283196449279785, -0.00020267441868782043, -0.00018251687288284302, -0.0001623593270778656, -0.00014220178127288818, -0.00012204423546791077, -0.00010188668966293335, -8.172914385795593e-05, -6.157159805297852e-05, -4.14140522480011e-05, -2.125650644302368e-05, -1.0989606380462646e-06, 1.9058585166931152e-05, 3.921613097190857e-05, 5.9373676776885986e-05, 7.95312225818634e-05, 9.968876838684082e-05, 0.00011984631419181824, 0.00014000385999679565, 0.00016016140580177307, 0.0001803189516067505, 0.0002004764974117279, 0.00022063404321670532, 0.00024079158902168274, 0.00026094913482666016, 0.0002811066806316376, 0.000301264226436615, 0.0003214217722415924, 0.0003415793180465698, 0.00036173686385154724, 0.00038189440965652466, 0.0004020519554615021, 0.0004222095012664795, 0.0004423670470714569, 0.0004625245928764343, 0.00048268213868141174, 0.0005028396844863892, 0.0005229972302913666, 0.000543154776096344, 0.0005633123219013214, 0.0005834698677062988, 0.0006036274135112762, 0.0006237849593162537, 0.0006439425051212311, 0.0006641000509262085, 0.0006842575967311859, 0.0007044151425361633, 0.0007245726883411407, 0.0007447302341461182, 0.0007648877799510956, 0.000785045325756073, 0.0008052028715610504, 0.0008253604173660278, 0.0008455179631710052, 0.0008656755089759827, 0.0008858330547809601, 0.0009059906005859375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 15.0, 8.0, 26.0, 29.0, 46.0, 78.0, 120.0, 211.0, 370.0, 771.0, 1670.0, 4083.0, 12067.0, 45965.0, 269404.0, 567870.0, 110577.0, 23310.0, 6971.0, 2589.0, 1152.0, 529.0, 273.0, 152.0, 92.0, 78.0, 27.0, 22.0, 11.0, 15.0, 6.0, 4.0, 5.0, 5.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.0625, -18.4326171875, -17.802734375, -17.1728515625, -16.54296875, -15.9130859375, -15.283203125, -14.6533203125, -14.0234375, -13.3935546875, -12.763671875, -12.1337890625, -11.50390625, -10.8740234375, -10.244140625, -9.6142578125, -8.984375, -8.3544921875, -7.724609375, -7.0947265625, -6.46484375, -5.8349609375, -5.205078125, -4.5751953125, -3.9453125, -3.3154296875, -2.685546875, -2.0556640625, -1.42578125, -0.7958984375, -0.166015625, 0.4638671875, 1.09375, 1.7236328125, 2.353515625, 2.9833984375, 3.61328125, 4.2431640625, 4.873046875, 5.5029296875, 6.1328125, 6.7626953125, 7.392578125, 8.0224609375, 8.65234375, 9.2822265625, 9.912109375, 10.5419921875, 11.171875, 11.8017578125, 12.431640625, 13.0615234375, 13.69140625, 14.3212890625, 14.951171875, 15.5810546875, 16.2109375, 16.8408203125, 17.470703125, 18.1005859375, 18.73046875, 19.3603515625, 19.990234375, 20.6201171875, 21.25]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 6.0, 3.0, 7.0, 6.0, 8.0, 15.0, 9.0, 7.0, 15.0, 17.0, 24.0, 21.0, 41.0, 55.0, 53.0, 70.0, 68.0, 52.0, 79.0, 73.0, 67.0, 59.0, 43.0, 48.0, 38.0, 22.0, 20.0, 16.0, 17.0, 15.0, 12.0, 3.0, 6.0, 4.0, 1.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-11.0390625, -10.7445068359375, -10.449951171875, -10.1553955078125, -9.86083984375, -9.5662841796875, -9.271728515625, -8.9771728515625, -8.6826171875, -8.3880615234375, -8.093505859375, -7.7989501953125, -7.50439453125, -7.2098388671875, -6.915283203125, -6.6207275390625, -6.326171875, -6.0316162109375, -5.737060546875, -5.4425048828125, -5.14794921875, -4.8533935546875, -4.558837890625, -4.2642822265625, -3.9697265625, -3.6751708984375, -3.380615234375, -3.0860595703125, -2.79150390625, -2.4969482421875, -2.202392578125, -1.9078369140625, -1.61328125, -1.3187255859375, -1.024169921875, -0.7296142578125, -0.43505859375, -0.1405029296875, 0.154052734375, 0.4486083984375, 0.7431640625, 1.0377197265625, 1.332275390625, 1.6268310546875, 1.92138671875, 2.2159423828125, 2.510498046875, 2.8050537109375, 3.099609375, 3.3941650390625, 3.688720703125, 3.9832763671875, 4.27783203125, 4.5723876953125, 4.866943359375, 5.1614990234375, 5.4560546875, 5.7506103515625, 6.045166015625, 6.3397216796875, 6.63427734375, 6.9288330078125, 7.223388671875, 7.5179443359375, 7.8125]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 9.0, 12.0, 13.0, 48.0, 111.0, 347.0, 301.0, 105.0, 32.0, 8.0, 10.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-613.5601806640625, -600.1788940429688, -586.797607421875, -573.416259765625, -560.0349731445312, -546.6536865234375, -533.2723999023438, -519.89111328125, -506.5097961425781, -493.1285095214844, -479.7471923828125, -466.36590576171875, -452.984619140625, -439.6033020019531, -426.2220153808594, -412.8406982421875, -399.45941162109375, -386.078125, -372.6968078613281, -359.3155212402344, -345.9342346191406, -332.55291748046875, -319.171630859375, -305.79034423828125, -292.4090576171875, -279.02777099609375, -265.6464538574219, -252.26516723632812, -238.8838653564453, -225.5025634765625, -212.12127685546875, -198.73997497558594, -185.3586883544922, -171.97738647460938, -158.59609985351562, -145.2147979736328, -131.83349609375, -118.45220184326172, -105.07090759277344, -91.68960571289062, -78.30831146240234, -64.92701721191406, -51.54571533203125, -38.16442108154297, -24.783123016357422, -11.401824951171875, 1.9794692993164062, 15.360771179199219, 28.7420654296875, 42.12336349487305, 55.504661560058594, 68.88595581054688, 82.26725769042969, 95.64855194091797, 109.02984619140625, 122.41114807128906, 135.79244995117188, 149.1737518310547, 162.55503845214844, 175.93634033203125, 189.31764221191406, 202.69894409179688, 216.08023071289062, 229.46153259277344, 242.8428192138672]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 2.0, 1.0, 4.0, 13.0, 8.0, 11.0, 21.0, 25.0, 45.0, 88.0, 117.0, 143.0, 156.0, 114.0, 81.0, 54.0, 33.0, 22.0, 10.0, 6.0, 4.0, 6.0, 4.0, 8.0, 3.0, 5.0, 2.0, 4.0, 3.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-342.6025390625, -331.60174560546875, -320.6009521484375, -309.60015869140625, -298.599365234375, -287.59857177734375, -276.5977783203125, -265.59698486328125, -254.59619140625, -243.59539794921875, -232.5946044921875, -221.59381103515625, -210.593017578125, -199.59222412109375, -188.5914306640625, -177.59063720703125, -166.58982849121094, -155.5890350341797, -144.58824157714844, -133.5874481201172, -122.58665466308594, -111.58586120605469, -100.5850601196289, -89.58426666259766, -78.5834732055664, -67.58267974853516, -56.581886291503906, -45.58108901977539, -34.58029556274414, -23.57950210571289, -12.578704833984375, -1.577911376953125, 9.422882080078125, 20.423675537109375, 31.424470901489258, 42.42526626586914, 53.42605972290039, 64.42684936523438, 75.42765045166016, 86.4284439086914, 97.42923736572266, 108.4300308227539, 119.43082427978516, 130.43162536621094, 141.4324188232422, 152.43321228027344, 163.4340057373047, 174.43479919433594, 185.4355926513672, 196.43638610839844, 207.4371795654297, 218.43797302246094, 229.4387664794922, 240.43955993652344, 251.44036865234375, 262.441162109375, 273.44195556640625, 284.4427490234375, 295.44354248046875, 306.4443359375, 317.44512939453125, 328.4459228515625, 339.44671630859375, 350.447509765625, 361.44830322265625]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 1.0, 7.0, 2.0, 6.0, 12.0, 12.0, 18.0, 27.0, 42.0, 67.0, 106.0, 162.0, 271.0, 470.0, 866.0, 1599.0, 3434.0, 7804.0, 20276.0, 70386.0, 608678.0, 3312271.0, 117650.0, 29291.0, 10571.0, 4675.0, 2337.0, 1278.0, 708.0, 433.0, 280.0, 169.0, 120.0, 87.0, 49.0, 30.0, 26.0, 16.0, 8.0, 12.0, 4.0, 2.0, 7.0, 8.0, 2.0, 1.0, 2.0, 0.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.0625, -58.89453125, -56.7265625, -54.55859375, -52.390625, -50.22265625, -48.0546875, -45.88671875, -43.71875, -41.55078125, -39.3828125, -37.21484375, -35.046875, -32.87890625, -30.7109375, -28.54296875, -26.375, -24.20703125, -22.0390625, -19.87109375, -17.703125, -15.53515625, -13.3671875, -11.19921875, -9.03125, -6.86328125, -4.6953125, -2.52734375, -0.359375, 1.80859375, 3.9765625, 6.14453125, 8.3125, 10.48046875, 12.6484375, 14.81640625, 16.984375, 19.15234375, 21.3203125, 23.48828125, 25.65625, 27.82421875, 29.9921875, 32.16015625, 34.328125, 36.49609375, 38.6640625, 40.83203125, 43.0, 45.16796875, 47.3359375, 49.50390625, 51.671875, 53.83984375, 56.0078125, 58.17578125, 60.34375, 62.51171875, 64.6796875, 66.84765625, 69.015625, 71.18359375, 73.3515625, 75.51953125, 77.6875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 9.0, 10.0, 4.0, 5.0, 10.0, 13.0, 12.0, 19.0, 28.0, 32.0, 42.0, 40.0, 52.0, 65.0, 39.0, 80.0, 73.0, 66.0, 78.0, 45.0, 50.0, 49.0, 38.0, 23.0, 23.0, 19.0, 16.0, 11.0, 11.0, 6.0, 8.0, 0.0, 3.0, 2.0, 6.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-3.95703125, -3.82763671875, -3.6982421875, -3.56884765625, -3.439453125, -3.31005859375, -3.1806640625, -3.05126953125, -2.921875, -2.79248046875, -2.6630859375, -2.53369140625, -2.404296875, -2.27490234375, -2.1455078125, -2.01611328125, -1.88671875, -1.75732421875, -1.6279296875, -1.49853515625, -1.369140625, -1.23974609375, -1.1103515625, -0.98095703125, -0.8515625, -0.72216796875, -0.5927734375, -0.46337890625, -0.333984375, -0.20458984375, -0.0751953125, 0.05419921875, 0.18359375, 0.31298828125, 0.4423828125, 0.57177734375, 0.701171875, 0.83056640625, 0.9599609375, 1.08935546875, 1.21875, 1.34814453125, 1.4775390625, 1.60693359375, 1.736328125, 1.86572265625, 1.9951171875, 2.12451171875, 2.25390625, 2.38330078125, 2.5126953125, 2.64208984375, 2.771484375, 2.90087890625, 3.0302734375, 3.15966796875, 3.2890625, 3.41845703125, 3.5478515625, 3.67724609375, 3.806640625, 3.93603515625, 4.0654296875, 4.19482421875, 4.32421875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 7.0, 7.0, 12.0, 11.0, 19.0, 20.0, 37.0, 61.0, 86.0, 126.0, 174.0, 321.0, 514.0, 901.0, 1518.0, 2787.0, 5564.0, 11529.0, 27173.0, 73102.0, 258875.0, 2617672.0, 933711.0, 168441.0, 52456.0, 20592.0, 8907.0, 4272.0, 2225.0, 1284.0, 706.0, 426.0, 270.0, 154.0, 110.0, 69.0, 50.0, 29.0, 17.0, 18.0, 11.0, 9.0, 5.0, 4.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-46.3125, -44.81103515625, -43.3095703125, -41.80810546875, -40.306640625, -38.80517578125, -37.3037109375, -35.80224609375, -34.30078125, -32.79931640625, -31.2978515625, -29.79638671875, -28.294921875, -26.79345703125, -25.2919921875, -23.79052734375, -22.2890625, -20.78759765625, -19.2861328125, -17.78466796875, -16.283203125, -14.78173828125, -13.2802734375, -11.77880859375, -10.27734375, -8.77587890625, -7.2744140625, -5.77294921875, -4.271484375, -2.77001953125, -1.2685546875, 0.23291015625, 1.734375, 3.23583984375, 4.7373046875, 6.23876953125, 7.740234375, 9.24169921875, 10.7431640625, 12.24462890625, 13.74609375, 15.24755859375, 16.7490234375, 18.25048828125, 19.751953125, 21.25341796875, 22.7548828125, 24.25634765625, 25.7578125, 27.25927734375, 28.7607421875, 30.26220703125, 31.763671875, 33.26513671875, 34.7666015625, 36.26806640625, 37.76953125, 39.27099609375, 40.7724609375, 42.27392578125, 43.775390625, 45.27685546875, 46.7783203125, 48.27978515625, 49.78125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 2.0, 3.0, 3.0, 2.0, 7.0, 7.0, 9.0, 11.0, 17.0, 28.0, 13.0, 33.0, 45.0, 59.0, 94.0, 137.0, 221.0, 403.0, 1508.0, 615.0, 300.0, 172.0, 108.0, 81.0, 53.0, 36.0, 28.0, 16.0, 19.0, 7.0, 10.0, 6.0, 6.0, 8.0, 5.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.46875, -10.1485595703125, -9.828369140625, -9.5081787109375, -9.18798828125, -8.8677978515625, -8.547607421875, -8.2274169921875, -7.9072265625, -7.5870361328125, -7.266845703125, -6.9466552734375, -6.62646484375, -6.3062744140625, -5.986083984375, -5.6658935546875, -5.345703125, -5.0255126953125, -4.705322265625, -4.3851318359375, -4.06494140625, -3.7447509765625, -3.424560546875, -3.1043701171875, -2.7841796875, -2.4639892578125, -2.143798828125, -1.8236083984375, -1.50341796875, -1.1832275390625, -0.863037109375, -0.5428466796875, -0.22265625, 0.0975341796875, 0.417724609375, 0.7379150390625, 1.05810546875, 1.3782958984375, 1.698486328125, 2.0186767578125, 2.3388671875, 2.6590576171875, 2.979248046875, 3.2994384765625, 3.61962890625, 3.9398193359375, 4.260009765625, 4.5802001953125, 4.900390625, 5.2205810546875, 5.540771484375, 5.8609619140625, 6.18115234375, 6.5013427734375, 6.821533203125, 7.1417236328125, 7.4619140625, 7.7821044921875, 8.102294921875, 8.4224853515625, 8.74267578125, 9.0628662109375, 9.383056640625, 9.7032470703125, 10.0234375]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 4.0, 1.0, 5.0, 4.0, 7.0, 21.0, 38.0, 107.0, 222.0, 272.0, 195.0, 91.0, 27.0, 11.0, 6.0, 2.0, 2.0, 1.0], "bins": [-244.48631286621094, -240.07911682128906, -235.6719207763672, -231.2647247314453, -226.85752868652344, -222.45033264160156, -218.0431365966797, -213.6359405517578, -209.22874450683594, -204.82154846191406, -200.4143524169922, -196.0071563720703, -191.59996032714844, -187.19276428222656, -182.7855682373047, -178.3783721923828, -173.97119140625, -169.56399536132812, -165.15679931640625, -160.74960327148438, -156.3424072265625, -151.93521118164062, -147.52801513671875, -143.12081909179688, -138.713623046875, -134.30642700195312, -129.89923095703125, -125.49203491210938, -121.0848388671875, -116.67764282226562, -112.27044677734375, -107.86325073242188, -103.45603942871094, -99.04884338378906, -94.64164733886719, -90.23445129394531, -85.82725524902344, -81.42005920410156, -77.01286315917969, -72.60566711425781, -68.19847869873047, -63.791282653808594, -59.38408660888672, -54.976890563964844, -50.56969451904297, -46.162498474121094, -41.755306243896484, -37.34811019897461, -32.940914154052734, -28.53371810913086, -24.126522064208984, -19.719327926635742, -15.312131881713867, -10.904935836791992, -6.49774169921875, -2.090545654296875, 2.316650390625, 6.723845958709717, 11.131041526794434, 15.538236618041992, 19.945432662963867, 24.352628707885742, 28.759822845458984, 33.16701889038086, 37.574214935302734]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 7.0, 5.0, 6.0, 3.0, 7.0, 9.0, 15.0, 24.0, 19.0, 28.0, 38.0, 48.0, 44.0, 45.0, 60.0, 64.0, 47.0, 69.0, 62.0, 67.0, 49.0, 55.0, 50.0, 48.0, 39.0, 26.0, 21.0, 14.0, 17.0, 10.0, 4.0, 3.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.72093200683594, -49.16692352294922, -47.6129150390625, -46.05890655517578, -44.50489807128906, -42.95089340209961, -41.39688491821289, -39.84287643432617, -38.28886795043945, -36.734859466552734, -35.180850982666016, -33.6268424987793, -32.072837829589844, -30.518827438354492, -28.964820861816406, -27.410812377929688, -25.85680389404297, -24.30279541015625, -22.74878692626953, -21.194780349731445, -19.640771865844727, -18.086763381958008, -16.532756805419922, -14.978748321533203, -13.424739837646484, -11.870731353759766, -10.316723823547363, -8.762716293334961, -7.208707809448242, -5.654699802398682, -4.100691795349121, -2.5466842651367188, -0.9926795959472656, 0.5613284111022949, 2.1153364181518555, 3.669344425201416, 5.223352432250977, 6.777360439300537, 8.331368446350098, 9.8853759765625, 11.439384460449219, 12.993392944335938, 14.54740047454834, 16.101408004760742, 17.65541648864746, 19.20942497253418, 20.763431549072266, 22.317440032958984, 23.871448516845703, 25.425457000732422, 26.97946548461914, 28.533472061157227, 30.087480545043945, 31.641489028930664, 33.19549560546875, 34.74950408935547, 36.30351257324219, 37.857521057128906, 39.411529541015625, 40.965538024902344, 42.51954650878906, 44.073551177978516, 45.627559661865234, 47.18156814575195, 48.73557662963867]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 2.0, 6.0, 3.0, 3.0, 7.0, 11.0, 6.0, 15.0, 31.0, 48.0, 67.0, 88.0, 148.0, 225.0, 363.0, 678.0, 1193.0, 2135.0, 4108.0, 8890.0, 20901.0, 57902.0, 214192.0, 507823.0, 152526.0, 45019.0, 16755.0, 7395.0, 3594.0, 1886.0, 993.0, 582.0, 344.0, 237.0, 127.0, 88.0, 45.0, 36.0, 30.0, 19.0, 16.0, 4.0, 7.0, 9.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-37.625, -36.38671875, -35.1484375, -33.91015625, -32.671875, -31.43359375, -30.1953125, -28.95703125, -27.71875, -26.48046875, -25.2421875, -24.00390625, -22.765625, -21.52734375, -20.2890625, -19.05078125, -17.8125, -16.57421875, -15.3359375, -14.09765625, -12.859375, -11.62109375, -10.3828125, -9.14453125, -7.90625, -6.66796875, -5.4296875, -4.19140625, -2.953125, -1.71484375, -0.4765625, 0.76171875, 2.0, 3.23828125, 4.4765625, 5.71484375, 6.953125, 8.19140625, 9.4296875, 10.66796875, 11.90625, 13.14453125, 14.3828125, 15.62109375, 16.859375, 18.09765625, 19.3359375, 20.57421875, 21.8125, 23.05078125, 24.2890625, 25.52734375, 26.765625, 28.00390625, 29.2421875, 30.48046875, 31.71875, 32.95703125, 34.1953125, 35.43359375, 36.671875, 37.91015625, 39.1484375, 40.38671875, 41.625]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 4.0, 2.0, 4.0, 8.0, 11.0, 6.0, 18.0, 13.0, 16.0, 18.0, 31.0, 35.0, 30.0, 49.0, 45.0, 58.0, 39.0, 79.0, 62.0, 60.0, 53.0, 48.0, 47.0, 42.0, 47.0, 38.0, 24.0, 26.0, 16.0, 18.0, 9.0, 7.0, 10.0, 7.0, 6.0, 5.0, 2.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1796875, -3.06048583984375, -2.9412841796875, -2.82208251953125, -2.702880859375, -2.58367919921875, -2.4644775390625, -2.34527587890625, -2.22607421875, -2.10687255859375, -1.9876708984375, -1.86846923828125, -1.749267578125, -1.63006591796875, -1.5108642578125, -1.39166259765625, -1.2724609375, -1.15325927734375, -1.0340576171875, -0.91485595703125, -0.795654296875, -0.67645263671875, -0.5572509765625, -0.43804931640625, -0.31884765625, -0.19964599609375, -0.0804443359375, 0.03875732421875, 0.157958984375, 0.27716064453125, 0.3963623046875, 0.51556396484375, 0.634765625, 0.75396728515625, 0.8731689453125, 0.99237060546875, 1.111572265625, 1.23077392578125, 1.3499755859375, 1.46917724609375, 1.58837890625, 1.70758056640625, 1.8267822265625, 1.94598388671875, 2.065185546875, 2.18438720703125, 2.3035888671875, 2.42279052734375, 2.5419921875, 2.66119384765625, 2.7803955078125, 2.89959716796875, 3.018798828125, 3.13800048828125, 3.2572021484375, 3.37640380859375, 3.49560546875, 3.61480712890625, 3.7340087890625, 3.85321044921875, 3.972412109375, 4.09161376953125, 4.2108154296875, 4.33001708984375, 4.44921875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 2.0, 3.0, 4.0, 6.0, 9.0, 22.0, 17.0, 33.0, 40.0, 63.0, 96.0, 121.0, 165.0, 253.0, 354.0, 612.0, 949.0, 1513.0, 2461.0, 4382.0, 8330.0, 17251.0, 40466.0, 113147.0, 347714.0, 330326.0, 105384.0, 38766.0, 17003.0, 8217.0, 4411.0, 2410.0, 1456.0, 871.0, 557.0, 347.0, 235.0, 161.0, 126.0, 83.0, 51.0, 42.0, 34.0, 19.0, 17.0, 6.0, 11.0, 10.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-26.5, -25.719970703125, -24.93994140625, -24.159912109375, -23.3798828125, -22.599853515625, -21.81982421875, -21.039794921875, -20.259765625, -19.479736328125, -18.69970703125, -17.919677734375, -17.1396484375, -16.359619140625, -15.57958984375, -14.799560546875, -14.01953125, -13.239501953125, -12.45947265625, -11.679443359375, -10.8994140625, -10.119384765625, -9.33935546875, -8.559326171875, -7.779296875, -6.999267578125, -6.21923828125, -5.439208984375, -4.6591796875, -3.879150390625, -3.09912109375, -2.319091796875, -1.5390625, -0.759033203125, 0.02099609375, 0.801025390625, 1.5810546875, 2.361083984375, 3.14111328125, 3.921142578125, 4.701171875, 5.481201171875, 6.26123046875, 7.041259765625, 7.8212890625, 8.601318359375, 9.38134765625, 10.161376953125, 10.94140625, 11.721435546875, 12.50146484375, 13.281494140625, 14.0615234375, 14.841552734375, 15.62158203125, 16.401611328125, 17.181640625, 17.961669921875, 18.74169921875, 19.521728515625, 20.3017578125, 21.081787109375, 21.86181640625, 22.641845703125, 23.421875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 4.0, 6.0, 4.0, 9.0, 7.0, 4.0, 16.0, 16.0, 25.0, 26.0, 38.0, 32.0, 39.0, 36.0, 43.0, 59.0, 41.0, 42.0, 43.0, 46.0, 60.0, 46.0, 52.0, 39.0, 36.0, 41.0, 28.0, 34.0, 17.0, 21.0, 18.0, 14.0, 12.0, 11.0, 5.0, 6.0, 7.0, 6.0, 2.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-19.359375, -18.78955078125, -18.2197265625, -17.64990234375, -17.080078125, -16.51025390625, -15.9404296875, -15.37060546875, -14.80078125, -14.23095703125, -13.6611328125, -13.09130859375, -12.521484375, -11.95166015625, -11.3818359375, -10.81201171875, -10.2421875, -9.67236328125, -9.1025390625, -8.53271484375, -7.962890625, -7.39306640625, -6.8232421875, -6.25341796875, -5.68359375, -5.11376953125, -4.5439453125, -3.97412109375, -3.404296875, -2.83447265625, -2.2646484375, -1.69482421875, -1.125, -0.55517578125, 0.0146484375, 0.58447265625, 1.154296875, 1.72412109375, 2.2939453125, 2.86376953125, 3.43359375, 4.00341796875, 4.5732421875, 5.14306640625, 5.712890625, 6.28271484375, 6.8525390625, 7.42236328125, 7.9921875, 8.56201171875, 9.1318359375, 9.70166015625, 10.271484375, 10.84130859375, 11.4111328125, 11.98095703125, 12.55078125, 13.12060546875, 13.6904296875, 14.26025390625, 14.830078125, 15.39990234375, 15.9697265625, 16.53955078125, 17.109375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 4.0, 6.0, 5.0, 21.0, 22.0, 43.0, 55.0, 57.0, 123.0, 236.0, 409.0, 692.0, 1393.0, 2681.0, 5602.0, 13428.0, 39563.0, 148481.0, 448630.0, 278386.0, 71060.0, 21544.0, 8201.0, 3777.0, 1856.0, 974.0, 516.0, 306.0, 187.0, 112.0, 52.0, 46.0, 23.0, 23.0, 17.0, 10.0, 2.0, 3.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.9375, -26.088623046875, -25.23974609375, -24.390869140625, -23.5419921875, -22.693115234375, -21.84423828125, -20.995361328125, -20.146484375, -19.297607421875, -18.44873046875, -17.599853515625, -16.7509765625, -15.902099609375, -15.05322265625, -14.204345703125, -13.35546875, -12.506591796875, -11.65771484375, -10.808837890625, -9.9599609375, -9.111083984375, -8.26220703125, -7.413330078125, -6.564453125, -5.715576171875, -4.86669921875, -4.017822265625, -3.1689453125, -2.320068359375, -1.47119140625, -0.622314453125, 0.2265625, 1.075439453125, 1.92431640625, 2.773193359375, 3.6220703125, 4.470947265625, 5.31982421875, 6.168701171875, 7.017578125, 7.866455078125, 8.71533203125, 9.564208984375, 10.4130859375, 11.261962890625, 12.11083984375, 12.959716796875, 13.80859375, 14.657470703125, 15.50634765625, 16.355224609375, 17.2041015625, 18.052978515625, 18.90185546875, 19.750732421875, 20.599609375, 21.448486328125, 22.29736328125, 23.146240234375, 23.9951171875, 24.843994140625, 25.69287109375, 26.541748046875, 27.390625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 2.0, 1.0, 4.0, 4.0, 9.0, 4.0, 10.0, 22.0, 79.0, 256.0, 344.0, 163.0, 47.0, 22.0, 16.0, 3.0, 2.0, 3.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004444122314453125, -0.0043215155601501465, -0.004198908805847168, -0.0040763020515441895, -0.003953695297241211, -0.0038310885429382324, -0.003708481788635254, -0.0035858750343322754, -0.003463268280029297, -0.0033406615257263184, -0.00321805477142334, -0.0030954480171203613, -0.002972841262817383, -0.0028502345085144043, -0.0027276277542114258, -0.0026050209999084473, -0.0024824142456054688, -0.0023598074913024902, -0.0022372007369995117, -0.002114593982696533, -0.0019919872283935547, -0.0018693804740905762, -0.0017467737197875977, -0.0016241669654846191, -0.0015015602111816406, -0.0013789534568786621, -0.0012563467025756836, -0.001133739948272705, -0.0010111331939697266, -0.000888526439666748, -0.0007659196853637695, -0.000643312931060791, -0.0005207061767578125, -0.000398099422454834, -0.00027549266815185547, -0.00015288591384887695, -3.0279159545898438e-05, 9.232759475708008e-05, 0.0002149343490600586, 0.0003375411033630371, 0.0004601478576660156, 0.0005827546119689941, 0.0007053613662719727, 0.0008279681205749512, 0.0009505748748779297, 0.0010731816291809082, 0.0011957883834838867, 0.0013183951377868652, 0.0014410018920898438, 0.0015636086463928223, 0.0016862154006958008, 0.0018088221549987793, 0.0019314289093017578, 0.0020540356636047363, 0.002176642417907715, 0.0022992491722106934, 0.002421855926513672, 0.0025444626808166504, 0.002667069435119629, 0.0027896761894226074, 0.002912282943725586, 0.0030348896980285645, 0.003157496452331543, 0.0032801032066345215, 0.0034027099609375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 5.0, 6.0, 7.0, 16.0, 16.0, 28.0, 33.0, 44.0, 72.0, 110.0, 147.0, 255.0, 443.0, 716.0, 1230.0, 2151.0, 4195.0, 8778.0, 19444.0, 50661.0, 150047.0, 361200.0, 284194.0, 100473.0, 35724.0, 14292.0, 6669.0, 3276.0, 1725.0, 993.0, 585.0, 357.0, 206.0, 140.0, 112.0, 56.0, 37.0, 21.0, 25.0, 22.0, 12.0, 8.0, 8.0, 8.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.265625, -21.51904296875, -20.7724609375, -20.02587890625, -19.279296875, -18.53271484375, -17.7861328125, -17.03955078125, -16.29296875, -15.54638671875, -14.7998046875, -14.05322265625, -13.306640625, -12.56005859375, -11.8134765625, -11.06689453125, -10.3203125, -9.57373046875, -8.8271484375, -8.08056640625, -7.333984375, -6.58740234375, -5.8408203125, -5.09423828125, -4.34765625, -3.60107421875, -2.8544921875, -2.10791015625, -1.361328125, -0.61474609375, 0.1318359375, 0.87841796875, 1.625, 2.37158203125, 3.1181640625, 3.86474609375, 4.611328125, 5.35791015625, 6.1044921875, 6.85107421875, 7.59765625, 8.34423828125, 9.0908203125, 9.83740234375, 10.583984375, 11.33056640625, 12.0771484375, 12.82373046875, 13.5703125, 14.31689453125, 15.0634765625, 15.81005859375, 16.556640625, 17.30322265625, 18.0498046875, 18.79638671875, 19.54296875, 20.28955078125, 21.0361328125, 21.78271484375, 22.529296875, 23.27587890625, 24.0224609375, 24.76904296875, 25.515625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 7.0, 3.0, 6.0, 4.0, 9.0, 9.0, 7.0, 17.0, 13.0, 16.0, 30.0, 30.0, 34.0, 40.0, 65.0, 56.0, 75.0, 78.0, 67.0, 84.0, 62.0, 58.0, 40.0, 28.0, 27.0, 36.0, 20.0, 13.0, 11.0, 15.0, 11.0, 6.0, 7.0, 2.0, 8.0, 3.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.4765625, -11.0697021484375, -10.662841796875, -10.2559814453125, -9.84912109375, -9.4422607421875, -9.035400390625, -8.6285400390625, -8.2216796875, -7.8148193359375, -7.407958984375, -7.0010986328125, -6.59423828125, -6.1873779296875, -5.780517578125, -5.3736572265625, -4.966796875, -4.5599365234375, -4.153076171875, -3.7462158203125, -3.33935546875, -2.9324951171875, -2.525634765625, -2.1187744140625, -1.7119140625, -1.3050537109375, -0.898193359375, -0.4913330078125, -0.08447265625, 0.3223876953125, 0.729248046875, 1.1361083984375, 1.54296875, 1.9498291015625, 2.356689453125, 2.7635498046875, 3.17041015625, 3.5772705078125, 3.984130859375, 4.3909912109375, 4.7978515625, 5.2047119140625, 5.611572265625, 6.0184326171875, 6.42529296875, 6.8321533203125, 7.239013671875, 7.6458740234375, 8.052734375, 8.4595947265625, 8.866455078125, 9.2733154296875, 9.68017578125, 10.0870361328125, 10.493896484375, 10.9007568359375, 11.3076171875, 11.7144775390625, 12.121337890625, 12.5281982421875, 12.93505859375, 13.3419189453125, 13.748779296875, 14.1556396484375, 14.5625]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 5.0, 4.0, 6.0, 3.0, 17.0, 33.0, 58.0, 114.0, 178.0, 199.0, 142.0, 114.0, 57.0, 34.0, 27.0, 10.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-350.56793212890625, -341.4657287597656, -332.363525390625, -323.26129150390625, -314.1590881347656, -305.056884765625, -295.9546813964844, -286.85247802734375, -277.750244140625, -268.6480407714844, -259.54583740234375, -250.44361877441406, -241.34140014648438, -232.23919677734375, -223.13699340820312, -214.0347900390625, -204.93258666992188, -195.83038330078125, -186.72816467285156, -177.62596130371094, -168.52374267578125, -159.42153930664062, -150.3193359375, -141.21713256835938, -132.1149139404297, -123.01270294189453, -113.91049194335938, -104.80828857421875, -95.7060775756836, -86.60386657714844, -77.50166320800781, -68.39945220947266, -59.2972412109375, -50.195030212402344, -41.09282302856445, -31.99061393737793, -22.888404846191406, -13.78619384765625, -4.683986663818359, 4.418220520019531, 13.520431518554688, 22.62264060974121, 31.724849700927734, 40.827056884765625, 49.92926788330078, 59.03147888183594, 68.13368225097656, 77.23589324951172, 86.33810424804688, 95.44031524658203, 104.54252624511719, 113.64472961425781, 122.74694061279297, 131.84915161132812, 140.95135498046875, 150.05355834960938, 159.15577697753906, 168.2579803466797, 177.36019897460938, 186.46240234375, 195.56460571289062, 204.6668243408203, 213.76902770996094, 222.87124633789062, 231.97344970703125]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 3.0, 4.0, 5.0, 12.0, 25.0, 25.0, 33.0, 41.0, 58.0, 54.0, 68.0, 76.0, 70.0, 54.0, 78.0, 63.0, 70.0, 54.0, 43.0, 33.0, 35.0, 20.0, 17.0, 20.0, 9.0, 5.0, 5.0, 5.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-198.04751586914062, -192.46629333496094, -186.8850555419922, -181.3038330078125, -175.7226104736328, -170.14137268066406, -164.56015014648438, -158.97891235351562, -153.39768981933594, -147.81646728515625, -142.2352294921875, -136.6540069580078, -131.07278442382812, -125.49154663085938, -119.91032409667969, -114.32909393310547, -108.74787139892578, -103.16664123535156, -97.58541870117188, -92.00418853759766, -86.42295837402344, -80.84173583984375, -75.26050567626953, -69.67927551269531, -64.09805297851562, -58.51682662963867, -52.93559646606445, -47.3543701171875, -41.77313995361328, -36.19191360473633, -30.610687255859375, -25.029457092285156, -19.448226928710938, -13.866998672485352, -8.285771369934082, -2.7045440673828125, 2.8766841888427734, 8.45791244506836, 14.039138793945312, 19.62036895751953, 25.201595306396484, 30.78282356262207, 36.364051818847656, 41.94527816772461, 47.52650451660156, 53.10773468017578, 58.688961029052734, 64.27018737792969, 69.8514175415039, 75.43264770507812, 81.01387023925781, 86.59510040283203, 92.17633056640625, 97.75755310058594, 103.33878326416016, 108.92001342773438, 114.50123596191406, 120.08246612548828, 125.66368865966797, 131.2449188232422, 136.82614135742188, 142.40737915039062, 147.9886016845703, 153.56982421875, 159.15106201171875]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 4.0, 6.0, 16.0, 21.0, 32.0, 56.0, 105.0, 125.0, 210.0, 360.0, 607.0, 1004.0, 1752.0, 3162.0, 5975.0, 12526.0, 31135.0, 114423.0, 3300206.0, 607747.0, 71379.0, 22799.0, 9727.0, 4724.0, 2567.0, 1418.0, 767.0, 503.0, 299.0, 193.0, 138.0, 92.0, 55.0, 39.0, 24.0, 21.0, 18.0, 13.0, 10.0, 7.0, 3.0, 4.0, 2.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-64.125, -61.189453125, -58.25390625, -55.318359375, -52.3828125, -49.447265625, -46.51171875, -43.576171875, -40.640625, -37.705078125, -34.76953125, -31.833984375, -28.8984375, -25.962890625, -23.02734375, -20.091796875, -17.15625, -14.220703125, -11.28515625, -8.349609375, -5.4140625, -2.478515625, 0.45703125, 3.392578125, 6.328125, 9.263671875, 12.19921875, 15.134765625, 18.0703125, 21.005859375, 23.94140625, 26.876953125, 29.8125, 32.748046875, 35.68359375, 38.619140625, 41.5546875, 44.490234375, 47.42578125, 50.361328125, 53.296875, 56.232421875, 59.16796875, 62.103515625, 65.0390625, 67.974609375, 70.91015625, 73.845703125, 76.78125, 79.716796875, 82.65234375, 85.587890625, 88.5234375, 91.458984375, 94.39453125, 97.330078125, 100.265625, 103.201171875, 106.13671875, 109.072265625, 112.0078125, 114.943359375, 117.87890625, 120.814453125, 123.75]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 4.0, 5.0, 11.0, 3.0, 7.0, 4.0, 10.0, 21.0, 20.0, 17.0, 22.0, 28.0, 25.0, 38.0, 31.0, 44.0, 52.0, 72.0, 55.0, 61.0, 67.0, 46.0, 55.0, 47.0, 37.0, 38.0, 30.0, 27.0, 18.0, 24.0, 14.0, 13.0, 10.0, 12.0, 8.0, 6.0, 5.0, 4.0, 4.0, 2.0, 1.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.37890625, -3.2603759765625, -3.141845703125, -3.0233154296875, -2.90478515625, -2.7862548828125, -2.667724609375, -2.5491943359375, -2.4306640625, -2.3121337890625, -2.193603515625, -2.0750732421875, -1.95654296875, -1.8380126953125, -1.719482421875, -1.6009521484375, -1.482421875, -1.3638916015625, -1.245361328125, -1.1268310546875, -1.00830078125, -0.8897705078125, -0.771240234375, -0.6527099609375, -0.5341796875, -0.4156494140625, -0.297119140625, -0.1785888671875, -0.06005859375, 0.0584716796875, 0.177001953125, 0.2955322265625, 0.4140625, 0.5325927734375, 0.651123046875, 0.7696533203125, 0.88818359375, 1.0067138671875, 1.125244140625, 1.2437744140625, 1.3623046875, 1.4808349609375, 1.599365234375, 1.7178955078125, 1.83642578125, 1.9549560546875, 2.073486328125, 2.1920166015625, 2.310546875, 2.4290771484375, 2.547607421875, 2.6661376953125, 2.78466796875, 2.9031982421875, 3.021728515625, 3.1402587890625, 3.2587890625, 3.3773193359375, 3.495849609375, 3.6143798828125, 3.73291015625, 3.8514404296875, 3.969970703125, 4.0885009765625, 4.20703125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 4.0, 1.0, 4.0, 5.0, 4.0, 10.0, 6.0, 17.0, 21.0, 38.0, 70.0, 122.0, 204.0, 589.0, 2484.0, 28320.0, 3661343.0, 487179.0, 11536.0, 1464.0, 404.0, 183.0, 92.0, 60.0, 30.0, 23.0, 22.0, 12.0, 15.0, 5.0, 5.0, 7.0, 2.0, 2.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-282.5, -274.619140625, -266.73828125, -258.857421875, -250.9765625, -243.095703125, -235.21484375, -227.333984375, -219.453125, -211.572265625, -203.69140625, -195.810546875, -187.9296875, -180.048828125, -172.16796875, -164.287109375, -156.40625, -148.525390625, -140.64453125, -132.763671875, -124.8828125, -117.001953125, -109.12109375, -101.240234375, -93.359375, -85.478515625, -77.59765625, -69.716796875, -61.8359375, -53.955078125, -46.07421875, -38.193359375, -30.3125, -22.431640625, -14.55078125, -6.669921875, 1.2109375, 9.091796875, 16.97265625, 24.853515625, 32.734375, 40.615234375, 48.49609375, 56.376953125, 64.2578125, 72.138671875, 80.01953125, 87.900390625, 95.78125, 103.662109375, 111.54296875, 119.423828125, 127.3046875, 135.185546875, 143.06640625, 150.947265625, 158.828125, 166.708984375, 174.58984375, 182.470703125, 190.3515625, 198.232421875, 206.11328125, 213.994140625, 221.875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 5.0, 3.0, 6.0, 10.0, 5.0, 13.0, 17.0, 16.0, 31.0, 33.0, 40.0, 43.0, 71.0, 112.0, 155.0, 259.0, 601.0, 1521.0, 448.0, 202.0, 156.0, 97.0, 54.0, 49.0, 38.0, 21.0, 15.0, 16.0, 10.0, 9.0, 5.0, 2.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.1328125, -9.76171875, -9.390625, -9.01953125, -8.6484375, -8.27734375, -7.90625, -7.53515625, -7.1640625, -6.79296875, -6.421875, -6.05078125, -5.6796875, -5.30859375, -4.9375, -4.56640625, -4.1953125, -3.82421875, -3.453125, -3.08203125, -2.7109375, -2.33984375, -1.96875, -1.59765625, -1.2265625, -0.85546875, -0.484375, -0.11328125, 0.2578125, 0.62890625, 1.0, 1.37109375, 1.7421875, 2.11328125, 2.484375, 2.85546875, 3.2265625, 3.59765625, 3.96875, 4.33984375, 4.7109375, 5.08203125, 5.453125, 5.82421875, 6.1953125, 6.56640625, 6.9375, 7.30859375, 7.6796875, 8.05078125, 8.421875, 8.79296875, 9.1640625, 9.53515625, 9.90625, 10.27734375, 10.6484375, 11.01953125, 11.390625, 11.76171875, 12.1328125, 12.50390625, 12.875, 13.24609375, 13.6171875]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 6.0, 4.0, 9.0, 10.0, 16.0, 17.0, 57.0, 60.0, 78.0, 129.0, 136.0, 135.0, 109.0, 77.0, 54.0, 37.0, 28.0, 17.0, 11.0, 4.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-132.81887817382812, -129.49375915527344, -126.16864776611328, -122.8435287475586, -119.5184097290039, -116.19329833984375, -112.86817932128906, -109.54306030273438, -106.21794891357422, -102.89282989501953, -99.56771850585938, -96.24259948730469, -92.91748046875, -89.59236907958984, -86.26725006103516, -82.942138671875, -79.61701965332031, -76.29190063476562, -72.96678924560547, -69.64167022705078, -66.3165512084961, -62.99143981933594, -59.66632080078125, -56.34120559692383, -53.016082763671875, -49.69096755981445, -46.365848541259766, -43.040733337402344, -39.71561813354492, -36.3905029296875, -33.06538391113281, -29.74026870727539, -26.41515350341797, -23.090036392211914, -19.764921188354492, -16.439804077148438, -13.1146879196167, -9.789571762084961, -6.464454650878906, -3.1393394470214844, 0.1857776641845703, 3.5108940601348877, 6.836010456085205, 10.161127090454102, 13.48624324798584, 16.811359405517578, 20.136476516723633, 23.461591720581055, 26.78670883178711, 30.111825942993164, 33.43694305419922, 36.76205825805664, 40.08717346191406, 43.41229248046875, 46.73740768432617, 50.062522888183594, 53.38764190673828, 56.7127571105957, 60.03787612915039, 63.36299133300781, 66.6881103515625, 70.01322174072266, 73.33834075927734, 76.6634521484375, 79.98857116699219]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 1.0, 6.0, 3.0, 9.0, 7.0, 14.0, 8.0, 10.0, 24.0, 51.0, 39.0, 28.0, 49.0, 37.0, 41.0, 66.0, 57.0, 61.0, 54.0, 50.0, 63.0, 33.0, 54.0, 34.0, 39.0, 27.0, 36.0, 14.0, 18.0, 15.0, 12.0, 8.0, 9.0, 5.0, 5.0, 4.0, 4.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-69.30204772949219, -67.49097442626953, -65.6799087524414, -63.868839263916016, -62.057769775390625, -60.24669647216797, -58.435630798339844, -56.62455749511719, -54.8134880065918, -53.002418518066406, -51.191349029541016, -49.380279541015625, -47.569210052490234, -45.758140563964844, -43.94706726074219, -42.1359977722168, -40.324928283691406, -38.513858795166016, -36.702789306640625, -34.891719818115234, -33.080650329589844, -31.26957893371582, -29.45850944519043, -27.647438049316406, -25.83637237548828, -24.02530288696289, -22.2142333984375, -20.40316390991211, -18.592092514038086, -16.781023025512695, -14.969953536987305, -13.158883094787598, -11.34781265258789, -9.5367431640625, -7.725672721862793, -5.914603233337402, -4.1035332679748535, -2.2924633026123047, -0.48139381408691406, 1.329676628112793, 3.1407461166381836, 4.951816082000732, 6.762886047363281, 8.573955535888672, 10.385025024414062, 12.19609546661377, 14.00716495513916, 15.818235397338867, 17.629304885864258, 19.44037437438965, 21.25144386291504, 23.062515258789062, 24.873584747314453, 26.684654235839844, 28.495723724365234, 30.306793212890625, 32.117862701416016, 33.928932189941406, 35.7400016784668, 37.55107116699219, 39.36214065551758, 41.17321014404297, 42.984283447265625, 44.795352935791016, 46.606422424316406]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 4.0, 7.0, 7.0, 15.0, 17.0, 26.0, 38.0, 51.0, 92.0, 118.0, 179.0, 275.0, 450.0, 767.0, 1181.0, 1983.0, 3383.0, 5638.0, 9803.0, 17019.0, 29433.0, 51655.0, 88089.0, 142370.0, 194851.0, 185543.0, 128926.0, 78426.0, 45228.0, 26075.0, 15094.0, 8738.0, 5128.0, 3111.0, 1775.0, 1139.0, 678.0, 436.0, 266.0, 197.0, 107.0, 82.0, 46.0, 32.0, 32.0, 16.0, 10.0, 12.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-27.328125, -26.47119140625, -25.6142578125, -24.75732421875, -23.900390625, -23.04345703125, -22.1865234375, -21.32958984375, -20.47265625, -19.61572265625, -18.7587890625, -17.90185546875, -17.044921875, -16.18798828125, -15.3310546875, -14.47412109375, -13.6171875, -12.76025390625, -11.9033203125, -11.04638671875, -10.189453125, -9.33251953125, -8.4755859375, -7.61865234375, -6.76171875, -5.90478515625, -5.0478515625, -4.19091796875, -3.333984375, -2.47705078125, -1.6201171875, -0.76318359375, 0.09375, 0.95068359375, 1.8076171875, 2.66455078125, 3.521484375, 4.37841796875, 5.2353515625, 6.09228515625, 6.94921875, 7.80615234375, 8.6630859375, 9.52001953125, 10.376953125, 11.23388671875, 12.0908203125, 12.94775390625, 13.8046875, 14.66162109375, 15.5185546875, 16.37548828125, 17.232421875, 18.08935546875, 18.9462890625, 19.80322265625, 20.66015625, 21.51708984375, 22.3740234375, 23.23095703125, 24.087890625, 24.94482421875, 25.8017578125, 26.65869140625, 27.515625]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 6.0, 0.0, 2.0, 6.0, 6.0, 5.0, 6.0, 8.0, 10.0, 9.0, 13.0, 8.0, 24.0, 32.0, 27.0, 29.0, 41.0, 32.0, 47.0, 36.0, 46.0, 45.0, 53.0, 50.0, 68.0, 48.0, 41.0, 41.0, 37.0, 34.0, 33.0, 26.0, 25.0, 20.0, 17.0, 14.0, 16.0, 8.0, 14.0, 11.0, 6.0, 3.0, 6.0, 1.0, 2.0, 0.0, 1.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.029296875, -2.913848876953125, -2.79840087890625, -2.682952880859375, -2.5675048828125, -2.452056884765625, -2.33660888671875, -2.221160888671875, -2.105712890625, -1.990264892578125, -1.87481689453125, -1.759368896484375, -1.6439208984375, -1.528472900390625, -1.41302490234375, -1.297576904296875, -1.18212890625, -1.066680908203125, -0.95123291015625, -0.835784912109375, -0.7203369140625, -0.604888916015625, -0.48944091796875, -0.373992919921875, -0.258544921875, -0.143096923828125, -0.02764892578125, 0.087799072265625, 0.2032470703125, 0.318695068359375, 0.43414306640625, 0.549591064453125, 0.6650390625, 0.780487060546875, 0.89593505859375, 1.011383056640625, 1.1268310546875, 1.242279052734375, 1.35772705078125, 1.473175048828125, 1.588623046875, 1.704071044921875, 1.81951904296875, 1.934967041015625, 2.0504150390625, 2.165863037109375, 2.28131103515625, 2.396759033203125, 2.51220703125, 2.627655029296875, 2.74310302734375, 2.858551025390625, 2.9739990234375, 3.089447021484375, 3.20489501953125, 3.320343017578125, 3.435791015625, 3.551239013671875, 3.66668701171875, 3.782135009765625, 3.8975830078125, 4.013031005859375, 4.12847900390625, 4.243927001953125, 4.359375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 6.0, 5.0, 12.0, 13.0, 9.0, 33.0, 51.0, 85.0, 115.0, 175.0, 261.0, 399.0, 664.0, 1200.0, 2153.0, 4302.0, 9403.0, 21622.0, 52695.0, 130818.0, 274632.0, 294217.0, 149394.0, 60811.0, 24408.0, 10490.0, 4789.0, 2441.0, 1354.0, 767.0, 459.0, 249.0, 189.0, 118.0, 83.0, 57.0, 33.0, 13.0, 12.0, 10.0, 5.0, 3.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-44.09375, -42.5234375, -40.953125, -39.3828125, -37.8125, -36.2421875, -34.671875, -33.1015625, -31.53125, -29.9609375, -28.390625, -26.8203125, -25.25, -23.6796875, -22.109375, -20.5390625, -18.96875, -17.3984375, -15.828125, -14.2578125, -12.6875, -11.1171875, -9.546875, -7.9765625, -6.40625, -4.8359375, -3.265625, -1.6953125, -0.125, 1.4453125, 3.015625, 4.5859375, 6.15625, 7.7265625, 9.296875, 10.8671875, 12.4375, 14.0078125, 15.578125, 17.1484375, 18.71875, 20.2890625, 21.859375, 23.4296875, 25.0, 26.5703125, 28.140625, 29.7109375, 31.28125, 32.8515625, 34.421875, 35.9921875, 37.5625, 39.1328125, 40.703125, 42.2734375, 43.84375, 45.4140625, 46.984375, 48.5546875, 50.125, 51.6953125, 53.265625, 54.8359375, 56.40625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 7.0, 4.0, 5.0, 8.0, 17.0, 15.0, 22.0, 14.0, 27.0, 21.0, 32.0, 41.0, 38.0, 32.0, 39.0, 45.0, 44.0, 41.0, 44.0, 54.0, 55.0, 47.0, 39.0, 49.0, 37.0, 33.0, 36.0, 39.0, 23.0, 23.0, 13.0, 17.0, 12.0, 9.0, 5.0, 9.0, 4.0, 7.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.671875, -28.717529296875, -27.76318359375, -26.808837890625, -25.8544921875, -24.900146484375, -23.94580078125, -22.991455078125, -22.037109375, -21.082763671875, -20.12841796875, -19.174072265625, -18.2197265625, -17.265380859375, -16.31103515625, -15.356689453125, -14.40234375, -13.447998046875, -12.49365234375, -11.539306640625, -10.5849609375, -9.630615234375, -8.67626953125, -7.721923828125, -6.767578125, -5.813232421875, -4.85888671875, -3.904541015625, -2.9501953125, -1.995849609375, -1.04150390625, -0.087158203125, 0.8671875, 1.821533203125, 2.77587890625, 3.730224609375, 4.6845703125, 5.638916015625, 6.59326171875, 7.547607421875, 8.501953125, 9.456298828125, 10.41064453125, 11.364990234375, 12.3193359375, 13.273681640625, 14.22802734375, 15.182373046875, 16.13671875, 17.091064453125, 18.04541015625, 18.999755859375, 19.9541015625, 20.908447265625, 21.86279296875, 22.817138671875, 23.771484375, 24.725830078125, 25.68017578125, 26.634521484375, 27.5888671875, 28.543212890625, 29.49755859375, 30.451904296875, 31.40625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 0.0, 5.0, 3.0, 3.0, 4.0, 10.0, 11.0, 6.0, 17.0, 35.0, 31.0, 37.0, 70.0, 126.0, 188.0, 296.0, 500.0, 843.0, 1658.0, 3116.0, 6551.0, 14612.0, 38516.0, 116028.0, 316228.0, 341508.0, 133058.0, 43951.0, 16620.0, 7114.0, 3306.0, 1729.0, 929.0, 554.0, 309.0, 195.0, 128.0, 89.0, 60.0, 32.0, 21.0, 13.0, 14.0, 10.0, 8.0, 6.0, 10.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-41.625, -40.470703125, -39.31640625, -38.162109375, -37.0078125, -35.853515625, -34.69921875, -33.544921875, -32.390625, -31.236328125, -30.08203125, -28.927734375, -27.7734375, -26.619140625, -25.46484375, -24.310546875, -23.15625, -22.001953125, -20.84765625, -19.693359375, -18.5390625, -17.384765625, -16.23046875, -15.076171875, -13.921875, -12.767578125, -11.61328125, -10.458984375, -9.3046875, -8.150390625, -6.99609375, -5.841796875, -4.6875, -3.533203125, -2.37890625, -1.224609375, -0.0703125, 1.083984375, 2.23828125, 3.392578125, 4.546875, 5.701171875, 6.85546875, 8.009765625, 9.1640625, 10.318359375, 11.47265625, 12.626953125, 13.78125, 14.935546875, 16.08984375, 17.244140625, 18.3984375, 19.552734375, 20.70703125, 21.861328125, 23.015625, 24.169921875, 25.32421875, 26.478515625, 27.6328125, 28.787109375, 29.94140625, 31.095703125, 32.25]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 7.0, 11.0, 5.0, 11.0, 16.0, 16.0, 23.0, 24.0, 49.0, 69.0, 83.0, 113.0, 133.0, 125.0, 101.0, 53.0, 51.0, 44.0, 26.0, 14.0, 8.0, 11.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006343841552734375, -0.006120145320892334, -0.005896449089050293, -0.005672752857208252, -0.005449056625366211, -0.00522536039352417, -0.005001664161682129, -0.004777967929840088, -0.004554271697998047, -0.004330575466156006, -0.004106879234313965, -0.003883183002471924, -0.003659486770629883, -0.003435790538787842, -0.0032120943069458008, -0.0029883980751037598, -0.0027647018432617188, -0.0025410056114196777, -0.0023173093795776367, -0.0020936131477355957, -0.0018699169158935547, -0.0016462206840515137, -0.0014225244522094727, -0.0011988282203674316, -0.0009751319885253906, -0.0007514357566833496, -0.0005277395248413086, -0.0003040432929992676, -8.034706115722656e-05, 0.00014334917068481445, 0.00036704540252685547, 0.0005907416343688965, 0.0008144378662109375, 0.0010381340980529785, 0.0012618303298950195, 0.0014855265617370605, 0.0017092227935791016, 0.0019329190254211426, 0.0021566152572631836, 0.0023803114891052246, 0.0026040077209472656, 0.0028277039527893066, 0.0030514001846313477, 0.0032750964164733887, 0.0034987926483154297, 0.0037224888801574707, 0.003946185111999512, 0.004169881343841553, 0.004393577575683594, 0.004617273807525635, 0.004840970039367676, 0.005064666271209717, 0.005288362503051758, 0.005512058734893799, 0.00573575496673584, 0.005959451198577881, 0.006183147430419922, 0.006406843662261963, 0.006630539894104004, 0.006854236125946045, 0.007077932357788086, 0.007301628589630127, 0.007525324821472168, 0.007749021053314209, 0.00797271728515625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 5.0, 7.0, 13.0, 9.0, 20.0, 20.0, 43.0, 40.0, 63.0, 80.0, 131.0, 194.0, 286.0, 445.0, 744.0, 1276.0, 2413.0, 4887.0, 10953.0, 26766.0, 73726.0, 213600.0, 374729.0, 214840.0, 74320.0, 26965.0, 11078.0, 4971.0, 2475.0, 1377.0, 739.0, 474.0, 287.0, 188.0, 104.0, 75.0, 58.0, 46.0, 26.0, 19.0, 19.0, 12.0, 12.0, 9.0, 6.0, 7.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-34.3125, -33.2568359375, -32.201171875, -31.1455078125, -30.08984375, -29.0341796875, -27.978515625, -26.9228515625, -25.8671875, -24.8115234375, -23.755859375, -22.7001953125, -21.64453125, -20.5888671875, -19.533203125, -18.4775390625, -17.421875, -16.3662109375, -15.310546875, -14.2548828125, -13.19921875, -12.1435546875, -11.087890625, -10.0322265625, -8.9765625, -7.9208984375, -6.865234375, -5.8095703125, -4.75390625, -3.6982421875, -2.642578125, -1.5869140625, -0.53125, 0.5244140625, 1.580078125, 2.6357421875, 3.69140625, 4.7470703125, 5.802734375, 6.8583984375, 7.9140625, 8.9697265625, 10.025390625, 11.0810546875, 12.13671875, 13.1923828125, 14.248046875, 15.3037109375, 16.359375, 17.4150390625, 18.470703125, 19.5263671875, 20.58203125, 21.6376953125, 22.693359375, 23.7490234375, 24.8046875, 25.8603515625, 26.916015625, 27.9716796875, 29.02734375, 30.0830078125, 31.138671875, 32.1943359375, 33.25]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 6.0, 3.0, 12.0, 12.0, 18.0, 23.0, 21.0, 31.0, 57.0, 51.0, 61.0, 59.0, 73.0, 82.0, 81.0, 78.0, 53.0, 68.0, 54.0, 30.0, 31.0, 17.0, 12.0, 8.0, 13.0, 15.0, 11.0, 9.0, 6.0, 5.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.859375, -19.1953125, -18.53125, -17.8671875, -17.203125, -16.5390625, -15.875, -15.2109375, -14.546875, -13.8828125, -13.21875, -12.5546875, -11.890625, -11.2265625, -10.5625, -9.8984375, -9.234375, -8.5703125, -7.90625, -7.2421875, -6.578125, -5.9140625, -5.25, -4.5859375, -3.921875, -3.2578125, -2.59375, -1.9296875, -1.265625, -0.6015625, 0.0625, 0.7265625, 1.390625, 2.0546875, 2.71875, 3.3828125, 4.046875, 4.7109375, 5.375, 6.0390625, 6.703125, 7.3671875, 8.03125, 8.6953125, 9.359375, 10.0234375, 10.6875, 11.3515625, 12.015625, 12.6796875, 13.34375, 14.0078125, 14.671875, 15.3359375, 16.0, 16.6640625, 17.328125, 17.9921875, 18.65625, 19.3203125, 19.984375, 20.6484375, 21.3125, 21.9765625, 22.640625]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 3.0, 6.0, 16.0, 19.0, 65.0, 109.0, 162.0, 180.0, 165.0, 112.0, 72.0, 46.0, 17.0, 13.0, 5.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0], "bins": [-812.5789794921875, -795.4837036132812, -778.388427734375, -761.2930908203125, -744.1978149414062, -727.1025390625, -710.0072631835938, -692.9119873046875, -675.816650390625, -658.7213745117188, -641.6260986328125, -624.53076171875, -607.4354858398438, -590.3402099609375, -573.2449340820312, -556.149658203125, -539.0543823242188, -521.9591064453125, -504.8638000488281, -487.7685241699219, -470.6732177734375, -453.57794189453125, -436.482666015625, -419.38739013671875, -402.2920837402344, -385.1968078613281, -368.10150146484375, -351.0062255859375, -333.91094970703125, -316.8156433105469, -299.7203674316406, -282.62506103515625, -265.5298156738281, -248.4345245361328, -231.3392333984375, -214.24395751953125, -197.14866638183594, -180.05337524414062, -162.95809936523438, -145.86280822753906, -128.76751708984375, -111.67222595214844, -94.57694244384766, -77.48165893554688, -60.38636779785156, -43.29107666015625, -26.19579315185547, -9.100509643554688, 7.994781494140625, 25.090068817138672, 42.18535614013672, 59.280643463134766, 76.37593078613281, 93.47122192382812, 110.5665054321289, 127.66178894042969, 144.757080078125, 161.8523712158203, 178.94766235351562, 196.04293823242188, 213.1382293701172, 230.2335205078125, 247.32879638671875, 264.424072265625, 281.5193786621094]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 4.0, 0.0, 2.0, 8.0, 7.0, 13.0, 16.0, 17.0, 21.0, 23.0, 39.0, 28.0, 44.0, 47.0, 51.0, 54.0, 55.0, 53.0, 59.0, 55.0, 59.0, 54.0, 31.0, 34.0, 32.0, 38.0, 30.0, 19.0, 24.0, 17.0, 15.0, 9.0, 9.0, 11.0, 6.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-261.23870849609375, -253.67898559570312, -246.1192626953125, -238.55953979492188, -230.9998016357422, -223.44007873535156, -215.88035583496094, -208.3206329345703, -200.76089477539062, -193.201171875, -185.64144897460938, -178.08172607421875, -170.52198791503906, -162.96226501464844, -155.4025421142578, -147.8428192138672, -140.28309631347656, -132.72337341308594, -125.16364288330078, -117.60391998291016, -110.044189453125, -102.48446655273438, -94.92474365234375, -87.36502075195312, -79.80529022216797, -72.24556732177734, -64.68583679199219, -57.12611389160156, -49.56638717651367, -42.00666046142578, -34.446937561035156, -26.887210845947266, -19.327484130859375, -11.7677583694458, -4.208032608032227, 3.3516921997070312, 10.911418914794922, 18.471145629882812, 26.030868530273438, 33.59059524536133, 41.15032196044922, 48.71004867553711, 56.269775390625, 63.829498291015625, 71.38922119140625, 78.9489517211914, 86.50867462158203, 94.06840515136719, 101.62812805175781, 109.18785095214844, 116.7475814819336, 124.30730438232422, 131.86703491210938, 139.4267578125, 146.98648071289062, 154.54620361328125, 162.10592651367188, 169.6656494140625, 177.22537231445312, 184.78509521484375, 192.34483337402344, 199.90455627441406, 207.4642791748047, 215.0240020751953, 222.583740234375]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 8.0, 7.0, 9.0, 11.0, 15.0, 18.0, 30.0, 30.0, 63.0, 68.0, 154.0, 337.0, 856.0, 3011.0, 13550.0, 92257.0, 3778183.0, 271940.0, 26392.0, 5047.0, 1329.0, 481.0, 185.0, 105.0, 57.0, 30.0, 23.0, 20.0, 20.0, 14.0, 10.0, 6.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-239.0, -231.689453125, -224.37890625, -217.068359375, -209.7578125, -202.447265625, -195.13671875, -187.826171875, -180.515625, -173.205078125, -165.89453125, -158.583984375, -151.2734375, -143.962890625, -136.65234375, -129.341796875, -122.03125, -114.720703125, -107.41015625, -100.099609375, -92.7890625, -85.478515625, -78.16796875, -70.857421875, -63.546875, -56.236328125, -48.92578125, -41.615234375, -34.3046875, -26.994140625, -19.68359375, -12.373046875, -5.0625, 2.248046875, 9.55859375, 16.869140625, 24.1796875, 31.490234375, 38.80078125, 46.111328125, 53.421875, 60.732421875, 68.04296875, 75.353515625, 82.6640625, 89.974609375, 97.28515625, 104.595703125, 111.90625, 119.216796875, 126.52734375, 133.837890625, 141.1484375, 148.458984375, 155.76953125, 163.080078125, 170.390625, 177.701171875, 185.01171875, 192.322265625, 199.6328125, 206.943359375, 214.25390625, 221.564453125, 228.875]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 5.0, 6.0, 14.0, 10.0, 16.0, 17.0, 27.0, 21.0, 24.0, 31.0, 39.0, 50.0, 55.0, 52.0, 57.0, 53.0, 59.0, 75.0, 44.0, 51.0, 44.0, 49.0, 44.0, 22.0, 26.0, 26.0, 15.0, 22.0, 16.0, 10.0, 7.0, 7.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.38671875, -6.18853759765625, -5.9903564453125, -5.79217529296875, -5.593994140625, -5.39581298828125, -5.1976318359375, -4.99945068359375, -4.80126953125, -4.60308837890625, -4.4049072265625, -4.20672607421875, -4.008544921875, -3.81036376953125, -3.6121826171875, -3.41400146484375, -3.2158203125, -3.01763916015625, -2.8194580078125, -2.62127685546875, -2.423095703125, -2.22491455078125, -2.0267333984375, -1.82855224609375, -1.63037109375, -1.43218994140625, -1.2340087890625, -1.03582763671875, -0.837646484375, -0.63946533203125, -0.4412841796875, -0.24310302734375, -0.044921875, 0.15325927734375, 0.3514404296875, 0.54962158203125, 0.747802734375, 0.94598388671875, 1.1441650390625, 1.34234619140625, 1.54052734375, 1.73870849609375, 1.9368896484375, 2.13507080078125, 2.333251953125, 2.53143310546875, 2.7296142578125, 2.92779541015625, 3.1259765625, 3.32415771484375, 3.5223388671875, 3.72052001953125, 3.918701171875, 4.11688232421875, 4.3150634765625, 4.51324462890625, 4.71142578125, 4.90960693359375, 5.1077880859375, 5.30596923828125, 5.504150390625, 5.70233154296875, 5.9005126953125, 6.09869384765625, 6.296875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 7.0, 6.0, 16.0, 11.0, 19.0, 30.0, 55.0, 71.0, 178.0, 923.0, 9566.0, 354191.0, 3784592.0, 41755.0, 2282.0, 312.0, 108.0, 70.0, 37.0, 24.0, 17.0, 8.0, 11.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-361.5, -351.2421875, -340.984375, -330.7265625, -320.46875, -310.2109375, -299.953125, -289.6953125, -279.4375, -269.1796875, -258.921875, -248.6640625, -238.40625, -228.1484375, -217.890625, -207.6328125, -197.375, -187.1171875, -176.859375, -166.6015625, -156.34375, -146.0859375, -135.828125, -125.5703125, -115.3125, -105.0546875, -94.796875, -84.5390625, -74.28125, -64.0234375, -53.765625, -43.5078125, -33.25, -22.9921875, -12.734375, -2.4765625, 7.78125, 18.0390625, 28.296875, 38.5546875, 48.8125, 59.0703125, 69.328125, 79.5859375, 89.84375, 100.1015625, 110.359375, 120.6171875, 130.875, 141.1328125, 151.390625, 161.6484375, 171.90625, 182.1640625, 192.421875, 202.6796875, 212.9375, 223.1953125, 233.453125, 243.7109375, 253.96875, 264.2265625, 274.484375, 284.7421875, 295.0]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 6.0, 6.0, 4.0, 8.0, 11.0, 15.0, 25.0, 28.0, 50.0, 80.0, 125.0, 236.0, 453.0, 1651.0, 673.0, 307.0, 157.0, 93.0, 58.0, 34.0, 25.0, 16.0, 9.0, 6.0, 1.0, 2.0, 0.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.625, -33.70703125, -32.7890625, -31.87109375, -30.953125, -30.03515625, -29.1171875, -28.19921875, -27.28125, -26.36328125, -25.4453125, -24.52734375, -23.609375, -22.69140625, -21.7734375, -20.85546875, -19.9375, -19.01953125, -18.1015625, -17.18359375, -16.265625, -15.34765625, -14.4296875, -13.51171875, -12.59375, -11.67578125, -10.7578125, -9.83984375, -8.921875, -8.00390625, -7.0859375, -6.16796875, -5.25, -4.33203125, -3.4140625, -2.49609375, -1.578125, -0.66015625, 0.2578125, 1.17578125, 2.09375, 3.01171875, 3.9296875, 4.84765625, 5.765625, 6.68359375, 7.6015625, 8.51953125, 9.4375, 10.35546875, 11.2734375, 12.19140625, 13.109375, 14.02734375, 14.9453125, 15.86328125, 16.78125, 17.69921875, 18.6171875, 19.53515625, 20.453125, 21.37109375, 22.2890625, 23.20703125, 24.125]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 14.0, 9.0, 15.0, 27.0, 95.0, 109.0, 166.0, 200.0, 168.0, 103.0, 61.0, 20.0, 10.0, 1.0, 6.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-296.8629150390625, -288.7121887207031, -280.56146240234375, -272.41070556640625, -264.2599792480469, -256.1092529296875, -247.95852661132812, -239.80780029296875, -231.65707397460938, -223.50634765625, -215.35560607910156, -207.2048797607422, -199.0541534423828, -190.90341186523438, -182.752685546875, -174.60195922851562, -166.4512176513672, -158.3004913330078, -150.14974975585938, -141.9990234375, -133.84829711914062, -125.69756317138672, -117.54682922363281, -109.39610290527344, -101.24536895751953, -93.09463500976562, -84.94390869140625, -76.79317474365234, -68.64244079589844, -60.49171447753906, -52.340980529785156, -44.190250396728516, -36.03950500488281, -27.888774871826172, -19.7380428314209, -11.587310791015625, -3.4365806579589844, 4.714149475097656, 12.864883422851562, 21.015613555908203, 29.166343688964844, 37.317073822021484, 45.467803955078125, 53.61853790283203, 61.76926803588867, 69.91999816894531, 78.07073211669922, 86.22146606445312, 94.3721923828125, 102.5229263305664, 110.67365264892578, 118.82438659667969, 126.97511291503906, 135.1258544921875, 143.27658081054688, 151.42730712890625, 159.57803344726562, 167.728759765625, 175.87950134277344, 184.0302276611328, 192.1809539794922, 200.33169555664062, 208.482421875, 216.63314819335938, 224.7838897705078]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 5.0, 3.0, 5.0, 6.0, 9.0, 11.0, 14.0, 20.0, 22.0, 28.0, 24.0, 22.0, 40.0, 47.0, 38.0, 52.0, 49.0, 53.0, 57.0, 51.0, 50.0, 44.0, 53.0, 46.0, 35.0, 44.0, 40.0, 28.0, 27.0, 12.0, 11.0, 14.0, 11.0, 11.0, 7.0, 5.0, 2.0, 5.0, 4.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-99.9325180053711, -96.94683074951172, -93.96115112304688, -90.9754638671875, -87.98977661132812, -85.00409698486328, -82.0184097290039, -79.03273010253906, -76.04704284667969, -73.06135559082031, -70.07567596435547, -67.0899887084961, -64.10430908203125, -61.118621826171875, -58.1329345703125, -55.14725112915039, -52.16156768798828, -49.17588424682617, -46.19020080566406, -43.20451354980469, -40.21883010864258, -37.23314666748047, -34.247459411621094, -31.261775970458984, -28.276092529296875, -25.290409088134766, -22.304723739624023, -19.31903839111328, -16.333354949951172, -13.347670555114746, -10.36198616027832, -7.376300811767578, -4.3906097412109375, -1.4049253463745117, 1.580759048461914, 4.56644344329834, 7.552127838134766, 10.537812232971191, 13.523496627807617, 16.50918197631836, 19.49486541748047, 22.480548858642578, 25.46623420715332, 28.451919555664062, 31.437602996826172, 34.42328643798828, 37.408973693847656, 40.394657135009766, 43.380340576171875, 46.366024017333984, 49.351707458496094, 52.33739471435547, 55.32307815551758, 58.30876159667969, 61.29444885253906, 64.28013610839844, 67.26581573486328, 70.25150299072266, 73.2371826171875, 76.22286987304688, 79.20855712890625, 82.1942367553711, 85.17992401123047, 88.16560363769531, 91.15129089355469]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 5.0, 7.0, 2.0, 6.0, 10.0, 11.0, 18.0, 23.0, 35.0, 64.0, 89.0, 120.0, 182.0, 241.0, 391.0, 602.0, 1031.0, 1970.0, 4620.0, 13804.0, 48736.0, 169894.0, 398970.0, 279910.0, 89038.0, 24669.0, 7685.0, 2776.0, 1425.0, 783.0, 482.0, 317.0, 196.0, 135.0, 94.0, 53.0, 37.0, 38.0, 27.0, 21.0, 8.0, 6.0, 7.0, 4.0, 8.0, 4.0, 6.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-68.375, -66.150390625, -63.92578125, -61.701171875, -59.4765625, -57.251953125, -55.02734375, -52.802734375, -50.578125, -48.353515625, -46.12890625, -43.904296875, -41.6796875, -39.455078125, -37.23046875, -35.005859375, -32.78125, -30.556640625, -28.33203125, -26.107421875, -23.8828125, -21.658203125, -19.43359375, -17.208984375, -14.984375, -12.759765625, -10.53515625, -8.310546875, -6.0859375, -3.861328125, -1.63671875, 0.587890625, 2.8125, 5.037109375, 7.26171875, 9.486328125, 11.7109375, 13.935546875, 16.16015625, 18.384765625, 20.609375, 22.833984375, 25.05859375, 27.283203125, 29.5078125, 31.732421875, 33.95703125, 36.181640625, 38.40625, 40.630859375, 42.85546875, 45.080078125, 47.3046875, 49.529296875, 51.75390625, 53.978515625, 56.203125, 58.427734375, 60.65234375, 62.876953125, 65.1015625, 67.326171875, 69.55078125, 71.775390625, 74.0]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 7.0, 9.0, 33.0, 40.0, 46.0, 56.0, 69.0, 80.0, 91.0, 101.0, 91.0, 90.0, 75.0, 68.0, 38.0, 26.0, 29.0, 17.0, 12.0, 5.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.96875, -10.6317138671875, -10.294677734375, -9.9576416015625, -9.62060546875, -9.2835693359375, -8.946533203125, -8.6094970703125, -8.2724609375, -7.9354248046875, -7.598388671875, -7.2613525390625, -6.92431640625, -6.5872802734375, -6.250244140625, -5.9132080078125, -5.576171875, -5.2391357421875, -4.902099609375, -4.5650634765625, -4.22802734375, -3.8909912109375, -3.553955078125, -3.2169189453125, -2.8798828125, -2.5428466796875, -2.205810546875, -1.8687744140625, -1.53173828125, -1.1947021484375, -0.857666015625, -0.5206298828125, -0.18359375, 0.1534423828125, 0.490478515625, 0.8275146484375, 1.16455078125, 1.5015869140625, 1.838623046875, 2.1756591796875, 2.5126953125, 2.8497314453125, 3.186767578125, 3.5238037109375, 3.86083984375, 4.1978759765625, 4.534912109375, 4.8719482421875, 5.208984375, 5.5460205078125, 5.883056640625, 6.2200927734375, 6.55712890625, 6.8941650390625, 7.231201171875, 7.5682373046875, 7.9052734375, 8.2423095703125, 8.579345703125, 8.9163818359375, 9.25341796875, 9.5904541015625, 9.927490234375, 10.2645263671875, 10.6015625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 6.0, 5.0, 10.0, 4.0, 5.0, 12.0, 16.0, 19.0, 24.0, 39.0, 57.0, 86.0, 139.0, 172.0, 301.0, 505.0, 854.0, 1384.0, 2764.0, 6088.0, 15487.0, 44298.0, 133842.0, 331530.0, 319660.0, 124182.0, 40937.0, 14286.0, 5681.0, 2672.0, 1432.0, 747.0, 477.0, 293.0, 178.0, 121.0, 87.0, 57.0, 33.0, 18.0, 21.0, 15.0, 4.0, 3.0, 4.0, 7.0, 1.0, 2.0, 2.0], "bins": [-75.5, -73.5625, -71.625, -69.6875, -67.75, -65.8125, -63.875, -61.9375, -60.0, -58.0625, -56.125, -54.1875, -52.25, -50.3125, -48.375, -46.4375, -44.5, -42.5625, -40.625, -38.6875, -36.75, -34.8125, -32.875, -30.9375, -29.0, -27.0625, -25.125, -23.1875, -21.25, -19.3125, -17.375, -15.4375, -13.5, -11.5625, -9.625, -7.6875, -5.75, -3.8125, -1.875, 0.0625, 2.0, 3.9375, 5.875, 7.8125, 9.75, 11.6875, 13.625, 15.5625, 17.5, 19.4375, 21.375, 23.3125, 25.25, 27.1875, 29.125, 31.0625, 33.0, 34.9375, 36.875, 38.8125, 40.75, 42.6875, 44.625, 46.5625, 48.5]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 4.0, 7.0, 7.0, 14.0, 21.0, 23.0, 32.0, 31.0, 30.0, 31.0, 36.0, 32.0, 44.0, 51.0, 37.0, 61.0, 41.0, 55.0, 52.0, 42.0, 59.0, 42.0, 37.0, 30.0, 22.0, 28.0, 31.0, 16.0, 21.0, 14.0, 20.0, 9.0, 6.0, 7.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.9375, -36.7490234375, -35.560546875, -34.3720703125, -33.18359375, -31.9951171875, -30.806640625, -29.6181640625, -28.4296875, -27.2412109375, -26.052734375, -24.8642578125, -23.67578125, -22.4873046875, -21.298828125, -20.1103515625, -18.921875, -17.7333984375, -16.544921875, -15.3564453125, -14.16796875, -12.9794921875, -11.791015625, -10.6025390625, -9.4140625, -8.2255859375, -7.037109375, -5.8486328125, -4.66015625, -3.4716796875, -2.283203125, -1.0947265625, 0.09375, 1.2822265625, 2.470703125, 3.6591796875, 4.84765625, 6.0361328125, 7.224609375, 8.4130859375, 9.6015625, 10.7900390625, 11.978515625, 13.1669921875, 14.35546875, 15.5439453125, 16.732421875, 17.9208984375, 19.109375, 20.2978515625, 21.486328125, 22.6748046875, 23.86328125, 25.0517578125, 26.240234375, 27.4287109375, 28.6171875, 29.8056640625, 30.994140625, 32.1826171875, 33.37109375, 34.5595703125, 35.748046875, 36.9365234375, 38.125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 15.0, 17.0, 40.0, 54.0, 137.0, 306.0, 765.0, 2291.0, 9476.0, 67210.0, 539093.0, 378711.0, 41130.0, 6619.0, 1670.0, 585.0, 236.0, 94.0, 45.0, 19.0, 17.0, 14.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.46875, -43.48193359375, -41.4951171875, -39.50830078125, -37.521484375, -35.53466796875, -33.5478515625, -31.56103515625, -29.57421875, -27.58740234375, -25.6005859375, -23.61376953125, -21.626953125, -19.64013671875, -17.6533203125, -15.66650390625, -13.6796875, -11.69287109375, -9.7060546875, -7.71923828125, -5.732421875, -3.74560546875, -1.7587890625, 0.22802734375, 2.21484375, 4.20166015625, 6.1884765625, 8.17529296875, 10.162109375, 12.14892578125, 14.1357421875, 16.12255859375, 18.109375, 20.09619140625, 22.0830078125, 24.06982421875, 26.056640625, 28.04345703125, 30.0302734375, 32.01708984375, 34.00390625, 35.99072265625, 37.9775390625, 39.96435546875, 41.951171875, 43.93798828125, 45.9248046875, 47.91162109375, 49.8984375, 51.88525390625, 53.8720703125, 55.85888671875, 57.845703125, 59.83251953125, 61.8193359375, 63.80615234375, 65.79296875, 67.77978515625, 69.7666015625, 71.75341796875, 73.740234375, 75.72705078125, 77.7138671875, 79.70068359375, 81.6875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 8.0, 7.0, 5.0, 13.0, 19.0, 16.0, 25.0, 33.0, 53.0, 71.0, 91.0, 114.0, 111.0, 99.0, 76.0, 71.0, 47.0, 39.0, 27.0, 23.0, 14.0, 5.0, 9.0, 8.0, 4.0, 5.0, 2.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0078887939453125, -0.007702350616455078, -0.007515907287597656, -0.007329463958740234, -0.0071430206298828125, -0.006956577301025391, -0.006770133972167969, -0.006583690643310547, -0.006397247314453125, -0.006210803985595703, -0.006024360656738281, -0.005837917327880859, -0.0056514739990234375, -0.005465030670166016, -0.005278587341308594, -0.005092144012451172, -0.00490570068359375, -0.004719257354736328, -0.004532814025878906, -0.004346370697021484, -0.0041599273681640625, -0.003973484039306641, -0.0037870407104492188, -0.003600597381591797, -0.003414154052734375, -0.003227710723876953, -0.0030412673950195312, -0.0028548240661621094, -0.0026683807373046875, -0.0024819374084472656, -0.0022954940795898438, -0.002109050750732422, -0.001922607421875, -0.0017361640930175781, -0.0015497207641601562, -0.0013632774353027344, -0.0011768341064453125, -0.0009903907775878906, -0.0008039474487304688, -0.0006175041198730469, -0.000431060791015625, -0.0002446174621582031, -5.817413330078125e-05, 0.00012826919555664062, 0.0003147125244140625, 0.0005011558532714844, 0.0006875991821289062, 0.0008740425109863281, 0.00106048583984375, 0.0012469291687011719, 0.0014333724975585938, 0.0016198158264160156, 0.0018062591552734375, 0.0019927024841308594, 0.0021791458129882812, 0.002365589141845703, 0.002552032470703125, 0.002738475799560547, 0.0029249191284179688, 0.0031113624572753906, 0.0032978057861328125, 0.0034842491149902344, 0.0036706924438476562, 0.003857135772705078, 0.0040435791015625]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 5.0, 3.0, 8.0, 11.0, 19.0, 19.0, 21.0, 20.0, 38.0, 68.0, 82.0, 135.0, 226.0, 295.0, 577.0, 900.0, 1633.0, 3285.0, 7197.0, 19168.0, 60963.0, 221777.0, 443162.0, 202330.0, 55208.0, 17566.0, 6700.0, 3134.0, 1609.0, 916.0, 507.0, 331.0, 186.0, 143.0, 90.0, 56.0, 41.0, 26.0, 31.0, 25.0, 7.0, 10.0, 7.0, 5.0, 8.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0], "bins": [-40.9375, -39.74951171875, -38.5615234375, -37.37353515625, -36.185546875, -34.99755859375, -33.8095703125, -32.62158203125, -31.43359375, -30.24560546875, -29.0576171875, -27.86962890625, -26.681640625, -25.49365234375, -24.3056640625, -23.11767578125, -21.9296875, -20.74169921875, -19.5537109375, -18.36572265625, -17.177734375, -15.98974609375, -14.8017578125, -13.61376953125, -12.42578125, -11.23779296875, -10.0498046875, -8.86181640625, -7.673828125, -6.48583984375, -5.2978515625, -4.10986328125, -2.921875, -1.73388671875, -0.5458984375, 0.64208984375, 1.830078125, 3.01806640625, 4.2060546875, 5.39404296875, 6.58203125, 7.77001953125, 8.9580078125, 10.14599609375, 11.333984375, 12.52197265625, 13.7099609375, 14.89794921875, 16.0859375, 17.27392578125, 18.4619140625, 19.64990234375, 20.837890625, 22.02587890625, 23.2138671875, 24.40185546875, 25.58984375, 26.77783203125, 27.9658203125, 29.15380859375, 30.341796875, 31.52978515625, 32.7177734375, 33.90576171875, 35.09375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 1.0, 12.0, 7.0, 14.0, 9.0, 18.0, 18.0, 20.0, 31.0, 42.0, 61.0, 59.0, 63.0, 85.0, 65.0, 85.0, 53.0, 59.0, 67.0, 47.0, 49.0, 25.0, 27.0, 23.0, 9.0, 14.0, 8.0, 4.0, 5.0, 2.0, 3.0, 2.0, 3.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-21.75, -21.061279296875, -20.37255859375, -19.683837890625, -18.9951171875, -18.306396484375, -17.61767578125, -16.928955078125, -16.240234375, -15.551513671875, -14.86279296875, -14.174072265625, -13.4853515625, -12.796630859375, -12.10791015625, -11.419189453125, -10.73046875, -10.041748046875, -9.35302734375, -8.664306640625, -7.9755859375, -7.286865234375, -6.59814453125, -5.909423828125, -5.220703125, -4.531982421875, -3.84326171875, -3.154541015625, -2.4658203125, -1.777099609375, -1.08837890625, -0.399658203125, 0.2890625, 0.977783203125, 1.66650390625, 2.355224609375, 3.0439453125, 3.732666015625, 4.42138671875, 5.110107421875, 5.798828125, 6.487548828125, 7.17626953125, 7.864990234375, 8.5537109375, 9.242431640625, 9.93115234375, 10.619873046875, 11.30859375, 11.997314453125, 12.68603515625, 13.374755859375, 14.0634765625, 14.752197265625, 15.44091796875, 16.129638671875, 16.818359375, 17.507080078125, 18.19580078125, 18.884521484375, 19.5732421875, 20.261962890625, 20.95068359375, 21.639404296875, 22.328125]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 2.0, 6.0, 11.0, 12.0, 19.0, 39.0, 75.0, 99.0, 151.0, 160.0, 155.0, 113.0, 71.0, 36.0, 23.0, 13.0, 8.0, 5.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-759.8929443359375, -742.8273315429688, -725.76171875, -708.6961059570312, -691.6304931640625, -674.5648803710938, -657.499267578125, -640.4336547851562, -623.3680419921875, -606.3024291992188, -589.23681640625, -572.1712036132812, -555.1055908203125, -538.0399780273438, -520.974365234375, -503.90875244140625, -486.8431091308594, -469.7774963378906, -452.7118835449219, -435.6462707519531, -418.5806579589844, -401.5150451660156, -384.44940185546875, -367.3837890625, -350.31817626953125, -333.2525634765625, -316.18695068359375, -299.121337890625, -282.05572509765625, -264.9901123046875, -247.9244842529297, -230.85887145996094, -213.79327392578125, -196.7276611328125, -179.66204833984375, -162.596435546875, -145.53082275390625, -128.4652099609375, -111.39958190917969, -94.33396911621094, -77.26835632324219, -60.20274353027344, -43.13712692260742, -26.071510314941406, -9.005897521972656, 8.059715270996094, 25.125335693359375, 42.190948486328125, 59.256561279296875, 76.32217407226562, 93.38778686523438, 110.45340728759766, 127.5190200805664, 144.58462524414062, 161.65025329589844, 178.7158660888672, 195.78147888183594, 212.8470916748047, 229.91270446777344, 246.97833251953125, 264.0439453125, 281.10955810546875, 298.1751708984375, 315.24078369140625, 332.306396484375]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 3.0, 3.0, 6.0, 5.0, 12.0, 13.0, 10.0, 15.0, 14.0, 27.0, 27.0, 15.0, 35.0, 37.0, 29.0, 55.0, 44.0, 49.0, 42.0, 50.0, 53.0, 46.0, 49.0, 52.0, 42.0, 38.0, 36.0, 33.0, 37.0, 20.0, 21.0, 14.0, 23.0, 15.0, 9.0, 5.0, 5.0, 2.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-298.4479675292969, -289.56915283203125, -280.6903381347656, -271.8115234375, -262.9327087402344, -254.05389404296875, -245.17507934570312, -236.2962646484375, -227.41744995117188, -218.53863525390625, -209.65982055664062, -200.781005859375, -191.90219116210938, -183.02337646484375, -174.14456176757812, -165.2657470703125, -156.38693237304688, -147.50811767578125, -138.62930297851562, -129.75048828125, -120.87167358398438, -111.99285888671875, -103.11404418945312, -94.2352294921875, -85.35641479492188, -76.47760009765625, -67.59878540039062, -58.719970703125, -49.841156005859375, -40.96234130859375, -32.083526611328125, -23.2047119140625, -14.325927734375, -5.447113037109375, 3.43170166015625, 12.310516357421875, 21.1893310546875, 30.068145751953125, 38.94696044921875, 47.825775146484375, 56.70458984375, 65.58340454101562, 74.46221923828125, 83.34103393554688, 92.2198486328125, 101.09866333007812, 109.97747802734375, 118.85629272460938, 127.735107421875, 136.61392211914062, 145.49273681640625, 154.37155151367188, 163.2503662109375, 172.12918090820312, 181.00799560546875, 189.88681030273438, 198.765625, 207.64443969726562, 216.52325439453125, 225.40206909179688, 234.2808837890625, 243.15969848632812, 252.03851318359375, 260.9173278808594, 269.796142578125]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 1.0, 1.0, 6.0, 6.0, 6.0, 7.0, 10.0, 15.0, 20.0, 41.0, 47.0, 107.0, 194.0, 458.0, 1084.0, 3278.0, 12638.0, 86704.0, 3886930.0, 178977.0, 17833.0, 3785.0, 1201.0, 468.0, 182.0, 105.0, 56.0, 36.0, 29.0, 14.0, 18.0, 4.0, 7.0, 10.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-191.375, -184.9140625, -178.453125, -171.9921875, -165.53125, -159.0703125, -152.609375, -146.1484375, -139.6875, -133.2265625, -126.765625, -120.3046875, -113.84375, -107.3828125, -100.921875, -94.4609375, -88.0, -81.5390625, -75.078125, -68.6171875, -62.15625, -55.6953125, -49.234375, -42.7734375, -36.3125, -29.8515625, -23.390625, -16.9296875, -10.46875, -4.0078125, 2.453125, 8.9140625, 15.375, 21.8359375, 28.296875, 34.7578125, 41.21875, 47.6796875, 54.140625, 60.6015625, 67.0625, 73.5234375, 79.984375, 86.4453125, 92.90625, 99.3671875, 105.828125, 112.2890625, 118.75, 125.2109375, 131.671875, 138.1328125, 144.59375, 151.0546875, 157.515625, 163.9765625, 170.4375, 176.8984375, 183.359375, 189.8203125, 196.28125, 202.7421875, 209.203125, 215.6640625, 222.125]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 2.0, 5.0, 3.0, 11.0, 4.0, 9.0, 10.0, 5.0, 22.0, 27.0, 31.0, 32.0, 45.0, 28.0, 41.0, 47.0, 62.0, 56.0, 59.0, 81.0, 64.0, 65.0, 44.0, 52.0, 36.0, 42.0, 23.0, 26.0, 14.0, 16.0, 10.0, 9.0, 4.0, 5.0, 6.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.484375, -8.20654296875, -7.9287109375, -7.65087890625, -7.373046875, -7.09521484375, -6.8173828125, -6.53955078125, -6.26171875, -5.98388671875, -5.7060546875, -5.42822265625, -5.150390625, -4.87255859375, -4.5947265625, -4.31689453125, -4.0390625, -3.76123046875, -3.4833984375, -3.20556640625, -2.927734375, -2.64990234375, -2.3720703125, -2.09423828125, -1.81640625, -1.53857421875, -1.2607421875, -0.98291015625, -0.705078125, -0.42724609375, -0.1494140625, 0.12841796875, 0.40625, 0.68408203125, 0.9619140625, 1.23974609375, 1.517578125, 1.79541015625, 2.0732421875, 2.35107421875, 2.62890625, 2.90673828125, 3.1845703125, 3.46240234375, 3.740234375, 4.01806640625, 4.2958984375, 4.57373046875, 4.8515625, 5.12939453125, 5.4072265625, 5.68505859375, 5.962890625, 6.24072265625, 6.5185546875, 6.79638671875, 7.07421875, 7.35205078125, 7.6298828125, 7.90771484375, 8.185546875, 8.46337890625, 8.7412109375, 9.01904296875, 9.296875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 7.0, 2.0, 4.0, 9.0, 8.0, 22.0, 21.0, 22.0, 33.0, 68.0, 84.0, 122.0, 196.0, 275.0, 434.0, 772.0, 1206.0, 2094.0, 3822.0, 7454.0, 16075.0, 38039.0, 111225.0, 481213.0, 2968669.0, 398782.0, 98935.0, 34401.0, 14542.0, 7016.0, 3562.0, 1961.0, 1105.0, 786.0, 421.0, 294.0, 202.0, 132.0, 82.0, 61.0, 39.0, 31.0, 20.0, 14.0, 8.0, 4.0, 5.0, 6.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-67.0625, -64.9296875, -62.796875, -60.6640625, -58.53125, -56.3984375, -54.265625, -52.1328125, -50.0, -47.8671875, -45.734375, -43.6015625, -41.46875, -39.3359375, -37.203125, -35.0703125, -32.9375, -30.8046875, -28.671875, -26.5390625, -24.40625, -22.2734375, -20.140625, -18.0078125, -15.875, -13.7421875, -11.609375, -9.4765625, -7.34375, -5.2109375, -3.078125, -0.9453125, 1.1875, 3.3203125, 5.453125, 7.5859375, 9.71875, 11.8515625, 13.984375, 16.1171875, 18.25, 20.3828125, 22.515625, 24.6484375, 26.78125, 28.9140625, 31.046875, 33.1796875, 35.3125, 37.4453125, 39.578125, 41.7109375, 43.84375, 45.9765625, 48.109375, 50.2421875, 52.375, 54.5078125, 56.640625, 58.7734375, 60.90625, 63.0390625, 65.171875, 67.3046875, 69.4375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 5.0, 4.0, 7.0, 4.0, 11.0, 11.0, 22.0, 14.0, 17.0, 34.0, 52.0, 79.0, 138.0, 232.0, 515.0, 1602.0, 573.0, 266.0, 187.0, 92.0, 57.0, 42.0, 34.0, 16.0, 16.0, 12.0, 9.0, 5.0, 4.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-26.71875, -25.966552734375, -25.21435546875, -24.462158203125, -23.7099609375, -22.957763671875, -22.20556640625, -21.453369140625, -20.701171875, -19.948974609375, -19.19677734375, -18.444580078125, -17.6923828125, -16.940185546875, -16.18798828125, -15.435791015625, -14.68359375, -13.931396484375, -13.17919921875, -12.427001953125, -11.6748046875, -10.922607421875, -10.17041015625, -9.418212890625, -8.666015625, -7.913818359375, -7.16162109375, -6.409423828125, -5.6572265625, -4.905029296875, -4.15283203125, -3.400634765625, -2.6484375, -1.896240234375, -1.14404296875, -0.391845703125, 0.3603515625, 1.112548828125, 1.86474609375, 2.616943359375, 3.369140625, 4.121337890625, 4.87353515625, 5.625732421875, 6.3779296875, 7.130126953125, 7.88232421875, 8.634521484375, 9.38671875, 10.138916015625, 10.89111328125, 11.643310546875, 12.3955078125, 13.147705078125, 13.89990234375, 14.652099609375, 15.404296875, 16.156494140625, 16.90869140625, 17.660888671875, 18.4130859375, 19.165283203125, 19.91748046875, 20.669677734375, 21.421875]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 8.0, 4.0, 11.0, 15.0, 36.0, 41.0, 68.0, 90.0, 120.0, 143.0, 126.0, 109.0, 55.0, 61.0, 43.0, 32.0, 17.0, 9.0, 3.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-104.11859893798828, -98.78491973876953, -93.45124816894531, -88.11756896972656, -82.78388977050781, -77.45021057128906, -72.11653137207031, -66.7828598022461, -61.449180603027344, -56.115501403808594, -50.78182601928711, -45.448150634765625, -40.114471435546875, -34.780792236328125, -29.44711685180664, -24.113441467285156, -18.779762268066406, -13.446084976196289, -8.112407684326172, -2.7787303924560547, 2.5549468994140625, 7.88862419128418, 13.222301483154297, 18.55597686767578, 23.88965606689453, 29.22333335876465, 34.557010650634766, 39.89068603515625, 45.224365234375, 50.55804443359375, 55.891719818115234, 61.22539520263672, 66.55908203125, 71.89276123046875, 77.2264404296875, 82.56011199951172, 87.89379119873047, 93.22747039794922, 98.56114196777344, 103.89482116699219, 109.22850036621094, 114.56217956542969, 119.89585876464844, 125.22953033447266, 130.56320190429688, 135.89688110351562, 141.23056030273438, 146.56423950195312, 151.89791870117188, 157.23159790039062, 162.56527709960938, 167.89895629882812, 173.23263549804688, 178.56629943847656, 183.8999786376953, 189.23365783691406, 194.5673370361328, 199.90101623535156, 205.2346954345703, 210.56837463378906, 215.90203857421875, 221.2357177734375, 226.56939697265625, 231.903076171875, 237.23675537109375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 3.0, 7.0, 5.0, 10.0, 12.0, 19.0, 9.0, 34.0, 35.0, 29.0, 35.0, 37.0, 41.0, 54.0, 53.0, 65.0, 57.0, 59.0, 55.0, 47.0, 59.0, 41.0, 30.0, 45.0, 27.0, 33.0, 29.0, 18.0, 17.0, 10.0, 11.0, 6.0, 4.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-103.99421691894531, -100.57024383544922, -97.14627838134766, -93.72230529785156, -90.29833984375, -86.8743667602539, -83.45039367675781, -80.02642822265625, -76.60246276855469, -73.1784896850586, -69.75452423095703, -66.33055114746094, -62.906585693359375, -59.48261260986328, -56.05864334106445, -52.634674072265625, -49.21070098876953, -45.7867317199707, -42.362762451171875, -38.93878936767578, -35.51482391357422, -32.090850830078125, -28.666881561279297, -25.24291229248047, -21.81894302368164, -18.394973754882812, -14.971003532409668, -11.547033309936523, -8.123064041137695, -4.699094772338867, -1.2751235961914062, 2.148845672607422, 5.57281494140625, 8.996784210205078, 12.420754432678223, 15.844724655151367, 19.268693923950195, 22.692663192749023, 26.116634368896484, 29.540603637695312, 32.96457290649414, 36.38854217529297, 39.8125114440918, 43.236480712890625, 46.66045379638672, 50.08441925048828, 53.508392333984375, 56.9323616027832, 60.35633087158203, 63.78030014038086, 67.20426940917969, 70.62824249267578, 74.05220794677734, 77.47618103027344, 80.900146484375, 84.3241195678711, 87.74809265136719, 91.17206573486328, 94.59603118896484, 98.02000427246094, 101.4439697265625, 104.8679428100586, 108.29191589355469, 111.71588134765625, 115.13984680175781]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 6.0, 2.0, 7.0, 7.0, 17.0, 13.0, 28.0, 31.0, 41.0, 88.0, 125.0, 170.0, 250.0, 386.0, 693.0, 1017.0, 1840.0, 3700.0, 7707.0, 18155.0, 46238.0, 119392.0, 264702.0, 314668.0, 159990.0, 63841.0, 24966.0, 10210.0, 4500.0, 2396.0, 1255.0, 750.0, 445.0, 299.0, 207.0, 145.0, 84.0, 53.0, 41.0, 32.0, 21.0, 16.0, 9.0, 6.0, 4.0, 1.0, 2.0, 3.0, 3.0, 0.0, 1.0], "bins": [-55.59375, -54.056640625, -52.51953125, -50.982421875, -49.4453125, -47.908203125, -46.37109375, -44.833984375, -43.296875, -41.759765625, -40.22265625, -38.685546875, -37.1484375, -35.611328125, -34.07421875, -32.537109375, -31.0, -29.462890625, -27.92578125, -26.388671875, -24.8515625, -23.314453125, -21.77734375, -20.240234375, -18.703125, -17.166015625, -15.62890625, -14.091796875, -12.5546875, -11.017578125, -9.48046875, -7.943359375, -6.40625, -4.869140625, -3.33203125, -1.794921875, -0.2578125, 1.279296875, 2.81640625, 4.353515625, 5.890625, 7.427734375, 8.96484375, 10.501953125, 12.0390625, 13.576171875, 15.11328125, 16.650390625, 18.1875, 19.724609375, 21.26171875, 22.798828125, 24.3359375, 25.873046875, 27.41015625, 28.947265625, 30.484375, 32.021484375, 33.55859375, 35.095703125, 36.6328125, 38.169921875, 39.70703125, 41.244140625, 42.78125]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 1.0, 3.0, 5.0, 8.0, 6.0, 11.0, 7.0, 16.0, 25.0, 26.0, 26.0, 37.0, 46.0, 48.0, 50.0, 79.0, 75.0, 77.0, 79.0, 52.0, 56.0, 52.0, 57.0, 36.0, 25.0, 32.0, 23.0, 18.0, 8.0, 7.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.3828125, -9.0518798828125, -8.720947265625, -8.3900146484375, -8.05908203125, -7.7281494140625, -7.397216796875, -7.0662841796875, -6.7353515625, -6.4044189453125, -6.073486328125, -5.7425537109375, -5.41162109375, -5.0806884765625, -4.749755859375, -4.4188232421875, -4.087890625, -3.7569580078125, -3.426025390625, -3.0950927734375, -2.76416015625, -2.4332275390625, -2.102294921875, -1.7713623046875, -1.4404296875, -1.1094970703125, -0.778564453125, -0.4476318359375, -0.11669921875, 0.2142333984375, 0.545166015625, 0.8760986328125, 1.20703125, 1.5379638671875, 1.868896484375, 2.1998291015625, 2.53076171875, 2.8616943359375, 3.192626953125, 3.5235595703125, 3.8544921875, 4.1854248046875, 4.516357421875, 4.8472900390625, 5.17822265625, 5.5091552734375, 5.840087890625, 6.1710205078125, 6.501953125, 6.8328857421875, 7.163818359375, 7.4947509765625, 7.82568359375, 8.1566162109375, 8.487548828125, 8.8184814453125, 9.1494140625, 9.4803466796875, 9.811279296875, 10.1422119140625, 10.47314453125, 10.8040771484375, 11.135009765625, 11.4659423828125, 11.796875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 6.0, 8.0, 9.0, 16.0, 18.0, 34.0, 41.0, 62.0, 82.0, 123.0, 186.0, 273.0, 394.0, 652.0, 1221.0, 2125.0, 4149.0, 8912.0, 20709.0, 50708.0, 125982.0, 275808.0, 304240.0, 147743.0, 60018.0, 24165.0, 10333.0, 4818.0, 2343.0, 1268.0, 756.0, 467.0, 284.0, 168.0, 123.0, 104.0, 58.0, 39.0, 31.0, 28.0, 17.0, 14.0, 9.0, 6.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-41.875, -40.4833984375, -39.091796875, -37.7001953125, -36.30859375, -34.9169921875, -33.525390625, -32.1337890625, -30.7421875, -29.3505859375, -27.958984375, -26.5673828125, -25.17578125, -23.7841796875, -22.392578125, -21.0009765625, -19.609375, -18.2177734375, -16.826171875, -15.4345703125, -14.04296875, -12.6513671875, -11.259765625, -9.8681640625, -8.4765625, -7.0849609375, -5.693359375, -4.3017578125, -2.91015625, -1.5185546875, -0.126953125, 1.2646484375, 2.65625, 4.0478515625, 5.439453125, 6.8310546875, 8.22265625, 9.6142578125, 11.005859375, 12.3974609375, 13.7890625, 15.1806640625, 16.572265625, 17.9638671875, 19.35546875, 20.7470703125, 22.138671875, 23.5302734375, 24.921875, 26.3134765625, 27.705078125, 29.0966796875, 30.48828125, 31.8798828125, 33.271484375, 34.6630859375, 36.0546875, 37.4462890625, 38.837890625, 40.2294921875, 41.62109375, 43.0126953125, 44.404296875, 45.7958984375, 47.1875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 7.0, 2.0, 4.0, 6.0, 11.0, 13.0, 22.0, 21.0, 19.0, 26.0, 30.0, 24.0, 33.0, 41.0, 46.0, 44.0, 50.0, 46.0, 44.0, 64.0, 54.0, 54.0, 64.0, 52.0, 39.0, 45.0, 36.0, 23.0, 22.0, 17.0, 12.0, 13.0, 9.0, 7.0, 1.0, 6.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-54.59375, -53.15478515625, -51.7158203125, -50.27685546875, -48.837890625, -47.39892578125, -45.9599609375, -44.52099609375, -43.08203125, -41.64306640625, -40.2041015625, -38.76513671875, -37.326171875, -35.88720703125, -34.4482421875, -33.00927734375, -31.5703125, -30.13134765625, -28.6923828125, -27.25341796875, -25.814453125, -24.37548828125, -22.9365234375, -21.49755859375, -20.05859375, -18.61962890625, -17.1806640625, -15.74169921875, -14.302734375, -12.86376953125, -11.4248046875, -9.98583984375, -8.546875, -7.10791015625, -5.6689453125, -4.22998046875, -2.791015625, -1.35205078125, 0.0869140625, 1.52587890625, 2.96484375, 4.40380859375, 5.8427734375, 7.28173828125, 8.720703125, 10.15966796875, 11.5986328125, 13.03759765625, 14.4765625, 15.91552734375, 17.3544921875, 18.79345703125, 20.232421875, 21.67138671875, 23.1103515625, 24.54931640625, 25.98828125, 27.42724609375, 28.8662109375, 30.30517578125, 31.744140625, 33.18310546875, 34.6220703125, 36.06103515625, 37.5]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 6.0, 7.0, 20.0, 31.0, 50.0, 90.0, 139.0, 257.0, 467.0, 935.0, 2091.0, 4632.0, 13778.0, 65050.0, 527516.0, 370865.0, 44404.0, 10852.0, 3895.0, 1709.0, 778.0, 410.0, 241.0, 115.0, 71.0, 57.0, 33.0, 27.0, 9.0, 10.0, 4.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-60.0625, -58.4775390625, -56.892578125, -55.3076171875, -53.72265625, -52.1376953125, -50.552734375, -48.9677734375, -47.3828125, -45.7978515625, -44.212890625, -42.6279296875, -41.04296875, -39.4580078125, -37.873046875, -36.2880859375, -34.703125, -33.1181640625, -31.533203125, -29.9482421875, -28.36328125, -26.7783203125, -25.193359375, -23.6083984375, -22.0234375, -20.4384765625, -18.853515625, -17.2685546875, -15.68359375, -14.0986328125, -12.513671875, -10.9287109375, -9.34375, -7.7587890625, -6.173828125, -4.5888671875, -3.00390625, -1.4189453125, 0.166015625, 1.7509765625, 3.3359375, 4.9208984375, 6.505859375, 8.0908203125, 9.67578125, 11.2607421875, 12.845703125, 14.4306640625, 16.015625, 17.6005859375, 19.185546875, 20.7705078125, 22.35546875, 23.9404296875, 25.525390625, 27.1103515625, 28.6953125, 30.2802734375, 31.865234375, 33.4501953125, 35.03515625, 36.6201171875, 38.205078125, 39.7900390625, 41.375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 7.0, 4.0, 7.0, 11.0, 24.0, 13.0, 27.0, 33.0, 58.0, 67.0, 125.0, 153.0, 117.0, 101.0, 73.0, 42.0, 37.0, 22.0, 21.0, 13.0, 11.0, 10.0, 7.0, 5.0, 1.0, 5.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005157470703125, -0.004965662956237793, -0.004773855209350586, -0.004582047462463379, -0.004390239715576172, -0.004198431968688965, -0.004006624221801758, -0.0038148164749145508, -0.0036230087280273438, -0.0034312009811401367, -0.0032393932342529297, -0.0030475854873657227, -0.0028557777404785156, -0.0026639699935913086, -0.0024721622467041016, -0.0022803544998168945, -0.0020885467529296875, -0.0018967390060424805, -0.0017049312591552734, -0.0015131235122680664, -0.0013213157653808594, -0.0011295080184936523, -0.0009377002716064453, -0.0007458925247192383, -0.0005540847778320312, -0.0003622770309448242, -0.0001704692840576172, 2.1338462829589844e-05, 0.00021314620971679688, 0.0004049539566040039, 0.0005967617034912109, 0.000788569450378418, 0.000980377197265625, 0.001172184944152832, 0.001363992691040039, 0.001555800437927246, 0.0017476081848144531, 0.0019394159317016602, 0.002131223678588867, 0.0023230314254760742, 0.0025148391723632812, 0.0027066469192504883, 0.0028984546661376953, 0.0030902624130249023, 0.0032820701599121094, 0.0034738779067993164, 0.0036656856536865234, 0.0038574934005737305, 0.0040493011474609375, 0.0042411088943481445, 0.0044329166412353516, 0.004624724388122559, 0.004816532135009766, 0.005008339881896973, 0.00520014762878418, 0.005391955375671387, 0.005583763122558594, 0.005775570869445801, 0.005967378616333008, 0.006159186363220215, 0.006350994110107422, 0.006542801856994629, 0.006734609603881836, 0.006926417350769043, 0.00711822509765625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 6.0, 6.0, 3.0, 1.0, 14.0, 24.0, 31.0, 67.0, 84.0, 176.0, 222.0, 491.0, 1231.0, 3370.0, 11619.0, 61521.0, 727175.0, 210846.0, 22569.0, 5729.0, 1809.0, 754.0, 371.0, 193.0, 94.0, 55.0, 44.0, 14.0, 12.0, 13.0, 4.0, 2.0, 6.0, 5.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-87.625, -85.3623046875, -83.099609375, -80.8369140625, -78.57421875, -76.3115234375, -74.048828125, -71.7861328125, -69.5234375, -67.2607421875, -64.998046875, -62.7353515625, -60.47265625, -58.2099609375, -55.947265625, -53.6845703125, -51.421875, -49.1591796875, -46.896484375, -44.6337890625, -42.37109375, -40.1083984375, -37.845703125, -35.5830078125, -33.3203125, -31.0576171875, -28.794921875, -26.5322265625, -24.26953125, -22.0068359375, -19.744140625, -17.4814453125, -15.21875, -12.9560546875, -10.693359375, -8.4306640625, -6.16796875, -3.9052734375, -1.642578125, 0.6201171875, 2.8828125, 5.1455078125, 7.408203125, 9.6708984375, 11.93359375, 14.1962890625, 16.458984375, 18.7216796875, 20.984375, 23.2470703125, 25.509765625, 27.7724609375, 30.03515625, 32.2978515625, 34.560546875, 36.8232421875, 39.0859375, 41.3486328125, 43.611328125, 45.8740234375, 48.13671875, 50.3994140625, 52.662109375, 54.9248046875, 57.1875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 2.0, 1.0, 8.0, 8.0, 9.0, 6.0, 13.0, 15.0, 16.0, 28.0, 35.0, 67.0, 93.0, 123.0, 110.0, 124.0, 87.0, 75.0, 48.0, 34.0, 18.0, 16.0, 14.0, 9.0, 6.0, 11.0, 4.0, 11.0, 4.0, 4.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-38.84375, -37.8662109375, -36.888671875, -35.9111328125, -34.93359375, -33.9560546875, -32.978515625, -32.0009765625, -31.0234375, -30.0458984375, -29.068359375, -28.0908203125, -27.11328125, -26.1357421875, -25.158203125, -24.1806640625, -23.203125, -22.2255859375, -21.248046875, -20.2705078125, -19.29296875, -18.3154296875, -17.337890625, -16.3603515625, -15.3828125, -14.4052734375, -13.427734375, -12.4501953125, -11.47265625, -10.4951171875, -9.517578125, -8.5400390625, -7.5625, -6.5849609375, -5.607421875, -4.6298828125, -3.65234375, -2.6748046875, -1.697265625, -0.7197265625, 0.2578125, 1.2353515625, 2.212890625, 3.1904296875, 4.16796875, 5.1455078125, 6.123046875, 7.1005859375, 8.078125, 9.0556640625, 10.033203125, 11.0107421875, 11.98828125, 12.9658203125, 13.943359375, 14.9208984375, 15.8984375, 16.8759765625, 17.853515625, 18.8310546875, 19.80859375, 20.7861328125, 21.763671875, 22.7412109375, 23.71875]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 6.0, 2.0, 2.0, 10.0, 17.0, 27.0, 54.0, 61.0, 85.0, 129.0, 125.0, 121.0, 116.0, 88.0, 49.0, 47.0, 25.0, 18.0, 10.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-267.1509094238281, -254.8964080810547, -242.64190673828125, -230.3874053955078, -218.13290405273438, -205.87840270996094, -193.6239013671875, -181.36940002441406, -169.11489868164062, -156.8603973388672, -144.60589599609375, -132.3513946533203, -120.09689331054688, -107.84239196777344, -95.587890625, -83.33338928222656, -71.07888793945312, -58.82438659667969, -46.56988525390625, -34.31538391113281, -22.060882568359375, -9.806381225585938, 2.4481201171875, 14.702621459960938, 26.957122802734375, 39.21162414550781, 51.46612548828125, 63.72062683105469, 75.97512817382812, 88.22962951660156, 100.484130859375, 112.73863220214844, 124.9931640625, 137.24766540527344, 149.50216674804688, 161.7566680908203, 174.01116943359375, 186.2656707763672, 198.52017211914062, 210.77467346191406, 223.0291748046875, 235.28367614746094, 247.53817749023438, 259.79266357421875, 272.04718017578125, 284.30169677734375, 296.5561828613281, 308.8106689453125, 321.065185546875, 333.3197021484375, 345.5741882324219, 357.82867431640625, 370.08319091796875, 382.33770751953125, 394.5921936035156, 406.8466796875, 419.1011962890625, 431.355712890625, 443.6101989746094, 455.86468505859375, 468.11920166015625, 480.37371826171875, 492.6282043457031, 504.8826904296875, 517.13720703125]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 3.0, 1.0, 5.0, 3.0, 9.0, 6.0, 12.0, 14.0, 17.0, 19.0, 26.0, 33.0, 29.0, 49.0, 59.0, 48.0, 53.0, 50.0, 50.0, 53.0, 41.0, 57.0, 56.0, 56.0, 35.0, 40.0, 24.0, 25.0, 29.0, 26.0, 18.0, 15.0, 14.0, 5.0, 7.0, 7.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-252.88116455078125, -244.57766723632812, -236.274169921875, -227.97067260742188, -219.66717529296875, -211.36367797851562, -203.0601806640625, -194.75668334960938, -186.45318603515625, -178.14968872070312, -169.84619140625, -161.54269409179688, -153.23919677734375, -144.93569946289062, -136.6322021484375, -128.32870483398438, -120.02520751953125, -111.72171020507812, -103.418212890625, -95.11471557617188, -86.81121826171875, -78.50772094726562, -70.2042236328125, -61.900726318359375, -53.59722900390625, -45.293731689453125, -36.990234375, -28.686737060546875, -20.38323974609375, -12.079742431640625, -3.7762451171875, 4.527252197265625, 12.830718994140625, 21.13421630859375, 29.437713623046875, 37.7412109375, 46.044708251953125, 54.34820556640625, 62.651702880859375, 70.9552001953125, 79.25869750976562, 87.56219482421875, 95.86569213867188, 104.169189453125, 112.47268676757812, 120.77618408203125, 129.07968139648438, 137.3831787109375, 145.68667602539062, 153.99017333984375, 162.29367065429688, 170.59716796875, 178.90066528320312, 187.20416259765625, 195.50765991210938, 203.8111572265625, 212.11465454101562, 220.41815185546875, 228.72164916992188, 237.025146484375, 245.32864379882812, 253.63214111328125, 261.9356384277344, 270.2391357421875, 278.5426330566406]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 6.0, 4.0, 5.0, 11.0, 9.0, 20.0, 22.0, 22.0, 52.0, 63.0, 77.0, 140.0, 222.0, 358.0, 619.0, 1148.0, 2249.0, 4746.0, 11817.0, 34285.0, 172562.0, 3697683.0, 207696.0, 38059.0, 12272.0, 5012.0, 2299.0, 1138.0, 625.0, 344.0, 190.0, 144.0, 113.0, 72.0, 49.0, 28.0, 27.0, 21.0, 18.0, 11.0, 11.0, 12.0, 7.0, 6.0, 3.0, 1.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-77.6875, -75.1435546875, -72.599609375, -70.0556640625, -67.51171875, -64.9677734375, -62.423828125, -59.8798828125, -57.3359375, -54.7919921875, -52.248046875, -49.7041015625, -47.16015625, -44.6162109375, -42.072265625, -39.5283203125, -36.984375, -34.4404296875, -31.896484375, -29.3525390625, -26.80859375, -24.2646484375, -21.720703125, -19.1767578125, -16.6328125, -14.0888671875, -11.544921875, -9.0009765625, -6.45703125, -3.9130859375, -1.369140625, 1.1748046875, 3.71875, 6.2626953125, 8.806640625, 11.3505859375, 13.89453125, 16.4384765625, 18.982421875, 21.5263671875, 24.0703125, 26.6142578125, 29.158203125, 31.7021484375, 34.24609375, 36.7900390625, 39.333984375, 41.8779296875, 44.421875, 46.9658203125, 49.509765625, 52.0537109375, 54.59765625, 57.1416015625, 59.685546875, 62.2294921875, 64.7734375, 67.3173828125, 69.861328125, 72.4052734375, 74.94921875, 77.4931640625, 80.037109375, 82.5810546875, 85.125]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 4.0, 11.0, 12.0, 17.0, 20.0, 27.0, 35.0, 52.0, 60.0, 67.0, 80.0, 76.0, 76.0, 94.0, 71.0, 75.0, 50.0, 59.0, 40.0, 19.0, 17.0, 15.0, 8.0, 8.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3046875, -11.8997802734375, -11.494873046875, -11.0899658203125, -10.68505859375, -10.2801513671875, -9.875244140625, -9.4703369140625, -9.0654296875, -8.6605224609375, -8.255615234375, -7.8507080078125, -7.44580078125, -7.0408935546875, -6.635986328125, -6.2310791015625, -5.826171875, -5.4212646484375, -5.016357421875, -4.6114501953125, -4.20654296875, -3.8016357421875, -3.396728515625, -2.9918212890625, -2.5869140625, -2.1820068359375, -1.777099609375, -1.3721923828125, -0.96728515625, -0.5623779296875, -0.157470703125, 0.2474365234375, 0.65234375, 1.0572509765625, 1.462158203125, 1.8670654296875, 2.27197265625, 2.6768798828125, 3.081787109375, 3.4866943359375, 3.8916015625, 4.2965087890625, 4.701416015625, 5.1063232421875, 5.51123046875, 5.9161376953125, 6.321044921875, 6.7259521484375, 7.130859375, 7.5357666015625, 7.940673828125, 8.3455810546875, 8.75048828125, 9.1553955078125, 9.560302734375, 9.9652099609375, 10.3701171875, 10.7750244140625, 11.179931640625, 11.5848388671875, 11.98974609375, 12.3946533203125, 12.799560546875, 13.2044677734375, 13.609375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 6.0, 6.0, 2.0, 6.0, 9.0, 22.0, 16.0, 17.0, 29.0, 49.0, 73.0, 117.0, 180.0, 300.0, 472.0, 787.0, 1544.0, 3191.0, 7126.0, 18807.0, 60045.0, 295363.0, 3404103.0, 306150.0, 62156.0, 19570.0, 7567.0, 3191.0, 1583.0, 708.0, 426.0, 232.0, 163.0, 94.0, 52.0, 39.0, 33.0, 19.0, 17.0, 9.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-72.4375, -70.138671875, -67.83984375, -65.541015625, -63.2421875, -60.943359375, -58.64453125, -56.345703125, -54.046875, -51.748046875, -49.44921875, -47.150390625, -44.8515625, -42.552734375, -40.25390625, -37.955078125, -35.65625, -33.357421875, -31.05859375, -28.759765625, -26.4609375, -24.162109375, -21.86328125, -19.564453125, -17.265625, -14.966796875, -12.66796875, -10.369140625, -8.0703125, -5.771484375, -3.47265625, -1.173828125, 1.125, 3.423828125, 5.72265625, 8.021484375, 10.3203125, 12.619140625, 14.91796875, 17.216796875, 19.515625, 21.814453125, 24.11328125, 26.412109375, 28.7109375, 31.009765625, 33.30859375, 35.607421875, 37.90625, 40.205078125, 42.50390625, 44.802734375, 47.1015625, 49.400390625, 51.69921875, 53.998046875, 56.296875, 58.595703125, 60.89453125, 63.193359375, 65.4921875, 67.791015625, 70.08984375, 72.388671875, 74.6875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 7.0, 2.0, 4.0, 5.0, 8.0, 18.0, 14.0, 19.0, 31.0, 35.0, 54.0, 69.0, 125.0, 166.0, 362.0, 1605.0, 777.0, 288.0, 130.0, 85.0, 78.0, 47.0, 36.0, 25.0, 20.0, 19.0, 15.0, 11.0, 6.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.953125, -20.36865234375, -19.7841796875, -19.19970703125, -18.615234375, -18.03076171875, -17.4462890625, -16.86181640625, -16.27734375, -15.69287109375, -15.1083984375, -14.52392578125, -13.939453125, -13.35498046875, -12.7705078125, -12.18603515625, -11.6015625, -11.01708984375, -10.4326171875, -9.84814453125, -9.263671875, -8.67919921875, -8.0947265625, -7.51025390625, -6.92578125, -6.34130859375, -5.7568359375, -5.17236328125, -4.587890625, -4.00341796875, -3.4189453125, -2.83447265625, -2.25, -1.66552734375, -1.0810546875, -0.49658203125, 0.087890625, 0.67236328125, 1.2568359375, 1.84130859375, 2.42578125, 3.01025390625, 3.5947265625, 4.17919921875, 4.763671875, 5.34814453125, 5.9326171875, 6.51708984375, 7.1015625, 7.68603515625, 8.2705078125, 8.85498046875, 9.439453125, 10.02392578125, 10.6083984375, 11.19287109375, 11.77734375, 12.36181640625, 12.9462890625, 13.53076171875, 14.115234375, 14.69970703125, 15.2841796875, 15.86865234375, 16.453125]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 8.0, 11.0, 24.0, 42.0, 63.0, 103.0, 161.0, 177.0, 150.0, 107.0, 78.0, 34.0, 20.0, 14.0, 7.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-228.23052978515625, -222.45838928222656, -216.68624877929688, -210.9141082763672, -205.1419677734375, -199.36981201171875, -193.59767150878906, -187.82553100585938, -182.0533905029297, -176.28125, -170.5091094970703, -164.73696899414062, -158.96481323242188, -153.1926727294922, -147.4205322265625, -141.6483917236328, -135.87625122070312, -130.10411071777344, -124.33197021484375, -118.55982208251953, -112.78768157958984, -107.01554107666016, -101.24339294433594, -95.47125244140625, -89.69911193847656, -83.92697143554688, -78.15483093261719, -72.38268280029297, -66.61054229736328, -60.838401794433594, -55.06625747680664, -49.29411315917969, -43.52198791503906, -37.749847412109375, -31.977703094482422, -26.2055606842041, -20.43341827392578, -14.661275863647461, -8.88913345336914, -3.1169891357421875, 2.6551513671875, 8.42729377746582, 14.19943618774414, 19.97157859802246, 25.74372100830078, 31.5158634185791, 37.28800582885742, 43.060150146484375, 48.83229064941406, 54.60443115234375, 60.3765754699707, 66.14871978759766, 71.92086029052734, 77.69300079345703, 83.46514892578125, 89.23728942871094, 95.00942993164062, 100.78157043457031, 106.5537109375, 112.32585906982422, 118.0979995727539, 123.8701400756836, 129.6422882080078, 135.4144287109375, 141.1865692138672]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 4.0, 9.0, 12.0, 17.0, 20.0, 25.0, 26.0, 32.0, 41.0, 55.0, 77.0, 51.0, 59.0, 67.0, 57.0, 64.0, 47.0, 56.0, 48.0, 47.0, 38.0, 37.0, 29.0, 28.0, 15.0, 10.0, 8.0, 6.0, 5.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0], "bins": [-122.79973602294922, -119.90010070800781, -117.0004653930664, -114.100830078125, -111.2011947631836, -108.30155944824219, -105.40191650390625, -102.50228881835938, -99.60264587402344, -96.70301055908203, -93.80337524414062, -90.90373992919922, -88.00410461425781, -85.1044692993164, -82.204833984375, -79.30519104003906, -76.40556335449219, -73.50592803955078, -70.60629272460938, -67.70665740966797, -64.80702209472656, -61.907386779785156, -59.007747650146484, -56.10811233520508, -53.20847702026367, -50.308841705322266, -47.40920639038086, -44.50956726074219, -41.60993194580078, -38.710296630859375, -35.81066131591797, -32.91102600097656, -30.011383056640625, -27.11174774169922, -24.212112426757812, -21.312475204467773, -18.412839889526367, -15.513204574584961, -12.613567352294922, -9.713932037353516, -6.814296722412109, -3.914660930633545, -1.0150251388549805, 1.8846111297607422, 4.784246444702148, 7.683881759643555, 10.583518981933594, 13.483154296875, 16.382789611816406, 19.282424926757812, 22.18206024169922, 25.081697463989258, 27.981332778930664, 30.88096809387207, 33.78060531616211, 36.680240631103516, 39.57987594604492, 42.47951126098633, 45.379146575927734, 48.278785705566406, 51.17842102050781, 54.07805633544922, 56.977691650390625, 59.87732696533203, 62.77696228027344]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 6.0, 6.0, 6.0, 13.0, 16.0, 28.0, 49.0, 68.0, 137.0, 336.0, 574.0, 1166.0, 3016.0, 9219.0, 35143.0, 160700.0, 494270.0, 263090.0, 59265.0, 14059.0, 4234.0, 1607.0, 737.0, 339.0, 197.0, 98.0, 59.0, 45.0, 22.0, 22.0, 7.0, 9.0, 4.0, 1.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-98.0, -95.4658203125, -92.931640625, -90.3974609375, -87.86328125, -85.3291015625, -82.794921875, -80.2607421875, -77.7265625, -75.1923828125, -72.658203125, -70.1240234375, -67.58984375, -65.0556640625, -62.521484375, -59.9873046875, -57.453125, -54.9189453125, -52.384765625, -49.8505859375, -47.31640625, -44.7822265625, -42.248046875, -39.7138671875, -37.1796875, -34.6455078125, -32.111328125, -29.5771484375, -27.04296875, -24.5087890625, -21.974609375, -19.4404296875, -16.90625, -14.3720703125, -11.837890625, -9.3037109375, -6.76953125, -4.2353515625, -1.701171875, 0.8330078125, 3.3671875, 5.9013671875, 8.435546875, 10.9697265625, 13.50390625, 16.0380859375, 18.572265625, 21.1064453125, 23.640625, 26.1748046875, 28.708984375, 31.2431640625, 33.77734375, 36.3115234375, 38.845703125, 41.3798828125, 43.9140625, 46.4482421875, 48.982421875, 51.5166015625, 54.05078125, 56.5849609375, 59.119140625, 61.6533203125, 64.1875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 6.0, 7.0, 13.0, 16.0, 21.0, 25.0, 25.0, 36.0, 60.0, 78.0, 66.0, 69.0, 83.0, 71.0, 68.0, 94.0, 56.0, 55.0, 46.0, 32.0, 31.0, 12.0, 13.0, 8.0, 4.0, 3.0, 4.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.5234375, -12.10546875, -11.6875, -11.26953125, -10.8515625, -10.43359375, -10.015625, -9.59765625, -9.1796875, -8.76171875, -8.34375, -7.92578125, -7.5078125, -7.08984375, -6.671875, -6.25390625, -5.8359375, -5.41796875, -5.0, -4.58203125, -4.1640625, -3.74609375, -3.328125, -2.91015625, -2.4921875, -2.07421875, -1.65625, -1.23828125, -0.8203125, -0.40234375, 0.015625, 0.43359375, 0.8515625, 1.26953125, 1.6875, 2.10546875, 2.5234375, 2.94140625, 3.359375, 3.77734375, 4.1953125, 4.61328125, 5.03125, 5.44921875, 5.8671875, 6.28515625, 6.703125, 7.12109375, 7.5390625, 7.95703125, 8.375, 8.79296875, 9.2109375, 9.62890625, 10.046875, 10.46484375, 10.8828125, 11.30078125, 11.71875, 12.13671875, 12.5546875, 12.97265625, 13.390625, 13.80859375, 14.2265625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 4.0, 8.0, 14.0, 17.0, 24.0, 21.0, 51.0, 78.0, 82.0, 161.0, 207.0, 363.0, 623.0, 1075.0, 1888.0, 3700.0, 7770.0, 17844.0, 45003.0, 116883.0, 276752.0, 324156.0, 150577.0, 58819.0, 22941.0, 9601.0, 4374.0, 2334.0, 1204.0, 725.0, 460.0, 272.0, 163.0, 103.0, 76.0, 50.0, 42.0, 26.0, 25.0, 15.0, 6.0, 8.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-47.15625, -45.68896484375, -44.2216796875, -42.75439453125, -41.287109375, -39.81982421875, -38.3525390625, -36.88525390625, -35.41796875, -33.95068359375, -32.4833984375, -31.01611328125, -29.548828125, -28.08154296875, -26.6142578125, -25.14697265625, -23.6796875, -22.21240234375, -20.7451171875, -19.27783203125, -17.810546875, -16.34326171875, -14.8759765625, -13.40869140625, -11.94140625, -10.47412109375, -9.0068359375, -7.53955078125, -6.072265625, -4.60498046875, -3.1376953125, -1.67041015625, -0.203125, 1.26416015625, 2.7314453125, 4.19873046875, 5.666015625, 7.13330078125, 8.6005859375, 10.06787109375, 11.53515625, 13.00244140625, 14.4697265625, 15.93701171875, 17.404296875, 18.87158203125, 20.3388671875, 21.80615234375, 23.2734375, 24.74072265625, 26.2080078125, 27.67529296875, 29.142578125, 30.60986328125, 32.0771484375, 33.54443359375, 35.01171875, 36.47900390625, 37.9462890625, 39.41357421875, 40.880859375, 42.34814453125, 43.8154296875, 45.28271484375, 46.75]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 9.0, 8.0, 6.0, 9.0, 11.0, 12.0, 12.0, 18.0, 14.0, 19.0, 18.0, 23.0, 22.0, 28.0, 30.0, 34.0, 39.0, 35.0, 39.0, 37.0, 41.0, 42.0, 44.0, 42.0, 41.0, 32.0, 34.0, 37.0, 35.0, 28.0, 24.0, 30.0, 14.0, 20.0, 21.0, 17.0, 11.0, 13.0, 10.0, 20.0, 6.0, 4.0, 2.0, 3.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-34.1875, -33.08349609375, -31.9794921875, -30.87548828125, -29.771484375, -28.66748046875, -27.5634765625, -26.45947265625, -25.35546875, -24.25146484375, -23.1474609375, -22.04345703125, -20.939453125, -19.83544921875, -18.7314453125, -17.62744140625, -16.5234375, -15.41943359375, -14.3154296875, -13.21142578125, -12.107421875, -11.00341796875, -9.8994140625, -8.79541015625, -7.69140625, -6.58740234375, -5.4833984375, -4.37939453125, -3.275390625, -2.17138671875, -1.0673828125, 0.03662109375, 1.140625, 2.24462890625, 3.3486328125, 4.45263671875, 5.556640625, 6.66064453125, 7.7646484375, 8.86865234375, 9.97265625, 11.07666015625, 12.1806640625, 13.28466796875, 14.388671875, 15.49267578125, 16.5966796875, 17.70068359375, 18.8046875, 19.90869140625, 21.0126953125, 22.11669921875, 23.220703125, 24.32470703125, 25.4287109375, 26.53271484375, 27.63671875, 28.74072265625, 29.8447265625, 30.94873046875, 32.052734375, 33.15673828125, 34.2607421875, 35.36474609375, 36.46875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 4.0, 6.0, 17.0, 11.0, 24.0, 20.0, 32.0, 52.0, 70.0, 123.0, 155.0, 240.0, 408.0, 704.0, 1292.0, 2462.0, 4997.0, 11421.0, 29721.0, 91555.0, 320840.0, 395170.0, 124372.0, 37936.0, 14243.0, 6132.0, 2918.0, 1558.0, 839.0, 454.0, 265.0, 155.0, 132.0, 62.0, 59.0, 29.0, 20.0, 17.0, 9.0, 10.0, 10.0, 5.0, 2.0, 0.0, 5.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-30.171875, -29.312744140625, -28.45361328125, -27.594482421875, -26.7353515625, -25.876220703125, -25.01708984375, -24.157958984375, -23.298828125, -22.439697265625, -21.58056640625, -20.721435546875, -19.8623046875, -19.003173828125, -18.14404296875, -17.284912109375, -16.42578125, -15.566650390625, -14.70751953125, -13.848388671875, -12.9892578125, -12.130126953125, -11.27099609375, -10.411865234375, -9.552734375, -8.693603515625, -7.83447265625, -6.975341796875, -6.1162109375, -5.257080078125, -4.39794921875, -3.538818359375, -2.6796875, -1.820556640625, -0.96142578125, -0.102294921875, 0.7568359375, 1.615966796875, 2.47509765625, 3.334228515625, 4.193359375, 5.052490234375, 5.91162109375, 6.770751953125, 7.6298828125, 8.489013671875, 9.34814453125, 10.207275390625, 11.06640625, 11.925537109375, 12.78466796875, 13.643798828125, 14.5029296875, 15.362060546875, 16.22119140625, 17.080322265625, 17.939453125, 18.798583984375, 19.65771484375, 20.516845703125, 21.3759765625, 22.235107421875, 23.09423828125, 23.953369140625, 24.8125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 7.0, 9.0, 6.0, 12.0, 21.0, 33.0, 47.0, 88.0, 109.0, 198.0, 160.0, 106.0, 55.0, 38.0, 33.0, 17.0, 17.0, 11.0, 6.0, 7.0, 3.0, 3.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.008636474609375, -0.008365035057067871, -0.008093595504760742, -0.007822155952453613, -0.007550716400146484, -0.0072792768478393555, -0.0070078372955322266, -0.006736397743225098, -0.006464958190917969, -0.00619351863861084, -0.005922079086303711, -0.005650639533996582, -0.005379199981689453, -0.005107760429382324, -0.004836320877075195, -0.004564881324768066, -0.0042934417724609375, -0.004022002220153809, -0.0037505626678466797, -0.0034791231155395508, -0.003207683563232422, -0.002936244010925293, -0.002664804458618164, -0.002393364906311035, -0.0021219253540039062, -0.0018504858016967773, -0.0015790462493896484, -0.0013076066970825195, -0.0010361671447753906, -0.0007647275924682617, -0.0004932880401611328, -0.0002218484878540039, 4.9591064453125e-05, 0.0003210306167602539, 0.0005924701690673828, 0.0008639097213745117, 0.0011353492736816406, 0.0014067888259887695, 0.0016782283782958984, 0.0019496679306030273, 0.0022211074829101562, 0.002492547035217285, 0.002763986587524414, 0.003035426139831543, 0.003306865692138672, 0.0035783052444458008, 0.0038497447967529297, 0.004121184349060059, 0.0043926239013671875, 0.004664063453674316, 0.004935503005981445, 0.005206942558288574, 0.005478382110595703, 0.005749821662902832, 0.006021261215209961, 0.00629270076751709, 0.006564140319824219, 0.006835579872131348, 0.0071070194244384766, 0.0073784589767456055, 0.007649898529052734, 0.007921338081359863, 0.008192777633666992, 0.008464217185974121, 0.00873565673828125]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 0.0, 7.0, 7.0, 14.0, 19.0, 29.0, 32.0, 44.0, 69.0, 150.0, 236.0, 464.0, 875.0, 1876.0, 4782.0, 15040.0, 63458.0, 398389.0, 462287.0, 74416.0, 17092.0, 5148.0, 2030.0, 958.0, 469.0, 261.0, 136.0, 100.0, 54.0, 34.0, 22.0, 12.0, 12.0, 8.0, 13.0, 1.0, 8.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-41.875, -40.568359375, -39.26171875, -37.955078125, -36.6484375, -35.341796875, -34.03515625, -32.728515625, -31.421875, -30.115234375, -28.80859375, -27.501953125, -26.1953125, -24.888671875, -23.58203125, -22.275390625, -20.96875, -19.662109375, -18.35546875, -17.048828125, -15.7421875, -14.435546875, -13.12890625, -11.822265625, -10.515625, -9.208984375, -7.90234375, -6.595703125, -5.2890625, -3.982421875, -2.67578125, -1.369140625, -0.0625, 1.244140625, 2.55078125, 3.857421875, 5.1640625, 6.470703125, 7.77734375, 9.083984375, 10.390625, 11.697265625, 13.00390625, 14.310546875, 15.6171875, 16.923828125, 18.23046875, 19.537109375, 20.84375, 22.150390625, 23.45703125, 24.763671875, 26.0703125, 27.376953125, 28.68359375, 29.990234375, 31.296875, 32.603515625, 33.91015625, 35.216796875, 36.5234375, 37.830078125, 39.13671875, 40.443359375, 41.75]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 4.0, 4.0, 6.0, 3.0, 9.0, 13.0, 20.0, 16.0, 21.0, 23.0, 31.0, 57.0, 72.0, 83.0, 75.0, 99.0, 84.0, 80.0, 63.0, 53.0, 50.0, 39.0, 21.0, 20.0, 20.0, 11.0, 7.0, 12.0, 4.0, 0.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.53125, -18.76806640625, -18.0048828125, -17.24169921875, -16.478515625, -15.71533203125, -14.9521484375, -14.18896484375, -13.42578125, -12.66259765625, -11.8994140625, -11.13623046875, -10.373046875, -9.60986328125, -8.8466796875, -8.08349609375, -7.3203125, -6.55712890625, -5.7939453125, -5.03076171875, -4.267578125, -3.50439453125, -2.7412109375, -1.97802734375, -1.21484375, -0.45166015625, 0.3115234375, 1.07470703125, 1.837890625, 2.60107421875, 3.3642578125, 4.12744140625, 4.890625, 5.65380859375, 6.4169921875, 7.18017578125, 7.943359375, 8.70654296875, 9.4697265625, 10.23291015625, 10.99609375, 11.75927734375, 12.5224609375, 13.28564453125, 14.048828125, 14.81201171875, 15.5751953125, 16.33837890625, 17.1015625, 17.86474609375, 18.6279296875, 19.39111328125, 20.154296875, 20.91748046875, 21.6806640625, 22.44384765625, 23.20703125, 23.97021484375, 24.7333984375, 25.49658203125, 26.259765625, 27.02294921875, 27.7861328125, 28.54931640625, 29.3125]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 3.0, 6.0, 9.0, 6.0, 16.0, 25.0, 31.0, 49.0, 73.0, 87.0, 97.0, 98.0, 106.0, 95.0, 66.0, 68.0, 47.0, 32.0, 33.0, 23.0, 11.0, 5.0, 5.0, 5.0, 2.0, 1.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-264.46893310546875, -254.33636474609375, -244.20379638671875, -234.07122802734375, -223.9386444091797, -213.8060760498047, -203.6735076904297, -193.54092407226562, -183.40835571289062, -173.27578735351562, -163.14321899414062, -153.01065063476562, -142.87806701660156, -132.74549865722656, -122.61293029785156, -112.48035430908203, -102.34779357910156, -92.21522521972656, -82.08264923095703, -71.95008087158203, -61.817508697509766, -51.6849365234375, -41.5523681640625, -31.41979217529297, -21.28722381591797, -11.15465259552002, -1.0220813751220703, 9.110488891601562, 19.243061065673828, 29.375633239746094, 39.508201599121094, 49.640777587890625, 59.773345947265625, 69.90591430664062, 80.03849029541016, 90.17105865478516, 100.30363464355469, 110.43620300292969, 120.56877136230469, 130.70135498046875, 140.83392333984375, 150.96649169921875, 161.09906005859375, 171.23162841796875, 181.3642120361328, 191.4967803955078, 201.6293487548828, 211.76193237304688, 221.8944854736328, 232.0270538330078, 242.1596221923828, 252.29220581054688, 262.4247741699219, 272.5573425292969, 282.6899108886719, 292.8224792480469, 302.9550476074219, 313.0876159667969, 323.2201843261719, 333.3527526855469, 343.4853210449219, 353.617919921875, 363.75048828125, 373.883056640625, 384.015625]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 8.0, 6.0, 1.0, 13.0, 13.0, 28.0, 19.0, 46.0, 46.0, 59.0, 51.0, 68.0, 63.0, 77.0, 84.0, 75.0, 68.0, 52.0, 46.0, 48.0, 33.0, 31.0, 20.0, 19.0, 11.0, 10.0, 6.0, 8.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-356.84967041015625, -345.3248291015625, -333.7999572753906, -322.2751159667969, -310.7502746582031, -299.22540283203125, -287.7005615234375, -276.17572021484375, -264.65087890625, -253.1260223388672, -241.60118103027344, -230.07632446289062, -218.55148315429688, -207.02662658691406, -195.50177001953125, -183.9769287109375, -172.45205688476562, -160.9272003173828, -149.40235900878906, -137.87750244140625, -126.35265350341797, -114.82780456542969, -103.30294799804688, -91.7780990600586, -80.25325012207031, -68.72840118408203, -57.203548431396484, -45.67869567871094, -34.153846740722656, -22.628997802734375, -11.104141235351562, 0.42070770263671875, 11.945556640625, 23.470407485961914, 34.99525833129883, 46.520111083984375, 58.044960021972656, 69.56980895996094, 81.09466552734375, 92.61951446533203, 104.14436340332031, 115.6692123413086, 127.19406127929688, 138.7189178466797, 150.2437744140625, 161.76861572265625, 173.29347229003906, 184.81832885742188, 196.34317016601562, 207.86802673339844, 219.3928680419922, 230.917724609375, 242.44256591796875, 253.96742248535156, 265.4922790527344, 277.0171203613281, 288.5419921875, 300.06683349609375, 311.5917053222656, 323.1165466308594, 334.6413879394531, 346.166259765625, 357.69110107421875, 369.2159423828125, 380.74078369140625]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 5.0, 4.0, 12.0, 14.0, 29.0, 48.0, 72.0, 120.0, 177.0, 273.0, 482.0, 891.0, 1901.0, 3857.0, 8835.0, 24121.0, 85960.0, 708885.0, 3160391.0, 142277.0, 34439.0, 11656.0, 4742.0, 2234.0, 1109.0, 617.0, 406.0, 217.0, 126.0, 104.0, 55.0, 58.0, 37.0, 35.0, 24.0, 22.0, 7.0, 8.0, 9.0, 6.0, 6.0, 5.0, 2.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.375, -65.857421875, -63.33984375, -60.822265625, -58.3046875, -55.787109375, -53.26953125, -50.751953125, -48.234375, -45.716796875, -43.19921875, -40.681640625, -38.1640625, -35.646484375, -33.12890625, -30.611328125, -28.09375, -25.576171875, -23.05859375, -20.541015625, -18.0234375, -15.505859375, -12.98828125, -10.470703125, -7.953125, -5.435546875, -2.91796875, -0.400390625, 2.1171875, 4.634765625, 7.15234375, 9.669921875, 12.1875, 14.705078125, 17.22265625, 19.740234375, 22.2578125, 24.775390625, 27.29296875, 29.810546875, 32.328125, 34.845703125, 37.36328125, 39.880859375, 42.3984375, 44.916015625, 47.43359375, 49.951171875, 52.46875, 54.986328125, 57.50390625, 60.021484375, 62.5390625, 65.056640625, 67.57421875, 70.091796875, 72.609375, 75.126953125, 77.64453125, 80.162109375, 82.6796875, 85.197265625, 87.71484375, 90.232421875, 92.75]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 4.0, 6.0, 9.0, 14.0, 26.0, 27.0, 40.0, 47.0, 53.0, 82.0, 80.0, 81.0, 81.0, 83.0, 87.0, 73.0, 54.0, 46.0, 35.0, 22.0, 21.0, 13.0, 6.0, 7.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.5546875, -12.0955810546875, -11.636474609375, -11.1773681640625, -10.71826171875, -10.2591552734375, -9.800048828125, -9.3409423828125, -8.8818359375, -8.4227294921875, -7.963623046875, -7.5045166015625, -7.04541015625, -6.5863037109375, -6.127197265625, -5.6680908203125, -5.208984375, -4.7498779296875, -4.290771484375, -3.8316650390625, -3.37255859375, -2.9134521484375, -2.454345703125, -1.9952392578125, -1.5361328125, -1.0770263671875, -0.617919921875, -0.1588134765625, 0.30029296875, 0.7593994140625, 1.218505859375, 1.6776123046875, 2.13671875, 2.5958251953125, 3.054931640625, 3.5140380859375, 3.97314453125, 4.4322509765625, 4.891357421875, 5.3504638671875, 5.8095703125, 6.2686767578125, 6.727783203125, 7.1868896484375, 7.64599609375, 8.1051025390625, 8.564208984375, 9.0233154296875, 9.482421875, 9.9415283203125, 10.400634765625, 10.8597412109375, 11.31884765625, 11.7779541015625, 12.237060546875, 12.6961669921875, 13.1552734375, 13.6143798828125, 14.073486328125, 14.5325927734375, 14.99169921875, 15.4508056640625, 15.909912109375, 16.3690185546875, 16.828125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 2.0, 7.0, 8.0, 11.0, 15.0, 30.0, 33.0, 64.0, 72.0, 127.0, 202.0, 353.0, 643.0, 1185.0, 2513.0, 5722.0, 15314.0, 52460.0, 322305.0, 3399826.0, 313633.0, 52701.0, 15748.0, 5763.0, 2514.0, 1247.0, 681.0, 402.0, 250.0, 164.0, 111.0, 61.0, 37.0, 21.0, 19.0, 11.0, 9.0, 11.0, 2.0, 3.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-78.5, -75.64453125, -72.7890625, -69.93359375, -67.078125, -64.22265625, -61.3671875, -58.51171875, -55.65625, -52.80078125, -49.9453125, -47.08984375, -44.234375, -41.37890625, -38.5234375, -35.66796875, -32.8125, -29.95703125, -27.1015625, -24.24609375, -21.390625, -18.53515625, -15.6796875, -12.82421875, -9.96875, -7.11328125, -4.2578125, -1.40234375, 1.453125, 4.30859375, 7.1640625, 10.01953125, 12.875, 15.73046875, 18.5859375, 21.44140625, 24.296875, 27.15234375, 30.0078125, 32.86328125, 35.71875, 38.57421875, 41.4296875, 44.28515625, 47.140625, 49.99609375, 52.8515625, 55.70703125, 58.5625, 61.41796875, 64.2734375, 67.12890625, 69.984375, 72.83984375, 75.6953125, 78.55078125, 81.40625, 84.26171875, 87.1171875, 89.97265625, 92.828125, 95.68359375, 98.5390625, 101.39453125, 104.25]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 4.0, 5.0, 8.0, 10.0, 27.0, 23.0, 38.0, 51.0, 117.0, 190.0, 397.0, 1340.0, 999.0, 360.0, 194.0, 103.0, 68.0, 36.0, 33.0, 21.0, 9.0, 18.0, 6.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-37.09375, -35.853515625, -34.61328125, -33.373046875, -32.1328125, -30.892578125, -29.65234375, -28.412109375, -27.171875, -25.931640625, -24.69140625, -23.451171875, -22.2109375, -20.970703125, -19.73046875, -18.490234375, -17.25, -16.009765625, -14.76953125, -13.529296875, -12.2890625, -11.048828125, -9.80859375, -8.568359375, -7.328125, -6.087890625, -4.84765625, -3.607421875, -2.3671875, -1.126953125, 0.11328125, 1.353515625, 2.59375, 3.833984375, 5.07421875, 6.314453125, 7.5546875, 8.794921875, 10.03515625, 11.275390625, 12.515625, 13.755859375, 14.99609375, 16.236328125, 17.4765625, 18.716796875, 19.95703125, 21.197265625, 22.4375, 23.677734375, 24.91796875, 26.158203125, 27.3984375, 28.638671875, 29.87890625, 31.119140625, 32.359375, 33.599609375, 34.83984375, 36.080078125, 37.3203125, 38.560546875, 39.80078125, 41.041015625, 42.28125]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 0.0, 3.0, 2.0, 1.0, 8.0, 8.0, 14.0, 20.0, 34.0, 71.0, 98.0, 132.0, 142.0, 133.0, 111.0, 73.0, 56.0, 39.0, 19.0, 10.0, 10.0, 13.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-175.38735961914062, -167.56399536132812, -159.7406463623047, -151.9172821044922, -144.09393310546875, -136.27056884765625, -128.44720458984375, -120.62384796142578, -112.80049133300781, -104.97713470458984, -97.15377807617188, -89.33041381835938, -81.5070571899414, -73.68370056152344, -65.86033630371094, -58.03697967529297, -50.213623046875, -42.39026641845703, -34.5669059753418, -26.743547439575195, -18.920188903808594, -11.096832275390625, -3.2734718322753906, 4.549888610839844, 12.373245239257812, 20.196603775024414, 28.019962310791016, 35.84332275390625, 43.66667938232422, 51.49003601074219, 59.31339645385742, 67.13675689697266, 74.96011352539062, 82.7834701538086, 90.60682678222656, 98.43019104003906, 106.25354766845703, 114.076904296875, 121.9002685546875, 129.7236328125, 137.54698181152344, 145.37034606933594, 153.19369506835938, 161.01705932617188, 168.84042358398438, 176.6637725830078, 184.4871368408203, 192.31048583984375, 200.13385009765625, 207.95721435546875, 215.7805633544922, 223.6039276123047, 231.42727661132812, 239.25064086914062, 247.07400512695312, 254.89736938476562, 262.720703125, 270.5440673828125, 278.367431640625, 286.1907653808594, 294.0141296386719, 301.8374938964844, 309.6608581542969, 317.4842224121094, 325.3075866699219]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 3.0, 6.0, 6.0, 10.0, 16.0, 19.0, 21.0, 41.0, 38.0, 49.0, 46.0, 52.0, 62.0, 56.0, 62.0, 60.0, 62.0, 62.0, 64.0, 48.0, 38.0, 37.0, 33.0, 31.0, 19.0, 16.0, 14.0, 14.0, 2.0, 2.0, 6.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0], "bins": [-201.68508911132812, -196.15420532226562, -190.62332153320312, -185.09243774414062, -179.56155395507812, -174.03067016601562, -168.49978637695312, -162.96890258789062, -157.43801879882812, -151.90713500976562, -146.37625122070312, -140.84536743164062, -135.31448364257812, -129.78359985351562, -124.2527084350586, -118.7218246459961, -113.19093322753906, -107.66004943847656, -102.12916564941406, -96.59828186035156, -91.06739807128906, -85.53651428222656, -80.00562286376953, -74.47473907470703, -68.94385528564453, -63.41297149658203, -57.88208770751953, -52.351200103759766, -46.820316314697266, -41.289432525634766, -35.758544921875, -30.2276611328125, -24.69677734375, -19.1658935546875, -13.635007858276367, -8.104122161865234, -2.5732383728027344, 2.9576454162597656, 8.488533020019531, 14.019416809082031, 19.55030059814453, 25.08118438720703, 30.612070083618164, 36.1429557800293, 41.6738395690918, 47.2047233581543, 52.73561096191406, 58.26649475097656, 63.79737854003906, 69.32826232910156, 74.85914611816406, 80.39002990722656, 85.92091369628906, 91.45179748535156, 96.9826889038086, 102.5135726928711, 108.0444564819336, 113.5753402709961, 119.1062240600586, 124.63711547851562, 130.16799926757812, 135.69888305664062, 141.22976684570312, 146.76065063476562, 152.29153442382812]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 6.0, 4.0, 9.0, 14.0, 29.0, 47.0, 89.0, 148.0, 326.0, 652.0, 1692.0, 5453.0, 29972.0, 230994.0, 651697.0, 106409.0, 15386.0, 3387.0, 1159.0, 508.0, 281.0, 135.0, 69.0, 35.0, 27.0, 11.0, 9.0, 4.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-169.5, -165.2958984375, -161.091796875, -156.8876953125, -152.68359375, -148.4794921875, -144.275390625, -140.0712890625, -135.8671875, -131.6630859375, -127.458984375, -123.2548828125, -119.05078125, -114.8466796875, -110.642578125, -106.4384765625, -102.234375, -98.0302734375, -93.826171875, -89.6220703125, -85.41796875, -81.2138671875, -77.009765625, -72.8056640625, -68.6015625, -64.3974609375, -60.193359375, -55.9892578125, -51.78515625, -47.5810546875, -43.376953125, -39.1728515625, -34.96875, -30.7646484375, -26.560546875, -22.3564453125, -18.15234375, -13.9482421875, -9.744140625, -5.5400390625, -1.3359375, 2.8681640625, 7.072265625, 11.2763671875, 15.48046875, 19.6845703125, 23.888671875, 28.0927734375, 32.296875, 36.5009765625, 40.705078125, 44.9091796875, 49.11328125, 53.3173828125, 57.521484375, 61.7255859375, 65.9296875, 70.1337890625, 74.337890625, 78.5419921875, 82.74609375, 86.9501953125, 91.154296875, 95.3583984375, 99.5625]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 3.0, 5.0, 2.0, 11.0, 16.0, 21.0, 32.0, 52.0, 50.0, 56.0, 66.0, 81.0, 78.0, 68.0, 83.0, 65.0, 65.0, 55.0, 57.0, 29.0, 32.0, 25.0, 15.0, 10.0, 12.0, 2.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6171875, -10.1651611328125, -9.713134765625, -9.2611083984375, -8.80908203125, -8.3570556640625, -7.905029296875, -7.4530029296875, -7.0009765625, -6.5489501953125, -6.096923828125, -5.6448974609375, -5.19287109375, -4.7408447265625, -4.288818359375, -3.8367919921875, -3.384765625, -2.9327392578125, -2.480712890625, -2.0286865234375, -1.57666015625, -1.1246337890625, -0.672607421875, -0.2205810546875, 0.2314453125, 0.6834716796875, 1.135498046875, 1.5875244140625, 2.03955078125, 2.4915771484375, 2.943603515625, 3.3956298828125, 3.84765625, 4.2996826171875, 4.751708984375, 5.2037353515625, 5.65576171875, 6.1077880859375, 6.559814453125, 7.0118408203125, 7.4638671875, 7.9158935546875, 8.367919921875, 8.8199462890625, 9.27197265625, 9.7239990234375, 10.176025390625, 10.6280517578125, 11.080078125, 11.5321044921875, 11.984130859375, 12.4361572265625, 12.88818359375, 13.3402099609375, 13.792236328125, 14.2442626953125, 14.6962890625, 15.1483154296875, 15.600341796875, 16.0523681640625, 16.50439453125, 16.9564208984375, 17.408447265625, 17.8604736328125, 18.3125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 10.0, 15.0, 14.0, 12.0, 23.0, 24.0, 30.0, 58.0, 82.0, 107.0, 165.0, 224.0, 328.0, 476.0, 721.0, 1316.0, 2208.0, 3942.0, 7620.0, 14937.0, 30093.0, 63343.0, 132477.0, 261708.0, 265181.0, 134532.0, 64806.0, 30955.0, 15277.0, 7821.0, 4123.0, 2263.0, 1335.0, 800.0, 474.0, 317.0, 218.0, 155.0, 93.0, 73.0, 55.0, 31.0, 30.0, 21.0, 17.0, 11.0, 9.0, 6.0, 8.0, 7.0, 2.0, 4.0, 3.0, 2.0], "bins": [-37.28125, -36.18505859375, -35.0888671875, -33.99267578125, -32.896484375, -31.80029296875, -30.7041015625, -29.60791015625, -28.51171875, -27.41552734375, -26.3193359375, -25.22314453125, -24.126953125, -23.03076171875, -21.9345703125, -20.83837890625, -19.7421875, -18.64599609375, -17.5498046875, -16.45361328125, -15.357421875, -14.26123046875, -13.1650390625, -12.06884765625, -10.97265625, -9.87646484375, -8.7802734375, -7.68408203125, -6.587890625, -5.49169921875, -4.3955078125, -3.29931640625, -2.203125, -1.10693359375, -0.0107421875, 1.08544921875, 2.181640625, 3.27783203125, 4.3740234375, 5.47021484375, 6.56640625, 7.66259765625, 8.7587890625, 9.85498046875, 10.951171875, 12.04736328125, 13.1435546875, 14.23974609375, 15.3359375, 16.43212890625, 17.5283203125, 18.62451171875, 19.720703125, 20.81689453125, 21.9130859375, 23.00927734375, 24.10546875, 25.20166015625, 26.2978515625, 27.39404296875, 28.490234375, 29.58642578125, 30.6826171875, 31.77880859375, 32.875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 6.0, 7.0, 4.0, 3.0, 8.0, 7.0, 11.0, 12.0, 15.0, 22.0, 25.0, 26.0, 18.0, 42.0, 43.0, 38.0, 45.0, 43.0, 39.0, 36.0, 38.0, 33.0, 51.0, 50.0, 48.0, 37.0, 35.0, 36.0, 37.0, 25.0, 31.0, 31.0, 29.0, 15.0, 11.0, 14.0, 10.0, 6.0, 7.0, 4.0, 5.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-41.875, -40.63427734375, -39.3935546875, -38.15283203125, -36.912109375, -35.67138671875, -34.4306640625, -33.18994140625, -31.94921875, -30.70849609375, -29.4677734375, -28.22705078125, -26.986328125, -25.74560546875, -24.5048828125, -23.26416015625, -22.0234375, -20.78271484375, -19.5419921875, -18.30126953125, -17.060546875, -15.81982421875, -14.5791015625, -13.33837890625, -12.09765625, -10.85693359375, -9.6162109375, -8.37548828125, -7.134765625, -5.89404296875, -4.6533203125, -3.41259765625, -2.171875, -0.93115234375, 0.3095703125, 1.55029296875, 2.791015625, 4.03173828125, 5.2724609375, 6.51318359375, 7.75390625, 8.99462890625, 10.2353515625, 11.47607421875, 12.716796875, 13.95751953125, 15.1982421875, 16.43896484375, 17.6796875, 18.92041015625, 20.1611328125, 21.40185546875, 22.642578125, 23.88330078125, 25.1240234375, 26.36474609375, 27.60546875, 28.84619140625, 30.0869140625, 31.32763671875, 32.568359375, 33.80908203125, 35.0498046875, 36.29052734375, 37.53125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 13.0, 14.0, 12.0, 23.0, 30.0, 48.0, 69.0, 121.0, 135.0, 273.0, 506.0, 924.0, 2026.0, 4960.0, 13445.0, 48104.0, 278082.0, 571157.0, 93027.0, 22299.0, 7477.0, 2910.0, 1368.0, 685.0, 322.0, 193.0, 133.0, 63.0, 56.0, 31.0, 17.0, 10.0, 7.0, 4.0, 7.0, 8.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-55.8125, -54.0244140625, -52.236328125, -50.4482421875, -48.66015625, -46.8720703125, -45.083984375, -43.2958984375, -41.5078125, -39.7197265625, -37.931640625, -36.1435546875, -34.35546875, -32.5673828125, -30.779296875, -28.9912109375, -27.203125, -25.4150390625, -23.626953125, -21.8388671875, -20.05078125, -18.2626953125, -16.474609375, -14.6865234375, -12.8984375, -11.1103515625, -9.322265625, -7.5341796875, -5.74609375, -3.9580078125, -2.169921875, -0.3818359375, 1.40625, 3.1943359375, 4.982421875, 6.7705078125, 8.55859375, 10.3466796875, 12.134765625, 13.9228515625, 15.7109375, 17.4990234375, 19.287109375, 21.0751953125, 22.86328125, 24.6513671875, 26.439453125, 28.2275390625, 30.015625, 31.8037109375, 33.591796875, 35.3798828125, 37.16796875, 38.9560546875, 40.744140625, 42.5322265625, 44.3203125, 46.1083984375, 47.896484375, 49.6845703125, 51.47265625, 53.2607421875, 55.048828125, 56.8369140625, 58.625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 0.0, 7.0, 8.0, 7.0, 12.0, 22.0, 27.0, 34.0, 55.0, 92.0, 188.0, 248.0, 108.0, 57.0, 50.0, 20.0, 20.0, 17.0, 12.0, 6.0, 6.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0062408447265625, -0.005876779556274414, -0.005512714385986328, -0.005148649215698242, -0.004784584045410156, -0.00442051887512207, -0.004056453704833984, -0.0036923885345458984, -0.0033283233642578125, -0.0029642581939697266, -0.0026001930236816406, -0.0022361278533935547, -0.0018720626831054688, -0.0015079975128173828, -0.0011439323425292969, -0.0007798671722412109, -0.000415802001953125, -5.173683166503906e-05, 0.0003123283386230469, 0.0006763935089111328, 0.0010404586791992188, 0.0014045238494873047, 0.0017685890197753906, 0.0021326541900634766, 0.0024967193603515625, 0.0028607845306396484, 0.0032248497009277344, 0.0035889148712158203, 0.003952980041503906, 0.004317045211791992, 0.004681110382080078, 0.005045175552368164, 0.00540924072265625, 0.005773305892944336, 0.006137371063232422, 0.006501436233520508, 0.006865501403808594, 0.00722956657409668, 0.007593631744384766, 0.007957696914672852, 0.008321762084960938, 0.008685827255249023, 0.00904989242553711, 0.009413957595825195, 0.009778022766113281, 0.010142087936401367, 0.010506153106689453, 0.010870218276977539, 0.011234283447265625, 0.011598348617553711, 0.011962413787841797, 0.012326478958129883, 0.012690544128417969, 0.013054609298706055, 0.01341867446899414, 0.013782739639282227, 0.014146804809570312, 0.014510869979858398, 0.014874935150146484, 0.01523900032043457, 0.015603065490722656, 0.015967130661010742, 0.016331195831298828, 0.016695261001586914, 0.017059326171875]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 6.0, 2.0, 2.0, 12.0, 18.0, 21.0, 28.0, 43.0, 69.0, 125.0, 226.0, 338.0, 603.0, 1147.0, 2298.0, 5349.0, 13661.0, 41133.0, 172730.0, 586759.0, 161669.0, 39270.0, 13053.0, 5211.0, 2258.0, 1111.0, 572.0, 307.0, 180.0, 111.0, 78.0, 48.0, 33.0, 33.0, 18.0, 10.0, 8.0, 6.0, 3.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.5, -45.02294921875, -43.5458984375, -42.06884765625, -40.591796875, -39.11474609375, -37.6376953125, -36.16064453125, -34.68359375, -33.20654296875, -31.7294921875, -30.25244140625, -28.775390625, -27.29833984375, -25.8212890625, -24.34423828125, -22.8671875, -21.39013671875, -19.9130859375, -18.43603515625, -16.958984375, -15.48193359375, -14.0048828125, -12.52783203125, -11.05078125, -9.57373046875, -8.0966796875, -6.61962890625, -5.142578125, -3.66552734375, -2.1884765625, -0.71142578125, 0.765625, 2.24267578125, 3.7197265625, 5.19677734375, 6.673828125, 8.15087890625, 9.6279296875, 11.10498046875, 12.58203125, 14.05908203125, 15.5361328125, 17.01318359375, 18.490234375, 19.96728515625, 21.4443359375, 22.92138671875, 24.3984375, 25.87548828125, 27.3525390625, 28.82958984375, 30.306640625, 31.78369140625, 33.2607421875, 34.73779296875, 36.21484375, 37.69189453125, 39.1689453125, 40.64599609375, 42.123046875, 43.60009765625, 45.0771484375, 46.55419921875, 48.03125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 3.0, 5.0, 6.0, 5.0, 9.0, 6.0, 8.0, 20.0, 20.0, 15.0, 27.0, 31.0, 45.0, 40.0, 61.0, 75.0, 87.0, 107.0, 91.0, 67.0, 45.0, 48.0, 27.0, 30.0, 17.0, 23.0, 12.0, 13.0, 14.0, 10.0, 12.0, 4.0, 4.0, 3.0, 4.0, 4.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.09375, -20.255859375, -19.41796875, -18.580078125, -17.7421875, -16.904296875, -16.06640625, -15.228515625, -14.390625, -13.552734375, -12.71484375, -11.876953125, -11.0390625, -10.201171875, -9.36328125, -8.525390625, -7.6875, -6.849609375, -6.01171875, -5.173828125, -4.3359375, -3.498046875, -2.66015625, -1.822265625, -0.984375, -0.146484375, 0.69140625, 1.529296875, 2.3671875, 3.205078125, 4.04296875, 4.880859375, 5.71875, 6.556640625, 7.39453125, 8.232421875, 9.0703125, 9.908203125, 10.74609375, 11.583984375, 12.421875, 13.259765625, 14.09765625, 14.935546875, 15.7734375, 16.611328125, 17.44921875, 18.287109375, 19.125, 19.962890625, 20.80078125, 21.638671875, 22.4765625, 23.314453125, 24.15234375, 24.990234375, 25.828125, 26.666015625, 27.50390625, 28.341796875, 29.1796875, 30.017578125, 30.85546875, 31.693359375, 32.53125]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 6.0, 17.0, 14.0, 51.0, 86.0, 163.0, 182.0, 187.0, 132.0, 79.0, 42.0, 19.0, 9.0, 10.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-388.23504638671875, -367.2371826171875, -346.2392883300781, -325.24139404296875, -304.2435302734375, -283.24566650390625, -262.2477722167969, -241.24989318847656, -220.25201416015625, -199.25413513183594, -178.25625610351562, -157.2583770751953, -136.260498046875, -115.26261901855469, -94.26473999023438, -73.26686096191406, -52.26898193359375, -31.271102905273438, -10.273223876953125, 10.724655151367188, 31.7225341796875, 52.72041320800781, 73.71829223632812, 94.71617126464844, 115.71405029296875, 136.71192932128906, 157.70980834960938, 178.7076873779297, 199.70556640625, 220.7034454345703, 241.70132446289062, 262.69921875, 283.697021484375, 304.69488525390625, 325.6927795410156, 346.690673828125, 367.68853759765625, 388.6864013671875, 409.6842956542969, 430.68218994140625, 451.6800537109375, 472.67791748046875, 493.6758117675781, 514.6737060546875, 535.6715698242188, 556.66943359375, 577.6673583984375, 598.6652221679688, 619.6630859375, 640.6609497070312, 661.6588134765625, 682.65673828125, 703.6546020507812, 724.6524658203125, 745.650390625, 766.6482543945312, 787.6461181640625, 808.6439819335938, 829.641845703125, 850.6397705078125, 871.6376342773438, 892.635498046875, 913.6334228515625, 934.6312866210938, 955.629150390625]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 2.0, 4.0, 2.0, 6.0, 8.0, 18.0, 33.0, 50.0, 59.0, 76.0, 101.0, 101.0, 97.0, 87.0, 99.0, 75.0, 53.0, 42.0, 36.0, 23.0, 18.0, 10.0, 9.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-325.04083251953125, -309.2027587890625, -293.3647155761719, -277.5266418457031, -261.6885681152344, -245.8505096435547, -230.012451171875, -214.17437744140625, -198.3363037109375, -182.4982452392578, -166.66017150878906, -150.82211303710938, -134.98403930664062, -119.14598083496094, -103.30791473388672, -87.4698486328125, -71.63179016113281, -55.793724060058594, -39.955657958984375, -24.117595672607422, -8.279529571533203, 7.55853271484375, 23.39659881591797, 39.23466491699219, 55.072731018066406, 70.91079711914062, 86.74886322021484, 102.58692932128906, 118.42498779296875, 134.2630615234375, 150.1011199951172, 165.93917846679688, 181.77725219726562, 197.6153106689453, 213.45338439941406, 229.29144287109375, 245.1295166015625, 260.96759033203125, 276.8056335449219, 292.6437072753906, 308.4817810058594, 324.3198547363281, 340.15789794921875, 355.9959716796875, 371.83404541015625, 387.672119140625, 403.5101623535156, 419.3482360839844, 435.186279296875, 451.02435302734375, 466.8623962402344, 482.7004699707031, 498.5385437011719, 514.3765869140625, 530.2146606445312, 546.052734375, 561.8908081054688, 577.7288818359375, 593.5669555664062, 609.405029296875, 625.2430419921875, 641.0811157226562, 656.919189453125, 672.7572631835938, 688.5953369140625]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 6.0, 7.0, 6.0, 14.0, 14.0, 29.0, 58.0, 92.0, 193.0, 355.0, 743.0, 1845.0, 6172.0, 27288.0, 459644.0, 3640063.0, 44532.0, 8463.0, 2583.0, 991.0, 466.0, 250.0, 150.0, 94.0, 58.0, 46.0, 29.0, 22.0, 10.0, 17.0, 10.0, 9.0, 11.0, 7.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-104.5625, -100.0419921875, -95.521484375, -91.0009765625, -86.48046875, -81.9599609375, -77.439453125, -72.9189453125, -68.3984375, -63.8779296875, -59.357421875, -54.8369140625, -50.31640625, -45.7958984375, -41.275390625, -36.7548828125, -32.234375, -27.7138671875, -23.193359375, -18.6728515625, -14.15234375, -9.6318359375, -5.111328125, -0.5908203125, 3.9296875, 8.4501953125, 12.970703125, 17.4912109375, 22.01171875, 26.5322265625, 31.052734375, 35.5732421875, 40.09375, 44.6142578125, 49.134765625, 53.6552734375, 58.17578125, 62.6962890625, 67.216796875, 71.7373046875, 76.2578125, 80.7783203125, 85.298828125, 89.8193359375, 94.33984375, 98.8603515625, 103.380859375, 107.9013671875, 112.421875, 116.9423828125, 121.462890625, 125.9833984375, 130.50390625, 135.0244140625, 139.544921875, 144.0654296875, 148.5859375, 153.1064453125, 157.626953125, 162.1474609375, 166.66796875, 171.1884765625, 175.708984375, 180.2294921875, 184.75]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 7.0, 11.0, 20.0, 17.0, 35.0, 48.0, 54.0, 91.0, 100.0, 86.0, 99.0, 111.0, 87.0, 78.0, 52.0, 41.0, 30.0, 20.0, 10.0, 3.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.6953125, -11.0587158203125, -10.422119140625, -9.7855224609375, -9.14892578125, -8.5123291015625, -7.875732421875, -7.2391357421875, -6.6025390625, -5.9659423828125, -5.329345703125, -4.6927490234375, -4.05615234375, -3.4195556640625, -2.782958984375, -2.1463623046875, -1.509765625, -0.8731689453125, -0.236572265625, 0.4000244140625, 1.03662109375, 1.6732177734375, 2.309814453125, 2.9464111328125, 3.5830078125, 4.2196044921875, 4.856201171875, 5.4927978515625, 6.12939453125, 6.7659912109375, 7.402587890625, 8.0391845703125, 8.67578125, 9.3123779296875, 9.948974609375, 10.5855712890625, 11.22216796875, 11.8587646484375, 12.495361328125, 13.1319580078125, 13.7685546875, 14.4051513671875, 15.041748046875, 15.6783447265625, 16.31494140625, 16.9515380859375, 17.588134765625, 18.2247314453125, 18.861328125, 19.4979248046875, 20.134521484375, 20.7711181640625, 21.40771484375, 22.0443115234375, 22.680908203125, 23.3175048828125, 23.9541015625, 24.5906982421875, 25.227294921875, 25.8638916015625, 26.50048828125, 27.1370849609375, 27.773681640625, 28.4102783203125, 29.046875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 5.0, 3.0, 6.0, 6.0, 9.0, 14.0, 14.0, 14.0, 14.0, 38.0, 33.0, 73.0, 119.0, 173.0, 357.0, 651.0, 1297.0, 2718.0, 6830.0, 20823.0, 93730.0, 3249264.0, 732601.0, 60263.0, 15211.0, 5313.0, 2288.0, 1063.0, 562.0, 282.0, 155.0, 94.0, 63.0, 54.0, 30.0, 38.0, 14.0, 15.0, 13.0, 7.0, 6.0, 7.0, 5.0, 5.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-109.625, -106.185546875, -102.74609375, -99.306640625, -95.8671875, -92.427734375, -88.98828125, -85.548828125, -82.109375, -78.669921875, -75.23046875, -71.791015625, -68.3515625, -64.912109375, -61.47265625, -58.033203125, -54.59375, -51.154296875, -47.71484375, -44.275390625, -40.8359375, -37.396484375, -33.95703125, -30.517578125, -27.078125, -23.638671875, -20.19921875, -16.759765625, -13.3203125, -9.880859375, -6.44140625, -3.001953125, 0.4375, 3.876953125, 7.31640625, 10.755859375, 14.1953125, 17.634765625, 21.07421875, 24.513671875, 27.953125, 31.392578125, 34.83203125, 38.271484375, 41.7109375, 45.150390625, 48.58984375, 52.029296875, 55.46875, 58.908203125, 62.34765625, 65.787109375, 69.2265625, 72.666015625, 76.10546875, 79.544921875, 82.984375, 86.423828125, 89.86328125, 93.302734375, 96.7421875, 100.181640625, 103.62109375, 107.060546875, 110.5]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 4.0, 4.0, 7.0, 9.0, 13.0, 17.0, 39.0, 54.0, 95.0, 228.0, 945.0, 2053.0, 325.0, 120.0, 54.0, 40.0, 24.0, 21.0, 9.0, 7.0, 7.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.96875, -25.39599609375, -23.8232421875, -22.25048828125, -20.677734375, -19.10498046875, -17.5322265625, -15.95947265625, -14.38671875, -12.81396484375, -11.2412109375, -9.66845703125, -8.095703125, -6.52294921875, -4.9501953125, -3.37744140625, -1.8046875, -0.23193359375, 1.3408203125, 2.91357421875, 4.486328125, 6.05908203125, 7.6318359375, 9.20458984375, 10.77734375, 12.35009765625, 13.9228515625, 15.49560546875, 17.068359375, 18.64111328125, 20.2138671875, 21.78662109375, 23.359375, 24.93212890625, 26.5048828125, 28.07763671875, 29.650390625, 31.22314453125, 32.7958984375, 34.36865234375, 35.94140625, 37.51416015625, 39.0869140625, 40.65966796875, 42.232421875, 43.80517578125, 45.3779296875, 46.95068359375, 48.5234375, 50.09619140625, 51.6689453125, 53.24169921875, 54.814453125, 56.38720703125, 57.9599609375, 59.53271484375, 61.10546875, 62.67822265625, 64.2509765625, 65.82373046875, 67.396484375, 68.96923828125, 70.5419921875, 72.11474609375, 73.6875]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 6.0, 7.0, 13.0, 25.0, 19.0, 37.0, 47.0, 57.0, 85.0, 93.0, 100.0, 104.0, 121.0, 79.0, 50.0, 34.0, 37.0, 18.0, 18.0, 14.0, 16.0, 7.0, 7.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-135.31192016601562, -130.0359649658203, -124.75999450683594, -119.4840316772461, -114.20806884765625, -108.9321060180664, -103.65614318847656, -98.38018798828125, -93.10421752929688, -87.82825469970703, -82.55229187011719, -77.27632904052734, -72.0003662109375, -66.72440338134766, -61.44844436645508, -56.172481536865234, -50.896522521972656, -45.62055969238281, -40.34459686279297, -35.068634033203125, -29.792673110961914, -24.51671028137207, -19.24074935913086, -13.964786529541016, -8.688823699951172, -3.4128613471984863, 1.8631010055541992, 7.139062881469727, 12.41502571105957, 17.690988540649414, 22.966949462890625, 28.24291229248047, 33.51887512207031, 38.794837951660156, 44.07080078125, 49.346763610839844, 54.62272644042969, 59.89868927001953, 65.17465209960938, 70.45060729980469, 75.72657775878906, 81.0025405883789, 86.27850341796875, 91.5544662475586, 96.83042907714844, 102.10639190673828, 107.38235473632812, 112.65830993652344, 117.93427276611328, 123.21023559570312, 128.48619079589844, 133.7621612548828, 139.03811645507812, 144.3140869140625, 149.5900421142578, 154.8660125732422, 160.1419677734375, 165.4179229736328, 170.6938934326172, 175.9698486328125, 181.24581909179688, 186.5217742919922, 191.79774475097656, 197.07369995117188, 202.34967041015625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 6.0, 5.0, 8.0, 12.0, 20.0, 25.0, 43.0, 35.0, 36.0, 30.0, 47.0, 61.0, 59.0, 67.0, 59.0, 70.0, 70.0, 62.0, 49.0, 42.0, 37.0, 26.0, 32.0, 37.0, 19.0, 19.0, 10.0, 8.0, 6.0, 2.0, 1.0, 2.0, 1.0, 3.0], "bins": [-221.72837829589844, -216.7640838623047, -211.79977416992188, -206.83547973632812, -201.87118530273438, -196.90687561035156, -191.9425811767578, -186.978271484375, -182.01397705078125, -177.0496826171875, -172.0853729248047, -167.12107849121094, -162.15676879882812, -157.19247436523438, -152.22817993164062, -147.26388549804688, -142.29957580566406, -137.3352813720703, -132.3709716796875, -127.40667724609375, -122.44237518310547, -117.47807312011719, -112.51377868652344, -107.54947662353516, -102.58517456054688, -97.6208724975586, -92.65657043457031, -87.69227600097656, -82.72797393798828, -77.763671875, -72.79937744140625, -67.83507537841797, -62.870758056640625, -57.906455993652344, -52.94215774536133, -47.97785949707031, -43.01355743408203, -38.04925537109375, -33.084957122802734, -28.12065887451172, -23.156356811523438, -18.19205665588379, -13.22775650024414, -8.263456344604492, -3.2991561889648438, 1.6651439666748047, 6.629444122314453, 11.593742370605469, 16.55804443359375, 21.5223445892334, 26.486644744873047, 31.450944900512695, 36.415245056152344, 41.379547119140625, 46.34384536743164, 51.308143615722656, 56.27244567871094, 61.23674774169922, 66.2010498046875, 71.16534423828125, 76.12964630126953, 81.09394836425781, 86.05824279785156, 91.02254486083984, 95.98684692382812]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 4.0, 3.0, 10.0, 9.0, 10.0, 11.0, 23.0, 27.0, 44.0, 73.0, 94.0, 134.0, 207.0, 383.0, 681.0, 1354.0, 2643.0, 6181.0, 15868.0, 48595.0, 167304.0, 455198.0, 242553.0, 70183.0, 21947.0, 7921.0, 3475.0, 1611.0, 778.0, 475.0, 264.0, 174.0, 106.0, 58.0, 46.0, 28.0, 25.0, 18.0, 7.0, 10.0, 5.0, 5.0, 5.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-97.375, -94.6435546875, -91.912109375, -89.1806640625, -86.44921875, -83.7177734375, -80.986328125, -78.2548828125, -75.5234375, -72.7919921875, -70.060546875, -67.3291015625, -64.59765625, -61.8662109375, -59.134765625, -56.4033203125, -53.671875, -50.9404296875, -48.208984375, -45.4775390625, -42.74609375, -40.0146484375, -37.283203125, -34.5517578125, -31.8203125, -29.0888671875, -26.357421875, -23.6259765625, -20.89453125, -18.1630859375, -15.431640625, -12.7001953125, -9.96875, -7.2373046875, -4.505859375, -1.7744140625, 0.95703125, 3.6884765625, 6.419921875, 9.1513671875, 11.8828125, 14.6142578125, 17.345703125, 20.0771484375, 22.80859375, 25.5400390625, 28.271484375, 31.0029296875, 33.734375, 36.4658203125, 39.197265625, 41.9287109375, 44.66015625, 47.3916015625, 50.123046875, 52.8544921875, 55.5859375, 58.3173828125, 61.048828125, 63.7802734375, 66.51171875, 69.2431640625, 71.974609375, 74.7060546875, 77.4375]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 6.0, 3.0, 6.0, 13.0, 14.0, 24.0, 33.0, 32.0, 45.0, 48.0, 54.0, 58.0, 72.0, 81.0, 78.0, 67.0, 82.0, 66.0, 51.0, 38.0, 34.0, 26.0, 18.0, 13.0, 13.0, 10.0, 7.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.6484375, -12.1446533203125, -11.640869140625, -11.1370849609375, -10.63330078125, -10.1295166015625, -9.625732421875, -9.1219482421875, -8.6181640625, -8.1143798828125, -7.610595703125, -7.1068115234375, -6.60302734375, -6.0992431640625, -5.595458984375, -5.0916748046875, -4.587890625, -4.0841064453125, -3.580322265625, -3.0765380859375, -2.57275390625, -2.0689697265625, -1.565185546875, -1.0614013671875, -0.5576171875, -0.0538330078125, 0.449951171875, 0.9537353515625, 1.45751953125, 1.9613037109375, 2.465087890625, 2.9688720703125, 3.47265625, 3.9764404296875, 4.480224609375, 4.9840087890625, 5.48779296875, 5.9915771484375, 6.495361328125, 6.9991455078125, 7.5029296875, 8.0067138671875, 8.510498046875, 9.0142822265625, 9.51806640625, 10.0218505859375, 10.525634765625, 11.0294189453125, 11.533203125, 12.0369873046875, 12.540771484375, 13.0445556640625, 13.54833984375, 14.0521240234375, 14.555908203125, 15.0596923828125, 15.5634765625, 16.0672607421875, 16.571044921875, 17.0748291015625, 17.57861328125, 18.0823974609375, 18.586181640625, 19.0899658203125, 19.59375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 2.0, 0.0, 3.0, 7.0, 11.0, 10.0, 18.0, 27.0, 43.0, 67.0, 115.0, 218.0, 456.0, 934.0, 2607.0, 9855.0, 48495.0, 336116.0, 546830.0, 81534.0, 15120.0, 3727.0, 1207.0, 519.0, 251.0, 140.0, 85.0, 53.0, 40.0, 25.0, 15.0, 14.0, 3.0, 8.0, 7.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-102.0625, -98.560546875, -95.05859375, -91.556640625, -88.0546875, -84.552734375, -81.05078125, -77.548828125, -74.046875, -70.544921875, -67.04296875, -63.541015625, -60.0390625, -56.537109375, -53.03515625, -49.533203125, -46.03125, -42.529296875, -39.02734375, -35.525390625, -32.0234375, -28.521484375, -25.01953125, -21.517578125, -18.015625, -14.513671875, -11.01171875, -7.509765625, -4.0078125, -0.505859375, 2.99609375, 6.498046875, 10.0, 13.501953125, 17.00390625, 20.505859375, 24.0078125, 27.509765625, 31.01171875, 34.513671875, 38.015625, 41.517578125, 45.01953125, 48.521484375, 52.0234375, 55.525390625, 59.02734375, 62.529296875, 66.03125, 69.533203125, 73.03515625, 76.537109375, 80.0390625, 83.541015625, 87.04296875, 90.544921875, 94.046875, 97.548828125, 101.05078125, 104.552734375, 108.0546875, 111.556640625, 115.05859375, 118.560546875, 122.0625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 4.0, 1.0, 4.0, 4.0, 6.0, 3.0, 6.0, 4.0, 10.0, 4.0, 13.0, 15.0, 9.0, 13.0, 17.0, 26.0, 32.0, 33.0, 21.0, 43.0, 37.0, 38.0, 45.0, 40.0, 39.0, 37.0, 48.0, 33.0, 39.0, 41.0, 29.0, 38.0, 37.0, 38.0, 30.0, 18.0, 19.0, 23.0, 20.0, 17.0, 17.0, 14.0, 7.0, 8.0, 5.0, 4.0, 6.0, 5.0, 0.0, 7.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-42.53125, -41.09765625, -39.6640625, -38.23046875, -36.796875, -35.36328125, -33.9296875, -32.49609375, -31.0625, -29.62890625, -28.1953125, -26.76171875, -25.328125, -23.89453125, -22.4609375, -21.02734375, -19.59375, -18.16015625, -16.7265625, -15.29296875, -13.859375, -12.42578125, -10.9921875, -9.55859375, -8.125, -6.69140625, -5.2578125, -3.82421875, -2.390625, -0.95703125, 0.4765625, 1.91015625, 3.34375, 4.77734375, 6.2109375, 7.64453125, 9.078125, 10.51171875, 11.9453125, 13.37890625, 14.8125, 16.24609375, 17.6796875, 19.11328125, 20.546875, 21.98046875, 23.4140625, 24.84765625, 26.28125, 27.71484375, 29.1484375, 30.58203125, 32.015625, 33.44921875, 34.8828125, 36.31640625, 37.75, 39.18359375, 40.6171875, 42.05078125, 43.484375, 44.91796875, 46.3515625, 47.78515625, 49.21875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 8.0, 5.0, 8.0, 18.0, 23.0, 47.0, 86.0, 131.0, 253.0, 622.0, 1339.0, 3562.0, 12550.0, 75996.0, 766844.0, 159474.0, 19380.0, 5037.0, 1739.0, 695.0, 339.0, 168.0, 101.0, 36.0, 36.0, 28.0, 12.0, 8.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.9375, -65.2880859375, -62.638671875, -59.9892578125, -57.33984375, -54.6904296875, -52.041015625, -49.3916015625, -46.7421875, -44.0927734375, -41.443359375, -38.7939453125, -36.14453125, -33.4951171875, -30.845703125, -28.1962890625, -25.546875, -22.8974609375, -20.248046875, -17.5986328125, -14.94921875, -12.2998046875, -9.650390625, -7.0009765625, -4.3515625, -1.7021484375, 0.947265625, 3.5966796875, 6.24609375, 8.8955078125, 11.544921875, 14.1943359375, 16.84375, 19.4931640625, 22.142578125, 24.7919921875, 27.44140625, 30.0908203125, 32.740234375, 35.3896484375, 38.0390625, 40.6884765625, 43.337890625, 45.9873046875, 48.63671875, 51.2861328125, 53.935546875, 56.5849609375, 59.234375, 61.8837890625, 64.533203125, 67.1826171875, 69.83203125, 72.4814453125, 75.130859375, 77.7802734375, 80.4296875, 83.0791015625, 85.728515625, 88.3779296875, 91.02734375, 93.6767578125, 96.326171875, 98.9755859375, 101.625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 4.0, 8.0, 8.0, 5.0, 7.0, 17.0, 16.0, 28.0, 40.0, 57.0, 93.0, 189.0, 226.0, 100.0, 47.0, 52.0, 31.0, 23.0, 16.0, 6.0, 8.0, 5.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01129150390625, -0.010890841484069824, -0.010490179061889648, -0.010089516639709473, -0.009688854217529297, -0.009288191795349121, -0.008887529373168945, -0.00848686695098877, -0.008086204528808594, -0.007685542106628418, -0.007284879684448242, -0.006884217262268066, -0.006483554840087891, -0.006082892417907715, -0.005682229995727539, -0.005281567573547363, -0.0048809051513671875, -0.004480242729187012, -0.004079580307006836, -0.00367891788482666, -0.0032782554626464844, -0.0028775930404663086, -0.002476930618286133, -0.002076268196105957, -0.0016756057739257812, -0.0012749433517456055, -0.0008742809295654297, -0.0004736185073852539, -7.295608520507812e-05, 0.00032770633697509766, 0.0007283687591552734, 0.0011290311813354492, 0.001529693603515625, 0.0019303560256958008, 0.0023310184478759766, 0.0027316808700561523, 0.003132343292236328, 0.003533005714416504, 0.00393366813659668, 0.0043343305587768555, 0.004734992980957031, 0.005135655403137207, 0.005536317825317383, 0.005936980247497559, 0.006337642669677734, 0.00673830509185791, 0.007138967514038086, 0.007539629936218262, 0.007940292358398438, 0.008340954780578613, 0.008741617202758789, 0.009142279624938965, 0.00954294204711914, 0.009943604469299316, 0.010344266891479492, 0.010744929313659668, 0.011145591735839844, 0.01154625415802002, 0.011946916580200195, 0.012347579002380371, 0.012748241424560547, 0.013148903846740723, 0.013549566268920898, 0.013950228691101074, 0.01435089111328125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 3.0, 4.0, 5.0, 7.0, 6.0, 6.0, 9.0, 17.0, 19.0, 39.0, 46.0, 101.0, 123.0, 244.0, 427.0, 825.0, 1660.0, 3941.0, 12228.0, 63176.0, 707757.0, 221022.0, 25308.0, 6497.0, 2423.0, 1160.0, 602.0, 342.0, 227.0, 120.0, 68.0, 36.0, 25.0, 22.0, 16.0, 12.0, 8.0, 7.0, 3.0, 6.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.5, -66.197265625, -63.89453125, -61.591796875, -59.2890625, -56.986328125, -54.68359375, -52.380859375, -50.078125, -47.775390625, -45.47265625, -43.169921875, -40.8671875, -38.564453125, -36.26171875, -33.958984375, -31.65625, -29.353515625, -27.05078125, -24.748046875, -22.4453125, -20.142578125, -17.83984375, -15.537109375, -13.234375, -10.931640625, -8.62890625, -6.326171875, -4.0234375, -1.720703125, 0.58203125, 2.884765625, 5.1875, 7.490234375, 9.79296875, 12.095703125, 14.3984375, 16.701171875, 19.00390625, 21.306640625, 23.609375, 25.912109375, 28.21484375, 30.517578125, 32.8203125, 35.123046875, 37.42578125, 39.728515625, 42.03125, 44.333984375, 46.63671875, 48.939453125, 51.2421875, 53.544921875, 55.84765625, 58.150390625, 60.453125, 62.755859375, 65.05859375, 67.361328125, 69.6640625, 71.966796875, 74.26953125, 76.572265625, 78.875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 6.0, 7.0, 7.0, 6.0, 9.0, 9.0, 23.0, 27.0, 34.0, 49.0, 76.0, 94.0, 129.0, 137.0, 109.0, 73.0, 59.0, 27.0, 27.0, 21.0, 16.0, 13.0, 13.0, 3.0, 6.0, 6.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-39.03125, -37.8505859375, -36.669921875, -35.4892578125, -34.30859375, -33.1279296875, -31.947265625, -30.7666015625, -29.5859375, -28.4052734375, -27.224609375, -26.0439453125, -24.86328125, -23.6826171875, -22.501953125, -21.3212890625, -20.140625, -18.9599609375, -17.779296875, -16.5986328125, -15.41796875, -14.2373046875, -13.056640625, -11.8759765625, -10.6953125, -9.5146484375, -8.333984375, -7.1533203125, -5.97265625, -4.7919921875, -3.611328125, -2.4306640625, -1.25, -0.0693359375, 1.111328125, 2.2919921875, 3.47265625, 4.6533203125, 5.833984375, 7.0146484375, 8.1953125, 9.3759765625, 10.556640625, 11.7373046875, 12.91796875, 14.0986328125, 15.279296875, 16.4599609375, 17.640625, 18.8212890625, 20.001953125, 21.1826171875, 22.36328125, 23.5439453125, 24.724609375, 25.9052734375, 27.0859375, 28.2666015625, 29.447265625, 30.6279296875, 31.80859375, 32.9892578125, 34.169921875, 35.3505859375, 36.53125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 7.0, 9.0, 17.0, 21.0, 19.0, 46.0, 63.0, 90.0, 118.0, 133.0, 141.0, 107.0, 82.0, 52.0, 39.0, 25.0, 17.0, 9.0, 5.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-521.2030029296875, -504.33343505859375, -487.4638671875, -470.59429931640625, -453.7247619628906, -436.8551940917969, -419.9856262207031, -403.1160583496094, -386.24652099609375, -369.376953125, -352.50738525390625, -335.6378173828125, -318.7682800292969, -301.8987121582031, -285.0291442871094, -268.1595764160156, -251.29000854492188, -234.42044067382812, -217.55088806152344, -200.6813201904297, -183.811767578125, -166.94219970703125, -150.0726318359375, -133.20306396484375, -116.33351135253906, -99.46395111083984, -82.59439086914062, -65.72482299804688, -48.855262756347656, -31.985702514648438, -15.116134643554688, 1.7534255981445312, 18.62298583984375, 35.49254608154297, 52.36211013793945, 69.23167419433594, 86.10123443603516, 102.97079467773438, 119.84036254882812, 136.70993041992188, 153.57948303222656, 170.4490509033203, 187.318603515625, 204.18817138671875, 221.0577392578125, 237.9272918701172, 254.79685974121094, 271.6664123535156, 288.5359802246094, 305.4055480957031, 322.2751159667969, 339.1446533203125, 356.01422119140625, 372.8837890625, 389.75335693359375, 406.6229248046875, 423.49249267578125, 440.362060546875, 457.23162841796875, 474.1011962890625, 490.9707336425781, 507.8403015136719, 524.7098388671875, 541.5794067382812, 558.448974609375]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 8.0, 11.0, 16.0, 26.0, 43.0, 38.0, 46.0, 69.0, 51.0, 80.0, 80.0, 84.0, 78.0, 67.0, 57.0, 39.0, 60.0, 37.0, 33.0, 25.0, 14.0, 17.0, 9.0, 5.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-334.359619140625, -319.3934326171875, -304.42724609375, -289.4610595703125, -274.494873046875, -259.5286865234375, -244.56251525878906, -229.59634399414062, -214.63015747070312, -199.66397094726562, -184.69778442382812, -169.73159790039062, -154.7654266357422, -139.7992401123047, -124.83305358886719, -109.86687469482422, -94.90068054199219, -79.93449401855469, -64.96831512451172, -50.00212860107422, -35.035945892333984, -20.06976318359375, -5.10357666015625, 9.862602233886719, 24.82878875732422, 39.79497146606445, 54.76115417480469, 69.72734069824219, 84.69352722167969, 99.65970611572266, 114.62589263916016, 129.59207153320312, 144.55825805664062, 159.52444458007812, 174.49063110351562, 189.45681762695312, 204.42298889160156, 219.38917541503906, 234.35536193847656, 249.321533203125, 264.2877197265625, 279.25390625, 294.2200927734375, 309.186279296875, 324.1524658203125, 339.11865234375, 354.0848388671875, 369.0509948730469, 384.0172119140625, 398.9833984375, 413.9495849609375, 428.915771484375, 443.8819580078125, 458.84814453125, 473.8143310546875, 488.7804870605469, 503.7466735839844, 518.7128295898438, 533.6790161132812, 548.6452026367188, 563.6113891601562, 578.5775756835938, 593.5437622070312, 608.5099487304688, 623.4761352539062]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 4.0, 8.0, 5.0, 22.0, 42.0, 56.0, 114.0, 191.0, 462.0, 907.0, 2230.0, 5661.0, 18690.0, 91718.0, 3587659.0, 427253.0, 41366.0, 10800.0, 3730.0, 1532.0, 728.0, 367.0, 213.0, 147.0, 112.0, 66.0, 44.0, 38.0, 29.0, 22.0, 14.0, 15.0, 11.0, 5.0, 4.0, 3.0, 2.0, 5.0, 4.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-96.0, -91.787109375, -87.57421875, -83.361328125, -79.1484375, -74.935546875, -70.72265625, -66.509765625, -62.296875, -58.083984375, -53.87109375, -49.658203125, -45.4453125, -41.232421875, -37.01953125, -32.806640625, -28.59375, -24.380859375, -20.16796875, -15.955078125, -11.7421875, -7.529296875, -3.31640625, 0.896484375, 5.109375, 9.322265625, 13.53515625, 17.748046875, 21.9609375, 26.173828125, 30.38671875, 34.599609375, 38.8125, 43.025390625, 47.23828125, 51.451171875, 55.6640625, 59.876953125, 64.08984375, 68.302734375, 72.515625, 76.728515625, 80.94140625, 85.154296875, 89.3671875, 93.580078125, 97.79296875, 102.005859375, 106.21875, 110.431640625, 114.64453125, 118.857421875, 123.0703125, 127.283203125, 131.49609375, 135.708984375, 139.921875, 144.134765625, 148.34765625, 152.560546875, 156.7734375, 160.986328125, 165.19921875, 169.412109375, 173.625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 2.0, 4.0, 5.0, 12.0, 18.0, 34.0, 33.0, 64.0, 70.0, 81.0, 106.0, 119.0, 93.0, 95.0, 71.0, 71.0, 48.0, 27.0, 21.0, 15.0, 10.0, 5.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.015625, -10.273193359375, -9.53076171875, -8.788330078125, -8.0458984375, -7.303466796875, -6.56103515625, -5.818603515625, -5.076171875, -4.333740234375, -3.59130859375, -2.848876953125, -2.1064453125, -1.364013671875, -0.62158203125, 0.120849609375, 0.86328125, 1.605712890625, 2.34814453125, 3.090576171875, 3.8330078125, 4.575439453125, 5.31787109375, 6.060302734375, 6.802734375, 7.545166015625, 8.28759765625, 9.030029296875, 9.7724609375, 10.514892578125, 11.25732421875, 11.999755859375, 12.7421875, 13.484619140625, 14.22705078125, 14.969482421875, 15.7119140625, 16.454345703125, 17.19677734375, 17.939208984375, 18.681640625, 19.424072265625, 20.16650390625, 20.908935546875, 21.6513671875, 22.393798828125, 23.13623046875, 23.878662109375, 24.62109375, 25.363525390625, 26.10595703125, 26.848388671875, 27.5908203125, 28.333251953125, 29.07568359375, 29.818115234375, 30.560546875, 31.302978515625, 32.04541015625, 32.787841796875, 33.5302734375, 34.272705078125, 35.01513671875, 35.757568359375, 36.5]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 1.0, 2.0, 3.0, 10.0, 12.0, 10.0, 18.0, 26.0, 43.0, 64.0, 82.0, 119.0, 171.0, 296.0, 474.0, 710.0, 1308.0, 2270.0, 4606.0, 9345.0, 22045.0, 62779.0, 276017.0, 3304596.0, 386052.0, 76007.0, 25505.0, 10344.0, 4961.0, 2547.0, 1458.0, 873.0, 509.0, 328.0, 220.0, 141.0, 121.0, 62.0, 47.0, 31.0, 25.0, 24.0, 12.0, 4.0, 5.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-79.9375, -77.3232421875, -74.708984375, -72.0947265625, -69.48046875, -66.8662109375, -64.251953125, -61.6376953125, -59.0234375, -56.4091796875, -53.794921875, -51.1806640625, -48.56640625, -45.9521484375, -43.337890625, -40.7236328125, -38.109375, -35.4951171875, -32.880859375, -30.2666015625, -27.65234375, -25.0380859375, -22.423828125, -19.8095703125, -17.1953125, -14.5810546875, -11.966796875, -9.3525390625, -6.73828125, -4.1240234375, -1.509765625, 1.1044921875, 3.71875, 6.3330078125, 8.947265625, 11.5615234375, 14.17578125, 16.7900390625, 19.404296875, 22.0185546875, 24.6328125, 27.2470703125, 29.861328125, 32.4755859375, 35.08984375, 37.7041015625, 40.318359375, 42.9326171875, 45.546875, 48.1611328125, 50.775390625, 53.3896484375, 56.00390625, 58.6181640625, 61.232421875, 63.8466796875, 66.4609375, 69.0751953125, 71.689453125, 74.3037109375, 76.91796875, 79.5322265625, 82.146484375, 84.7607421875, 87.375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 0.0, 0.0, 0.0, 4.0, 5.0, 8.0, 9.0, 18.0, 12.0, 29.0, 34.0, 49.0, 68.0, 89.0, 195.0, 415.0, 1648.0, 806.0, 264.0, 141.0, 78.0, 60.0, 41.0, 34.0, 16.0, 14.0, 6.0, 8.0, 7.0, 7.0, 4.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.9375, -35.5048828125, -34.072265625, -32.6396484375, -31.20703125, -29.7744140625, -28.341796875, -26.9091796875, -25.4765625, -24.0439453125, -22.611328125, -21.1787109375, -19.74609375, -18.3134765625, -16.880859375, -15.4482421875, -14.015625, -12.5830078125, -11.150390625, -9.7177734375, -8.28515625, -6.8525390625, -5.419921875, -3.9873046875, -2.5546875, -1.1220703125, 0.310546875, 1.7431640625, 3.17578125, 4.6083984375, 6.041015625, 7.4736328125, 8.90625, 10.3388671875, 11.771484375, 13.2041015625, 14.63671875, 16.0693359375, 17.501953125, 18.9345703125, 20.3671875, 21.7998046875, 23.232421875, 24.6650390625, 26.09765625, 27.5302734375, 28.962890625, 30.3955078125, 31.828125, 33.2607421875, 34.693359375, 36.1259765625, 37.55859375, 38.9912109375, 40.423828125, 41.8564453125, 43.2890625, 44.7216796875, 46.154296875, 47.5869140625, 49.01953125, 50.4521484375, 51.884765625, 53.3173828125, 54.75]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 6.0, 8.0, 15.0, 27.0, 54.0, 87.0, 140.0, 148.0, 154.0, 120.0, 96.0, 62.0, 42.0, 20.0, 10.0, 5.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-253.23733520507812, -242.7930145263672, -232.34869384765625, -221.9043731689453, -211.46005249023438, -201.01573181152344, -190.5714111328125, -180.12709045410156, -169.68276977539062, -159.2384490966797, -148.79412841796875, -138.3498077392578, -127.90548706054688, -117.46116638183594, -107.016845703125, -96.57252502441406, -86.12820434570312, -75.68388366699219, -65.23956298828125, -54.79524230957031, -44.350921630859375, -33.90660095214844, -23.4622802734375, -13.017959594726562, -2.573638916015625, 7.8706817626953125, 18.31500244140625, 28.759323120117188, 39.203643798828125, 49.64796447753906, 60.09228515625, 70.53660583496094, 80.98089599609375, 91.42521667480469, 101.86953735351562, 112.31385803222656, 122.7581787109375, 133.20249938964844, 143.64682006835938, 154.0911407470703, 164.53546142578125, 174.9797821044922, 185.42410278320312, 195.86842346191406, 206.312744140625, 216.75706481933594, 227.20138549804688, 237.6457061767578, 248.09002685546875, 258.53436279296875, 268.9786682128906, 279.4229736328125, 289.8673095703125, 300.3116455078125, 310.7559509277344, 321.20025634765625, 331.64459228515625, 342.08892822265625, 352.5332336425781, 362.9775390625, 373.421875, 383.8662109375, 394.3105163574219, 404.75482177734375, 415.19915771484375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 3.0, 4.0, 4.0, 6.0, 7.0, 14.0, 17.0, 21.0, 13.0, 24.0, 28.0, 27.0, 26.0, 51.0, 34.0, 56.0, 49.0, 59.0, 58.0, 50.0, 64.0, 58.0, 43.0, 48.0, 46.0, 36.0, 36.0, 20.0, 24.0, 16.0, 15.0, 15.0, 10.0, 12.0, 6.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-204.3353729248047, -199.1943359375, -194.05331420898438, -188.9122772216797, -183.77125549316406, -178.63021850585938, -173.48919677734375, -168.34815979003906, -163.20712280273438, -158.0660858154297, -152.92506408691406, -147.78402709960938, -142.64300537109375, -137.50196838378906, -132.36094665527344, -127.21990966796875, -122.07888793945312, -116.93785858154297, -111.79682922363281, -106.65579986572266, -101.5147705078125, -96.37373352050781, -91.23270416259766, -86.0916748046875, -80.95064544677734, -75.80961608886719, -70.66858673095703, -65.52755737304688, -60.38652420043945, -55.2454948425293, -50.104461669921875, -44.96343231201172, -39.822410583496094, -34.68138122558594, -29.54034996032715, -24.39931869506836, -19.258289337158203, -14.117259979248047, -8.976228713989258, -3.8351974487304688, 1.3058319091796875, 6.44686222076416, 11.587892532348633, 16.728923797607422, 21.869953155517578, 27.010982513427734, 32.152015686035156, 37.29304504394531, 42.43407440185547, 47.575103759765625, 52.71613311767578, 57.8571662902832, 62.99819564819336, 68.13922119140625, 73.28025817871094, 78.4212875366211, 83.56231689453125, 88.7033462524414, 93.84437561035156, 98.98540496826172, 104.12643432617188, 109.26747131347656, 114.40850067138672, 119.54953002929688, 124.69055938720703]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 7.0, 5.0, 5.0, 12.0, 17.0, 27.0, 35.0, 50.0, 88.0, 116.0, 198.0, 418.0, 747.0, 1666.0, 4172.0, 12099.0, 45609.0, 221265.0, 591885.0, 127286.0, 28773.0, 8378.0, 2961.0, 1291.0, 611.0, 323.0, 169.0, 108.0, 67.0, 42.0, 23.0, 26.0, 17.0, 12.0, 9.0, 13.0, 9.0, 7.0, 3.0, 3.0, 3.0, 0.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-103.1875, -99.7861328125, -96.384765625, -92.9833984375, -89.58203125, -86.1806640625, -82.779296875, -79.3779296875, -75.9765625, -72.5751953125, -69.173828125, -65.7724609375, -62.37109375, -58.9697265625, -55.568359375, -52.1669921875, -48.765625, -45.3642578125, -41.962890625, -38.5615234375, -35.16015625, -31.7587890625, -28.357421875, -24.9560546875, -21.5546875, -18.1533203125, -14.751953125, -11.3505859375, -7.94921875, -4.5478515625, -1.146484375, 2.2548828125, 5.65625, 9.0576171875, 12.458984375, 15.8603515625, 19.26171875, 22.6630859375, 26.064453125, 29.4658203125, 32.8671875, 36.2685546875, 39.669921875, 43.0712890625, 46.47265625, 49.8740234375, 53.275390625, 56.6767578125, 60.078125, 63.4794921875, 66.880859375, 70.2822265625, 73.68359375, 77.0849609375, 80.486328125, 83.8876953125, 87.2890625, 90.6904296875, 94.091796875, 97.4931640625, 100.89453125, 104.2958984375, 107.697265625, 111.0986328125, 114.5]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 1.0, 3.0, 5.0, 5.0, 7.0, 13.0, 16.0, 25.0, 31.0, 43.0, 54.0, 56.0, 75.0, 70.0, 88.0, 72.0, 78.0, 61.0, 63.0, 48.0, 54.0, 33.0, 38.0, 17.0, 18.0, 11.0, 7.0, 11.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.5546875, -10.9627685546875, -10.370849609375, -9.7789306640625, -9.18701171875, -8.5950927734375, -8.003173828125, -7.4112548828125, -6.8193359375, -6.2274169921875, -5.635498046875, -5.0435791015625, -4.45166015625, -3.8597412109375, -3.267822265625, -2.6759033203125, -2.083984375, -1.4920654296875, -0.900146484375, -0.3082275390625, 0.28369140625, 0.8756103515625, 1.467529296875, 2.0594482421875, 2.6513671875, 3.2432861328125, 3.835205078125, 4.4271240234375, 5.01904296875, 5.6109619140625, 6.202880859375, 6.7947998046875, 7.38671875, 7.9786376953125, 8.570556640625, 9.1624755859375, 9.75439453125, 10.3463134765625, 10.938232421875, 11.5301513671875, 12.1220703125, 12.7139892578125, 13.305908203125, 13.8978271484375, 14.48974609375, 15.0816650390625, 15.673583984375, 16.2655029296875, 16.857421875, 17.4493408203125, 18.041259765625, 18.6331787109375, 19.22509765625, 19.8170166015625, 20.408935546875, 21.0008544921875, 21.5927734375, 22.1846923828125, 22.776611328125, 23.3685302734375, 23.96044921875, 24.5523681640625, 25.144287109375, 25.7362060546875, 26.328125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 5.0, 3.0, 8.0, 5.0, 9.0, 9.0, 18.0, 19.0, 35.0, 26.0, 43.0, 75.0, 110.0, 175.0, 246.0, 421.0, 745.0, 1529.0, 3603.0, 9707.0, 33419.0, 141730.0, 595286.0, 196343.0, 44087.0, 12653.0, 4339.0, 1748.0, 852.0, 476.0, 269.0, 194.0, 112.0, 79.0, 49.0, 28.0, 25.0, 30.0, 16.0, 15.0, 8.0, 4.0, 2.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-84.5625, -81.798828125, -79.03515625, -76.271484375, -73.5078125, -70.744140625, -67.98046875, -65.216796875, -62.453125, -59.689453125, -56.92578125, -54.162109375, -51.3984375, -48.634765625, -45.87109375, -43.107421875, -40.34375, -37.580078125, -34.81640625, -32.052734375, -29.2890625, -26.525390625, -23.76171875, -20.998046875, -18.234375, -15.470703125, -12.70703125, -9.943359375, -7.1796875, -4.416015625, -1.65234375, 1.111328125, 3.875, 6.638671875, 9.40234375, 12.166015625, 14.9296875, 17.693359375, 20.45703125, 23.220703125, 25.984375, 28.748046875, 31.51171875, 34.275390625, 37.0390625, 39.802734375, 42.56640625, 45.330078125, 48.09375, 50.857421875, 53.62109375, 56.384765625, 59.1484375, 61.912109375, 64.67578125, 67.439453125, 70.203125, 72.966796875, 75.73046875, 78.494140625, 81.2578125, 84.021484375, 86.78515625, 89.548828125, 92.3125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 6.0, 6.0, 8.0, 11.0, 9.0, 15.0, 29.0, 20.0, 31.0, 29.0, 41.0, 41.0, 53.0, 49.0, 51.0, 55.0, 55.0, 50.0, 52.0, 43.0, 50.0, 47.0, 33.0, 39.0, 38.0, 29.0, 10.0, 22.0, 11.0, 19.0, 13.0, 7.0, 8.0, 4.0, 3.0, 1.0, 5.0, 1.0, 0.0, 5.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.09375, -51.21923828125, -49.3447265625, -47.47021484375, -45.595703125, -43.72119140625, -41.8466796875, -39.97216796875, -38.09765625, -36.22314453125, -34.3486328125, -32.47412109375, -30.599609375, -28.72509765625, -26.8505859375, -24.97607421875, -23.1015625, -21.22705078125, -19.3525390625, -17.47802734375, -15.603515625, -13.72900390625, -11.8544921875, -9.97998046875, -8.10546875, -6.23095703125, -4.3564453125, -2.48193359375, -0.607421875, 1.26708984375, 3.1416015625, 5.01611328125, 6.890625, 8.76513671875, 10.6396484375, 12.51416015625, 14.388671875, 16.26318359375, 18.1376953125, 20.01220703125, 21.88671875, 23.76123046875, 25.6357421875, 27.51025390625, 29.384765625, 31.25927734375, 33.1337890625, 35.00830078125, 36.8828125, 38.75732421875, 40.6318359375, 42.50634765625, 44.380859375, 46.25537109375, 48.1298828125, 50.00439453125, 51.87890625, 53.75341796875, 55.6279296875, 57.50244140625, 59.376953125, 61.25146484375, 63.1259765625, 65.00048828125, 66.875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 8.0, 5.0, 16.0, 14.0, 35.0, 88.0, 167.0, 359.0, 820.0, 2016.0, 6357.0, 28219.0, 532319.0, 443025.0, 25496.0, 6093.0, 2025.0, 801.0, 370.0, 160.0, 82.0, 34.0, 24.0, 10.0, 5.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-119.25, -116.1904296875, -113.130859375, -110.0712890625, -107.01171875, -103.9521484375, -100.892578125, -97.8330078125, -94.7734375, -91.7138671875, -88.654296875, -85.5947265625, -82.53515625, -79.4755859375, -76.416015625, -73.3564453125, -70.296875, -67.2373046875, -64.177734375, -61.1181640625, -58.05859375, -54.9990234375, -51.939453125, -48.8798828125, -45.8203125, -42.7607421875, -39.701171875, -36.6416015625, -33.58203125, -30.5224609375, -27.462890625, -24.4033203125, -21.34375, -18.2841796875, -15.224609375, -12.1650390625, -9.10546875, -6.0458984375, -2.986328125, 0.0732421875, 3.1328125, 6.1923828125, 9.251953125, 12.3115234375, 15.37109375, 18.4306640625, 21.490234375, 24.5498046875, 27.609375, 30.6689453125, 33.728515625, 36.7880859375, 39.84765625, 42.9072265625, 45.966796875, 49.0263671875, 52.0859375, 55.1455078125, 58.205078125, 61.2646484375, 64.32421875, 67.3837890625, 70.443359375, 73.5029296875, 76.5625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 5.0, 6.0, 2.0, 6.0, 4.0, 10.0, 6.0, 14.0, 20.0, 17.0, 30.0, 41.0, 96.0, 303.0, 222.0, 71.0, 37.0, 25.0, 17.0, 14.0, 9.0, 6.0, 12.0, 2.0, 4.0, 5.0, 6.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.01201629638671875, -0.011638879776000977, -0.011261463165283203, -0.01088404655456543, -0.010506629943847656, -0.010129213333129883, -0.00975179672241211, -0.009374380111694336, -0.008996963500976562, -0.008619546890258789, -0.008242130279541016, -0.007864713668823242, -0.007487297058105469, -0.007109880447387695, -0.006732463836669922, -0.0063550472259521484, -0.005977630615234375, -0.0056002140045166016, -0.005222797393798828, -0.004845380783081055, -0.004467964172363281, -0.004090547561645508, -0.0037131309509277344, -0.003335714340209961, -0.0029582977294921875, -0.002580881118774414, -0.0022034645080566406, -0.0018260478973388672, -0.0014486312866210938, -0.0010712146759033203, -0.0006937980651855469, -0.00031638145446777344, 6.103515625e-05, 0.00043845176696777344, 0.0008158683776855469, 0.0011932849884033203, 0.0015707015991210938, 0.0019481182098388672, 0.0023255348205566406, 0.002702951431274414, 0.0030803680419921875, 0.003457784652709961, 0.0038352012634277344, 0.004212617874145508, 0.004590034484863281, 0.004967451095581055, 0.005344867706298828, 0.0057222843170166016, 0.006099700927734375, 0.0064771175384521484, 0.006854534149169922, 0.007231950759887695, 0.007609367370605469, 0.007986783981323242, 0.008364200592041016, 0.008741617202758789, 0.009119033813476562, 0.009496450424194336, 0.00987386703491211, 0.010251283645629883, 0.010628700256347656, 0.01100611686706543, 0.011383533477783203, 0.011760950088500977, 0.01213836669921875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 1.0, 6.0, 7.0, 15.0, 28.0, 21.0, 37.0, 61.0, 100.0, 138.0, 270.0, 438.0, 975.0, 2283.0, 7380.0, 34147.0, 696986.0, 273914.0, 22604.0, 5396.0, 1923.0, 814.0, 414.0, 219.0, 149.0, 75.0, 48.0, 39.0, 19.0, 18.0, 5.0, 6.0, 2.0, 6.0, 2.0, 2.0, 1.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-97.0, -94.296875, -91.59375, -88.890625, -86.1875, -83.484375, -80.78125, -78.078125, -75.375, -72.671875, -69.96875, -67.265625, -64.5625, -61.859375, -59.15625, -56.453125, -53.75, -51.046875, -48.34375, -45.640625, -42.9375, -40.234375, -37.53125, -34.828125, -32.125, -29.421875, -26.71875, -24.015625, -21.3125, -18.609375, -15.90625, -13.203125, -10.5, -7.796875, -5.09375, -2.390625, 0.3125, 3.015625, 5.71875, 8.421875, 11.125, 13.828125, 16.53125, 19.234375, 21.9375, 24.640625, 27.34375, 30.046875, 32.75, 35.453125, 38.15625, 40.859375, 43.5625, 46.265625, 48.96875, 51.671875, 54.375, 57.078125, 59.78125, 62.484375, 65.1875, 67.890625, 70.59375, 73.296875, 76.0]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 3.0, 11.0, 5.0, 5.0, 8.0, 6.0, 3.0, 8.0, 7.0, 8.0, 19.0, 27.0, 32.0, 51.0, 85.0, 127.0, 151.0, 136.0, 96.0, 48.0, 39.0, 27.0, 17.0, 11.0, 8.0, 10.0, 6.0, 10.0, 6.0, 7.0, 0.0, 2.0, 4.0, 2.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-32.375, -31.35302734375, -30.3310546875, -29.30908203125, -28.287109375, -27.26513671875, -26.2431640625, -25.22119140625, -24.19921875, -23.17724609375, -22.1552734375, -21.13330078125, -20.111328125, -19.08935546875, -18.0673828125, -17.04541015625, -16.0234375, -15.00146484375, -13.9794921875, -12.95751953125, -11.935546875, -10.91357421875, -9.8916015625, -8.86962890625, -7.84765625, -6.82568359375, -5.8037109375, -4.78173828125, -3.759765625, -2.73779296875, -1.7158203125, -0.69384765625, 0.328125, 1.35009765625, 2.3720703125, 3.39404296875, 4.416015625, 5.43798828125, 6.4599609375, 7.48193359375, 8.50390625, 9.52587890625, 10.5478515625, 11.56982421875, 12.591796875, 13.61376953125, 14.6357421875, 15.65771484375, 16.6796875, 17.70166015625, 18.7236328125, 19.74560546875, 20.767578125, 21.78955078125, 22.8115234375, 23.83349609375, 24.85546875, 25.87744140625, 26.8994140625, 27.92138671875, 28.943359375, 29.96533203125, 30.9873046875, 32.00927734375, 33.03125]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 7.0, 6.0, 16.0, 17.0, 37.0, 67.0, 99.0, 149.0, 142.0, 145.0, 87.0, 93.0, 52.0, 26.0, 22.0, 10.0, 10.0, 3.0, 6.0, 2.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-274.26544189453125, -255.51858520507812, -236.77174377441406, -218.02490234375, -199.27804565429688, -180.53118896484375, -161.7843475341797, -143.03750610351562, -124.2906494140625, -105.5438003540039, -86.79695129394531, -68.05010223388672, -49.303253173828125, -30.55640411376953, -11.809555053710938, 6.937286376953125, 25.68414306640625, 44.430992126464844, 63.17784118652344, 81.92469024658203, 100.67153930664062, 119.41838836669922, 138.1652374267578, 156.91207885742188, 175.658935546875, 194.40579223632812, 213.1526336669922, 231.89947509765625, 250.64633178710938, 269.3931884765625, 288.1400146484375, 306.8868713378906, 325.6336669921875, 344.3805236816406, 363.12738037109375, 381.87420654296875, 400.6210632324219, 419.367919921875, 438.11474609375, 456.8616027832031, 475.60845947265625, 494.3553161621094, 513.1021728515625, 531.8489990234375, 550.5958251953125, 569.3427124023438, 588.0895385742188, 606.83642578125, 625.583251953125, 644.330078125, 663.0769653320312, 681.8237915039062, 700.5706787109375, 719.3175048828125, 738.0643310546875, 756.8111572265625, 775.5580444335938, 794.3048706054688, 813.0517578125, 831.798583984375, 850.54541015625, 869.2922973632812, 888.0391235351562, 906.7860107421875, 925.5328369140625]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 1.0, 7.0, 7.0, 13.0, 6.0, 21.0, 17.0, 28.0, 16.0, 26.0, 37.0, 41.0, 25.0, 44.0, 45.0, 45.0, 50.0, 66.0, 52.0, 70.0, 51.0, 47.0, 42.0, 37.0, 27.0, 41.0, 21.0, 23.0, 22.0, 13.0, 18.0, 9.0, 9.0, 2.0, 8.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-354.4935607910156, -344.0801696777344, -333.6667785644531, -323.2533874511719, -312.8399963378906, -302.4266052246094, -292.0132141113281, -281.5998229980469, -271.1864318847656, -260.7730407714844, -250.35964965820312, -239.94625854492188, -229.53286743164062, -219.11947631835938, -208.70608520507812, -198.29269409179688, -187.87930297851562, -177.46591186523438, -167.05252075195312, -156.63912963867188, -146.22573852539062, -135.81234741210938, -125.39895629882812, -114.98556518554688, -104.57217407226562, -94.15878295898438, -83.74539184570312, -73.33200073242188, -62.918609619140625, -52.505218505859375, -42.091827392578125, -31.678436279296875, -21.2650146484375, -10.85162353515625, -0.438232421875, 9.97515869140625, 20.3885498046875, 30.80194091796875, 41.21533203125, 51.62872314453125, 62.0421142578125, 72.45550537109375, 82.868896484375, 93.28228759765625, 103.6956787109375, 114.10906982421875, 124.5224609375, 134.93585205078125, 145.3492431640625, 155.76263427734375, 166.176025390625, 176.58941650390625, 187.0028076171875, 197.41619873046875, 207.82958984375, 218.24298095703125, 228.6563720703125, 239.06976318359375, 249.483154296875, 259.89654541015625, 270.3099365234375, 280.72332763671875, 291.13671875, 301.55010986328125, 311.9635009765625]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [4.0, 3.0, 3.0, 6.0, 12.0, 27.0, 36.0, 52.0, 90.0, 184.0, 340.0, 766.0, 1770.0, 4141.0, 10992.0, 37319.0, 255698.0, 3718898.0, 125132.0, 24530.0, 7972.0, 3156.0, 1432.0, 652.0, 384.0, 221.0, 130.0, 77.0, 63.0, 50.0, 31.0, 24.0, 22.0, 17.0, 12.0, 9.0, 8.0, 4.0, 4.0, 5.0, 6.0, 2.0, 4.0, 6.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.875, -71.50390625, -67.1328125, -62.76171875, -58.390625, -54.01953125, -49.6484375, -45.27734375, -40.90625, -36.53515625, -32.1640625, -27.79296875, -23.421875, -19.05078125, -14.6796875, -10.30859375, -5.9375, -1.56640625, 2.8046875, 7.17578125, 11.546875, 15.91796875, 20.2890625, 24.66015625, 29.03125, 33.40234375, 37.7734375, 42.14453125, 46.515625, 50.88671875, 55.2578125, 59.62890625, 64.0, 68.37109375, 72.7421875, 77.11328125, 81.484375, 85.85546875, 90.2265625, 94.59765625, 98.96875, 103.33984375, 107.7109375, 112.08203125, 116.453125, 120.82421875, 125.1953125, 129.56640625, 133.9375, 138.30859375, 142.6796875, 147.05078125, 151.421875, 155.79296875, 160.1640625, 164.53515625, 168.90625, 173.27734375, 177.6484375, 182.01953125, 186.390625, 190.76171875, 195.1328125, 199.50390625, 203.875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 3.0, 3.0, 8.0, 15.0, 23.0, 35.0, 34.0, 52.0, 66.0, 76.0, 78.0, 96.0, 89.0, 90.0, 74.0, 69.0, 67.0, 47.0, 20.0, 25.0, 16.0, 10.0, 7.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.5859375, -10.8262939453125, -10.066650390625, -9.3070068359375, -8.54736328125, -7.7877197265625, -7.028076171875, -6.2684326171875, -5.5087890625, -4.7491455078125, -3.989501953125, -3.2298583984375, -2.47021484375, -1.7105712890625, -0.950927734375, -0.1912841796875, 0.568359375, 1.3280029296875, 2.087646484375, 2.8472900390625, 3.60693359375, 4.3665771484375, 5.126220703125, 5.8858642578125, 6.6455078125, 7.4051513671875, 8.164794921875, 8.9244384765625, 9.68408203125, 10.4437255859375, 11.203369140625, 11.9630126953125, 12.72265625, 13.4822998046875, 14.241943359375, 15.0015869140625, 15.76123046875, 16.5208740234375, 17.280517578125, 18.0401611328125, 18.7998046875, 19.5594482421875, 20.319091796875, 21.0787353515625, 21.83837890625, 22.5980224609375, 23.357666015625, 24.1173095703125, 24.876953125, 25.6365966796875, 26.396240234375, 27.1558837890625, 27.91552734375, 28.6751708984375, 29.434814453125, 30.1944580078125, 30.9541015625, 31.7137451171875, 32.473388671875, 33.2330322265625, 33.99267578125, 34.7523193359375, 35.511962890625, 36.2716064453125, 37.03125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 7.0, 7.0, 3.0, 6.0, 11.0, 11.0, 27.0, 15.0, 21.0, 33.0, 41.0, 77.0, 88.0, 153.0, 241.0, 531.0, 1104.0, 2868.0, 8199.0, 28243.0, 168955.0, 3763777.0, 177531.0, 28590.0, 8237.0, 2958.0, 1223.0, 535.0, 286.0, 159.0, 99.0, 66.0, 42.0, 32.0, 24.0, 16.0, 15.0, 7.0, 17.0, 9.0, 7.0, 1.0, 6.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-155.625, -150.837890625, -146.05078125, -141.263671875, -136.4765625, -131.689453125, -126.90234375, -122.115234375, -117.328125, -112.541015625, -107.75390625, -102.966796875, -98.1796875, -93.392578125, -88.60546875, -83.818359375, -79.03125, -74.244140625, -69.45703125, -64.669921875, -59.8828125, -55.095703125, -50.30859375, -45.521484375, -40.734375, -35.947265625, -31.16015625, -26.373046875, -21.5859375, -16.798828125, -12.01171875, -7.224609375, -2.4375, 2.349609375, 7.13671875, 11.923828125, 16.7109375, 21.498046875, 26.28515625, 31.072265625, 35.859375, 40.646484375, 45.43359375, 50.220703125, 55.0078125, 59.794921875, 64.58203125, 69.369140625, 74.15625, 78.943359375, 83.73046875, 88.517578125, 93.3046875, 98.091796875, 102.87890625, 107.666015625, 112.453125, 117.240234375, 122.02734375, 126.814453125, 131.6015625, 136.388671875, 141.17578125, 145.962890625, 150.75]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 8.0, 8.0, 13.0, 16.0, 29.0, 39.0, 99.0, 216.0, 1423.0, 1788.0, 221.0, 97.0, 44.0, 33.0, 16.0, 9.0, 8.0, 12.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-97.1875, -94.697265625, -92.20703125, -89.716796875, -87.2265625, -84.736328125, -82.24609375, -79.755859375, -77.265625, -74.775390625, -72.28515625, -69.794921875, -67.3046875, -64.814453125, -62.32421875, -59.833984375, -57.34375, -54.853515625, -52.36328125, -49.873046875, -47.3828125, -44.892578125, -42.40234375, -39.912109375, -37.421875, -34.931640625, -32.44140625, -29.951171875, -27.4609375, -24.970703125, -22.48046875, -19.990234375, -17.5, -15.009765625, -12.51953125, -10.029296875, -7.5390625, -5.048828125, -2.55859375, -0.068359375, 2.421875, 4.912109375, 7.40234375, 9.892578125, 12.3828125, 14.873046875, 17.36328125, 19.853515625, 22.34375, 24.833984375, 27.32421875, 29.814453125, 32.3046875, 34.794921875, 37.28515625, 39.775390625, 42.265625, 44.755859375, 47.24609375, 49.736328125, 52.2265625, 54.716796875, 57.20703125, 59.697265625, 62.1875]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 7.0, 5.0, 11.0, 11.0, 21.0, 34.0, 48.0, 73.0, 109.0, 129.0, 170.0, 136.0, 113.0, 64.0, 34.0, 19.0, 9.0, 8.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-171.38232421875, -160.8244171142578, -150.2665252685547, -139.7086181640625, -129.15072631835938, -118.59281921386719, -108.034912109375, -97.47701263427734, -86.91911315917969, -76.36121368408203, -65.80331420898438, -55.24540710449219, -44.68750762939453, -34.129608154296875, -23.571704864501953, -13.013801574707031, -2.455902099609375, 8.101999282836914, 18.659900665283203, 29.217802047729492, 39.77570343017578, 50.33360290527344, 60.89150619506836, 71.44940948486328, 82.00730895996094, 92.5652084350586, 103.12310791015625, 113.68101501464844, 124.2389144897461, 134.79681396484375, 145.35472106933594, 155.91262817382812, 166.47052001953125, 177.02842712402344, 187.58631896972656, 198.14422607421875, 208.70211791992188, 219.26002502441406, 229.81793212890625, 240.37582397460938, 250.93373107910156, 261.49163818359375, 272.0495300292969, 282.607421875, 293.16534423828125, 303.7232360839844, 314.2811279296875, 324.83905029296875, 335.3969421386719, 345.954833984375, 356.51275634765625, 367.0706481933594, 377.6285400390625, 388.18646240234375, 398.7443542480469, 409.30224609375, 419.86016845703125, 430.4180603027344, 440.9759826660156, 451.53387451171875, 462.0917663574219, 472.649658203125, 483.20758056640625, 493.7654724121094, 504.3233642578125]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 2.0, 8.0, 11.0, 11.0, 16.0, 20.0, 15.0, 23.0, 33.0, 32.0, 38.0, 44.0, 45.0, 62.0, 49.0, 53.0, 59.0, 47.0, 39.0, 62.0, 49.0, 43.0, 45.0, 44.0, 33.0, 25.0, 20.0, 17.0, 20.0, 9.0, 8.0, 7.0, 2.0, 4.0, 7.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-192.5383758544922, -187.1134033203125, -181.68841552734375, -176.263427734375, -170.8384552001953, -165.41348266601562, -159.98849487304688, -154.56350708007812, -149.13853454589844, -143.71356201171875, -138.28857421875, -132.86358642578125, -127.43861389160156, -122.01363372802734, -116.58865356445312, -111.1636734008789, -105.73869323730469, -100.31371307373047, -94.88873291015625, -89.46375274658203, -84.03877258300781, -78.6137924194336, -73.18881225585938, -67.76383209228516, -62.33885192871094, -56.91387176513672, -51.4888916015625, -46.06391143798828, -40.63893127441406, -35.213951110839844, -29.788970947265625, -24.363990783691406, -18.938995361328125, -13.514015197753906, -8.089035034179688, -2.6640548706054688, 2.76092529296875, 8.185905456542969, 13.610885620117188, 19.035865783691406, 24.460845947265625, 29.885826110839844, 35.31080627441406, 40.73578643798828, 46.1607666015625, 51.58574676513672, 57.01072692871094, 62.435707092285156, 67.86068725585938, 73.2856674194336, 78.71064758300781, 84.13562774658203, 89.56060791015625, 94.98558807373047, 100.41056823730469, 105.8355484008789, 111.26052856445312, 116.68550872802734, 122.11048889160156, 127.53546905517578, 132.96044921875, 138.38543701171875, 143.81040954589844, 149.23538208007812, 154.66036987304688]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 7.0, 3.0, 6.0, 18.0, 26.0, 40.0, 81.0, 154.0, 237.0, 550.0, 1310.0, 4574.0, 19729.0, 108117.0, 699981.0, 175261.0, 29101.0, 6356.0, 1712.0, 646.0, 279.0, 158.0, 86.0, 42.0, 35.0, 17.0, 9.0, 3.0, 0.0, 7.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-114.8125, -110.3310546875, -105.849609375, -101.3681640625, -96.88671875, -92.4052734375, -87.923828125, -83.4423828125, -78.9609375, -74.4794921875, -69.998046875, -65.5166015625, -61.03515625, -56.5537109375, -52.072265625, -47.5908203125, -43.109375, -38.6279296875, -34.146484375, -29.6650390625, -25.18359375, -20.7021484375, -16.220703125, -11.7392578125, -7.2578125, -2.7763671875, 1.705078125, 6.1865234375, 10.66796875, 15.1494140625, 19.630859375, 24.1123046875, 28.59375, 33.0751953125, 37.556640625, 42.0380859375, 46.51953125, 51.0009765625, 55.482421875, 59.9638671875, 64.4453125, 68.9267578125, 73.408203125, 77.8896484375, 82.37109375, 86.8525390625, 91.333984375, 95.8154296875, 100.296875, 104.7783203125, 109.259765625, 113.7412109375, 118.22265625, 122.7041015625, 127.185546875, 131.6669921875, 136.1484375, 140.6298828125, 145.111328125, 149.5927734375, 154.07421875, 158.5556640625, 163.037109375, 167.5185546875, 172.0]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 7.0, 7.0, 19.0, 13.0, 9.0, 30.0, 25.0, 39.0, 48.0, 44.0, 59.0, 54.0, 54.0, 58.0, 72.0, 71.0, 48.0, 41.0, 54.0, 55.0, 45.0, 30.0, 28.0, 21.0, 8.0, 26.0, 9.0, 9.0, 7.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.203125, -13.624755859375, -13.04638671875, -12.468017578125, -11.8896484375, -11.311279296875, -10.73291015625, -10.154541015625, -9.576171875, -8.997802734375, -8.41943359375, -7.841064453125, -7.2626953125, -6.684326171875, -6.10595703125, -5.527587890625, -4.94921875, -4.370849609375, -3.79248046875, -3.214111328125, -2.6357421875, -2.057373046875, -1.47900390625, -0.900634765625, -0.322265625, 0.256103515625, 0.83447265625, 1.412841796875, 1.9912109375, 2.569580078125, 3.14794921875, 3.726318359375, 4.3046875, 4.883056640625, 5.46142578125, 6.039794921875, 6.6181640625, 7.196533203125, 7.77490234375, 8.353271484375, 8.931640625, 9.510009765625, 10.08837890625, 10.666748046875, 11.2451171875, 11.823486328125, 12.40185546875, 12.980224609375, 13.55859375, 14.136962890625, 14.71533203125, 15.293701171875, 15.8720703125, 16.450439453125, 17.02880859375, 17.607177734375, 18.185546875, 18.763916015625, 19.34228515625, 19.920654296875, 20.4990234375, 21.077392578125, 21.65576171875, 22.234130859375, 22.8125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 3.0, 2.0, 3.0, 7.0, 5.0, 5.0, 10.0, 16.0, 12.0, 26.0, 34.0, 56.0, 74.0, 102.0, 197.0, 408.0, 717.0, 1478.0, 3239.0, 7832.0, 21612.0, 68458.0, 345492.0, 469556.0, 86702.0, 25766.0, 9441.0, 3688.0, 1768.0, 769.0, 414.0, 235.0, 123.0, 107.0, 62.0, 41.0, 18.0, 14.0, 20.0, 16.0, 9.0, 5.0, 6.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-80.125, -77.6279296875, -75.130859375, -72.6337890625, -70.13671875, -67.6396484375, -65.142578125, -62.6455078125, -60.1484375, -57.6513671875, -55.154296875, -52.6572265625, -50.16015625, -47.6630859375, -45.166015625, -42.6689453125, -40.171875, -37.6748046875, -35.177734375, -32.6806640625, -30.18359375, -27.6865234375, -25.189453125, -22.6923828125, -20.1953125, -17.6982421875, -15.201171875, -12.7041015625, -10.20703125, -7.7099609375, -5.212890625, -2.7158203125, -0.21875, 2.2783203125, 4.775390625, 7.2724609375, 9.76953125, 12.2666015625, 14.763671875, 17.2607421875, 19.7578125, 22.2548828125, 24.751953125, 27.2490234375, 29.74609375, 32.2431640625, 34.740234375, 37.2373046875, 39.734375, 42.2314453125, 44.728515625, 47.2255859375, 49.72265625, 52.2197265625, 54.716796875, 57.2138671875, 59.7109375, 62.2080078125, 64.705078125, 67.2021484375, 69.69921875, 72.1962890625, 74.693359375, 77.1904296875, 79.6875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 8.0, 7.0, 8.0, 11.0, 14.0, 18.0, 17.0, 19.0, 22.0, 36.0, 35.0, 32.0, 47.0, 39.0, 66.0, 47.0, 49.0, 52.0, 61.0, 49.0, 46.0, 39.0, 50.0, 31.0, 48.0, 25.0, 24.0, 22.0, 21.0, 9.0, 11.0, 3.0, 8.0, 4.0, 5.0, 6.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-70.5625, -68.3466796875, -66.130859375, -63.9150390625, -61.69921875, -59.4833984375, -57.267578125, -55.0517578125, -52.8359375, -50.6201171875, -48.404296875, -46.1884765625, -43.97265625, -41.7568359375, -39.541015625, -37.3251953125, -35.109375, -32.8935546875, -30.677734375, -28.4619140625, -26.24609375, -24.0302734375, -21.814453125, -19.5986328125, -17.3828125, -15.1669921875, -12.951171875, -10.7353515625, -8.51953125, -6.3037109375, -4.087890625, -1.8720703125, 0.34375, 2.5595703125, 4.775390625, 6.9912109375, 9.20703125, 11.4228515625, 13.638671875, 15.8544921875, 18.0703125, 20.2861328125, 22.501953125, 24.7177734375, 26.93359375, 29.1494140625, 31.365234375, 33.5810546875, 35.796875, 38.0126953125, 40.228515625, 42.4443359375, 44.66015625, 46.8759765625, 49.091796875, 51.3076171875, 53.5234375, 55.7392578125, 57.955078125, 60.1708984375, 62.38671875, 64.6025390625, 66.818359375, 69.0341796875, 71.25]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 8.0, 9.0, 4.0, 12.0, 13.0, 25.0, 28.0, 70.0, 100.0, 142.0, 250.0, 566.0, 1306.0, 3478.0, 10498.0, 39068.0, 292106.0, 614880.0, 62833.0, 15075.0, 4813.0, 1766.0, 697.0, 344.0, 180.0, 108.0, 66.0, 42.0, 22.0, 13.0, 10.0, 8.0, 6.0, 8.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.03125, -43.24072265625, -41.4501953125, -39.65966796875, -37.869140625, -36.07861328125, -34.2880859375, -32.49755859375, -30.70703125, -28.91650390625, -27.1259765625, -25.33544921875, -23.544921875, -21.75439453125, -19.9638671875, -18.17333984375, -16.3828125, -14.59228515625, -12.8017578125, -11.01123046875, -9.220703125, -7.43017578125, -5.6396484375, -3.84912109375, -2.05859375, -0.26806640625, 1.5224609375, 3.31298828125, 5.103515625, 6.89404296875, 8.6845703125, 10.47509765625, 12.265625, 14.05615234375, 15.8466796875, 17.63720703125, 19.427734375, 21.21826171875, 23.0087890625, 24.79931640625, 26.58984375, 28.38037109375, 30.1708984375, 31.96142578125, 33.751953125, 35.54248046875, 37.3330078125, 39.12353515625, 40.9140625, 42.70458984375, 44.4951171875, 46.28564453125, 48.076171875, 49.86669921875, 51.6572265625, 53.44775390625, 55.23828125, 57.02880859375, 58.8193359375, 60.60986328125, 62.400390625, 64.19091796875, 65.9814453125, 67.77197265625, 69.5625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 6.0, 2.0, 5.0, 3.0, 12.0, 10.0, 10.0, 10.0, 20.0, 17.0, 25.0, 25.0, 48.0, 131.0, 280.0, 194.0, 61.0, 36.0, 18.0, 18.0, 6.0, 7.0, 14.0, 10.0, 4.0, 7.0, 6.0, 3.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.009429931640625, -0.009149909019470215, -0.00886988639831543, -0.008589863777160645, -0.00830984115600586, -0.008029818534851074, -0.007749795913696289, -0.007469773292541504, -0.007189750671386719, -0.006909728050231934, -0.0066297054290771484, -0.006349682807922363, -0.006069660186767578, -0.005789637565612793, -0.005509614944458008, -0.005229592323303223, -0.0049495697021484375, -0.004669547080993652, -0.004389524459838867, -0.004109501838684082, -0.003829479217529297, -0.0035494565963745117, -0.0032694339752197266, -0.0029894113540649414, -0.0027093887329101562, -0.002429366111755371, -0.002149343490600586, -0.0018693208694458008, -0.0015892982482910156, -0.0013092756271362305, -0.0010292530059814453, -0.0007492303848266602, -0.000469207763671875, -0.00018918514251708984, 9.083747863769531e-05, 0.00037086009979248047, 0.0006508827209472656, 0.0009309053421020508, 0.001210927963256836, 0.001490950584411621, 0.0017709732055664062, 0.0020509958267211914, 0.0023310184478759766, 0.0026110410690307617, 0.002891063690185547, 0.003171086311340332, 0.003451108932495117, 0.0037311315536499023, 0.0040111541748046875, 0.004291176795959473, 0.004571199417114258, 0.004851222038269043, 0.005131244659423828, 0.005411267280578613, 0.0056912899017333984, 0.005971312522888184, 0.006251335144042969, 0.006531357765197754, 0.006811380386352539, 0.007091403007507324, 0.007371425628662109, 0.0076514482498168945, 0.00793147087097168, 0.008211493492126465, 0.00849151611328125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 6.0, 3.0, 7.0, 4.0, 11.0, 16.0, 31.0, 34.0, 42.0, 87.0, 128.0, 215.0, 366.0, 812.0, 1734.0, 4162.0, 11880.0, 42713.0, 318922.0, 580696.0, 61561.0, 15895.0, 5253.0, 1956.0, 931.0, 474.0, 213.0, 141.0, 83.0, 56.0, 36.0, 28.0, 17.0, 20.0, 5.0, 6.0, 7.0, 3.0, 6.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-65.875, -64.19091796875, -62.5068359375, -60.82275390625, -59.138671875, -57.45458984375, -55.7705078125, -54.08642578125, -52.40234375, -50.71826171875, -49.0341796875, -47.35009765625, -45.666015625, -43.98193359375, -42.2978515625, -40.61376953125, -38.9296875, -37.24560546875, -35.5615234375, -33.87744140625, -32.193359375, -30.50927734375, -28.8251953125, -27.14111328125, -25.45703125, -23.77294921875, -22.0888671875, -20.40478515625, -18.720703125, -17.03662109375, -15.3525390625, -13.66845703125, -11.984375, -10.30029296875, -8.6162109375, -6.93212890625, -5.248046875, -3.56396484375, -1.8798828125, -0.19580078125, 1.48828125, 3.17236328125, 4.8564453125, 6.54052734375, 8.224609375, 9.90869140625, 11.5927734375, 13.27685546875, 14.9609375, 16.64501953125, 18.3291015625, 20.01318359375, 21.697265625, 23.38134765625, 25.0654296875, 26.74951171875, 28.43359375, 30.11767578125, 31.8017578125, 33.48583984375, 35.169921875, 36.85400390625, 38.5380859375, 40.22216796875, 41.90625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 5.0, 7.0, 13.0, 14.0, 15.0, 20.0, 24.0, 35.0, 60.0, 87.0, 159.0, 157.0, 131.0, 63.0, 46.0, 38.0, 18.0, 15.0, 10.0, 11.0, 17.0, 12.0, 9.0, 11.0, 6.0, 1.0, 4.0, 5.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.46875, -40.35791015625, -39.2470703125, -38.13623046875, -37.025390625, -35.91455078125, -34.8037109375, -33.69287109375, -32.58203125, -31.47119140625, -30.3603515625, -29.24951171875, -28.138671875, -27.02783203125, -25.9169921875, -24.80615234375, -23.6953125, -22.58447265625, -21.4736328125, -20.36279296875, -19.251953125, -18.14111328125, -17.0302734375, -15.91943359375, -14.80859375, -13.69775390625, -12.5869140625, -11.47607421875, -10.365234375, -9.25439453125, -8.1435546875, -7.03271484375, -5.921875, -4.81103515625, -3.7001953125, -2.58935546875, -1.478515625, -0.36767578125, 0.7431640625, 1.85400390625, 2.96484375, 4.07568359375, 5.1865234375, 6.29736328125, 7.408203125, 8.51904296875, 9.6298828125, 10.74072265625, 11.8515625, 12.96240234375, 14.0732421875, 15.18408203125, 16.294921875, 17.40576171875, 18.5166015625, 19.62744140625, 20.73828125, 21.84912109375, 22.9599609375, 24.07080078125, 25.181640625, 26.29248046875, 27.4033203125, 28.51416015625, 29.625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 6.0, 9.0, 4.0, 8.0, 10.0, 12.0, 26.0, 22.0, 38.0, 55.0, 66.0, 76.0, 93.0, 86.0, 94.0, 85.0, 62.0, 64.0, 50.0, 36.0, 34.0, 14.0, 19.0, 11.0, 7.0, 3.0, 4.0, 4.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-312.44696044921875, -299.7755126953125, -287.1040954589844, -274.4326477050781, -261.7611999511719, -249.0897674560547, -236.4183349609375, -223.74688720703125, -211.07545471191406, -198.40402221679688, -185.73257446289062, -173.06114196777344, -160.38970947265625, -147.71826171875, -135.0468292236328, -122.3753890991211, -109.70394897460938, -97.03250885009766, -84.36106872558594, -71.68963623046875, -59.01819610595703, -46.34675598144531, -33.675323486328125, -21.003883361816406, -8.332443237304688, 4.338994979858398, 17.010433197021484, 29.681869506835938, 42.353309631347656, 55.024749755859375, 67.69618225097656, 80.36762237548828, 93.03903198242188, 105.7104721069336, 118.38191223144531, 131.0533447265625, 143.72479248046875, 156.39622497558594, 169.06765747070312, 181.73910522460938, 194.41053771972656, 207.08197021484375, 219.75341796875, 232.4248504638672, 245.09628295898438, 257.7677307128906, 270.43914794921875, 283.110595703125, 295.78204345703125, 308.4534912109375, 321.1249084472656, 333.7963562011719, 346.4678039550781, 359.13922119140625, 371.8106689453125, 384.48211669921875, 397.153564453125, 409.82501220703125, 422.4964294433594, 435.1678771972656, 447.8393249511719, 460.5107421875, 473.18218994140625, 485.8536376953125, 498.5250549316406]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 2.0, 9.0, 6.0, 8.0, 10.0, 9.0, 16.0, 24.0, 32.0, 29.0, 41.0, 35.0, 38.0, 33.0, 60.0, 50.0, 58.0, 54.0, 47.0, 65.0, 50.0, 47.0, 47.0, 34.0, 26.0, 38.0, 31.0, 14.0, 15.0, 18.0, 18.0, 12.0, 3.0, 5.0, 6.0, 6.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-289.9058837890625, -278.63897705078125, -267.3720397949219, -256.1051330566406, -244.8382110595703, -233.5712890625, -222.3043670654297, -211.03744506835938, -199.77053833007812, -188.5036163330078, -177.2366943359375, -165.96978759765625, -154.70286560058594, -143.43594360351562, -132.1690216064453, -120.90210723876953, -109.63517761230469, -98.36825561523438, -87.1013412475586, -75.83441925048828, -64.5675048828125, -53.30058288574219, -42.033660888671875, -30.766746520996094, -19.49982452392578, -8.232905387878418, 3.0340137481689453, 14.300933837890625, 25.567852020263672, 36.83477020263672, 48.10169219970703, 59.36860656738281, 70.63552856445312, 81.90245056152344, 93.16936492919922, 104.43628692626953, 115.70320129394531, 126.97012329101562, 138.23704528808594, 149.50396728515625, 160.7708740234375, 172.0377960205078, 183.30471801757812, 194.57162475585938, 205.8385467529297, 217.10546875, 228.3723907470703, 239.63931274414062, 250.90623474121094, 262.17315673828125, 273.4400634765625, 284.7070007324219, 295.9739074707031, 307.2408447265625, 318.50775146484375, 329.774658203125, 341.0415954589844, 352.3085021972656, 363.575439453125, 374.84234619140625, 386.1092834472656, 397.3761901855469, 408.64312744140625, 419.9100341796875, 431.17694091796875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 5.0, 2.0, 4.0, 10.0, 5.0, 16.0, 21.0, 19.0, 33.0, 70.0, 109.0, 156.0, 313.0, 522.0, 992.0, 1857.0, 3847.0, 8631.0, 21634.0, 66351.0, 594146.0, 3347899.0, 99007.0, 27587.0, 10740.0, 4749.0, 2264.0, 1200.0, 709.0, 445.0, 286.0, 181.0, 114.0, 97.0, 70.0, 48.0, 45.0, 23.0, 19.0, 16.0, 9.0, 3.0, 5.0, 9.0, 4.0, 3.0, 2.0, 4.0, 1.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-106.375, -101.96875, -97.5625, -93.15625, -88.75, -84.34375, -79.9375, -75.53125, -71.125, -66.71875, -62.3125, -57.90625, -53.5, -49.09375, -44.6875, -40.28125, -35.875, -31.46875, -27.0625, -22.65625, -18.25, -13.84375, -9.4375, -5.03125, -0.625, 3.78125, 8.1875, 12.59375, 17.0, 21.40625, 25.8125, 30.21875, 34.625, 39.03125, 43.4375, 47.84375, 52.25, 56.65625, 61.0625, 65.46875, 69.875, 74.28125, 78.6875, 83.09375, 87.5, 91.90625, 96.3125, 100.71875, 105.125, 109.53125, 113.9375, 118.34375, 122.75, 127.15625, 131.5625, 135.96875, 140.375, 144.78125, 149.1875, 153.59375, 158.0, 162.40625, 166.8125, 171.21875, 175.625]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 7.0, 5.0, 8.0, 13.0, 19.0, 26.0, 19.0, 52.0, 50.0, 71.0, 64.0, 67.0, 64.0, 81.0, 82.0, 81.0, 62.0, 59.0, 46.0, 35.0, 30.0, 28.0, 17.0, 11.0, 6.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.0703125, -11.2908935546875, -10.511474609375, -9.7320556640625, -8.95263671875, -8.1732177734375, -7.393798828125, -6.6143798828125, -5.8349609375, -5.0555419921875, -4.276123046875, -3.4967041015625, -2.71728515625, -1.9378662109375, -1.158447265625, -0.3790283203125, 0.400390625, 1.1798095703125, 1.959228515625, 2.7386474609375, 3.51806640625, 4.2974853515625, 5.076904296875, 5.8563232421875, 6.6357421875, 7.4151611328125, 8.194580078125, 8.9739990234375, 9.75341796875, 10.5328369140625, 11.312255859375, 12.0916748046875, 12.87109375, 13.6505126953125, 14.429931640625, 15.2093505859375, 15.98876953125, 16.7681884765625, 17.547607421875, 18.3270263671875, 19.1064453125, 19.8858642578125, 20.665283203125, 21.4447021484375, 22.22412109375, 23.0035400390625, 23.782958984375, 24.5623779296875, 25.341796875, 26.1212158203125, 26.900634765625, 27.6800537109375, 28.45947265625, 29.2388916015625, 30.018310546875, 30.7977294921875, 31.5771484375, 32.3565673828125, 33.135986328125, 33.9154052734375, 34.69482421875, 35.4742431640625, 36.253662109375, 37.0330810546875, 37.8125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 4.0, 3.0, 7.0, 5.0, 5.0, 12.0, 21.0, 28.0, 47.0, 45.0, 82.0, 98.0, 159.0, 248.0, 336.0, 565.0, 854.0, 1302.0, 2294.0, 3992.0, 7284.0, 14729.0, 35966.0, 122537.0, 3230258.0, 642685.0, 78354.0, 26396.0, 11565.0, 5933.0, 3365.0, 1845.0, 1116.0, 756.0, 428.0, 294.0, 201.0, 129.0, 100.0, 75.0, 40.0, 41.0, 23.0, 17.0, 13.0, 13.0, 10.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-125.1875, -121.3759765625, -117.564453125, -113.7529296875, -109.94140625, -106.1298828125, -102.318359375, -98.5068359375, -94.6953125, -90.8837890625, -87.072265625, -83.2607421875, -79.44921875, -75.6376953125, -71.826171875, -68.0146484375, -64.203125, -60.3916015625, -56.580078125, -52.7685546875, -48.95703125, -45.1455078125, -41.333984375, -37.5224609375, -33.7109375, -29.8994140625, -26.087890625, -22.2763671875, -18.46484375, -14.6533203125, -10.841796875, -7.0302734375, -3.21875, 0.5927734375, 4.404296875, 8.2158203125, 12.02734375, 15.8388671875, 19.650390625, 23.4619140625, 27.2734375, 31.0849609375, 34.896484375, 38.7080078125, 42.51953125, 46.3310546875, 50.142578125, 53.9541015625, 57.765625, 61.5771484375, 65.388671875, 69.2001953125, 73.01171875, 76.8232421875, 80.634765625, 84.4462890625, 88.2578125, 92.0693359375, 95.880859375, 99.6923828125, 103.50390625, 107.3154296875, 111.126953125, 114.9384765625, 118.75]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 5.0, 5.0, 6.0, 8.0, 8.0, 12.0, 14.0, 13.0, 19.0, 23.0, 31.0, 52.0, 75.0, 173.0, 539.0, 2264.0, 412.0, 161.0, 65.0, 56.0, 33.0, 27.0, 12.0, 9.0, 13.0, 4.0, 6.0, 8.0, 6.0, 2.0, 1.0, 5.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.84375, -59.021484375, -57.19921875, -55.376953125, -53.5546875, -51.732421875, -49.91015625, -48.087890625, -46.265625, -44.443359375, -42.62109375, -40.798828125, -38.9765625, -37.154296875, -35.33203125, -33.509765625, -31.6875, -29.865234375, -28.04296875, -26.220703125, -24.3984375, -22.576171875, -20.75390625, -18.931640625, -17.109375, -15.287109375, -13.46484375, -11.642578125, -9.8203125, -7.998046875, -6.17578125, -4.353515625, -2.53125, -0.708984375, 1.11328125, 2.935546875, 4.7578125, 6.580078125, 8.40234375, 10.224609375, 12.046875, 13.869140625, 15.69140625, 17.513671875, 19.3359375, 21.158203125, 22.98046875, 24.802734375, 26.625, 28.447265625, 30.26953125, 32.091796875, 33.9140625, 35.736328125, 37.55859375, 39.380859375, 41.203125, 43.025390625, 44.84765625, 46.669921875, 48.4921875, 50.314453125, 52.13671875, 53.958984375, 55.78125]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 4.0, 2.0, 7.0, 7.0, 11.0, 18.0, 35.0, 51.0, 106.0, 137.0, 194.0, 154.0, 106.0, 84.0, 43.0, 25.0, 13.0, 8.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-411.00469970703125, -398.42449951171875, -385.84429931640625, -373.26409912109375, -360.68389892578125, -348.10369873046875, -335.52349853515625, -322.94329833984375, -310.36309814453125, -297.78289794921875, -285.20269775390625, -272.62249755859375, -260.04229736328125, -247.46209716796875, -234.8818817138672, -222.3016815185547, -209.72146606445312, -197.14126586914062, -184.56106567382812, -171.98086547851562, -159.40066528320312, -146.82046508789062, -134.24024963378906, -121.66004943847656, -109.07984924316406, -96.49964904785156, -83.91944885253906, -71.33924102783203, -58.75904083251953, -46.17884063720703, -33.5986328125, -21.0184326171875, -8.438201904296875, 4.142000198364258, 16.72220230102539, 29.302406311035156, 41.882606506347656, 54.462806701660156, 67.04301452636719, 79.62321472167969, 92.20341491699219, 104.78361511230469, 117.36381530761719, 129.94403076171875, 142.52423095703125, 155.10443115234375, 167.68463134765625, 180.26483154296875, 192.84503173828125, 205.42523193359375, 218.00543212890625, 230.58563232421875, 243.16583251953125, 255.74603271484375, 268.32623291015625, 280.90643310546875, 293.48663330078125, 306.06683349609375, 318.64703369140625, 331.22723388671875, 343.80743408203125, 356.38763427734375, 368.96783447265625, 381.54803466796875, 394.1282653808594]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 12.0, 10.0, 3.0, 15.0, 23.0, 26.0, 29.0, 33.0, 35.0, 45.0, 61.0, 59.0, 58.0, 58.0, 52.0, 63.0, 67.0, 56.0, 47.0, 59.0, 43.0, 37.0, 32.0, 27.0, 26.0, 7.0, 11.0, 7.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-286.4460754394531, -279.5267639160156, -272.607421875, -265.6881103515625, -258.768798828125, -251.8494873046875, -244.93016052246094, -238.01083374023438, -231.09152221679688, -224.17221069335938, -217.2528839111328, -210.33355712890625, -203.41424560546875, -196.49493408203125, -189.5756072998047, -182.65628051757812, -175.73696899414062, -168.81765747070312, -161.89833068847656, -154.97900390625, -148.0596923828125, -141.140380859375, -134.22105407714844, -127.3017349243164, -120.38241577148438, -113.46309661865234, -106.54377746582031, -99.62445831298828, -92.70513916015625, -85.78582000732422, -78.86650085449219, -71.94718170166016, -65.02784729003906, -58.10852813720703, -51.189208984375, -44.26988983154297, -37.35057067871094, -30.431251525878906, -23.511932373046875, -16.592613220214844, -9.673294067382812, -2.7539749145507812, 4.16534423828125, 11.084663391113281, 18.003982543945312, 24.923301696777344, 31.842620849609375, 38.761940002441406, 45.68125915527344, 52.60057830810547, 59.5198974609375, 66.43921661376953, 73.35853576660156, 80.2778549194336, 87.19717407226562, 94.11649322509766, 101.03581237792969, 107.95513153076172, 114.87445068359375, 121.79376983642578, 128.7130889892578, 135.63241577148438, 142.55172729492188, 149.47103881835938, 156.39036560058594]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 2.0, 6.0, 9.0, 8.0, 14.0, 13.0, 25.0, 46.0, 76.0, 101.0, 180.0, 349.0, 577.0, 1216.0, 2444.0, 5547.0, 12934.0, 32332.0, 82612.0, 219307.0, 411450.0, 170282.0, 64565.0, 25222.0, 10333.0, 4600.0, 2048.0, 1023.0, 481.0, 283.0, 206.0, 88.0, 69.0, 39.0, 22.0, 15.0, 12.0, 10.0, 4.0, 3.0, 1.0, 4.0, 2.0, 1.0], "bins": [-107.8125, -105.14208984375, -102.4716796875, -99.80126953125, -97.130859375, -94.46044921875, -91.7900390625, -89.11962890625, -86.44921875, -83.77880859375, -81.1083984375, -78.43798828125, -75.767578125, -73.09716796875, -70.4267578125, -67.75634765625, -65.0859375, -62.41552734375, -59.7451171875, -57.07470703125, -54.404296875, -51.73388671875, -49.0634765625, -46.39306640625, -43.72265625, -41.05224609375, -38.3818359375, -35.71142578125, -33.041015625, -30.37060546875, -27.7001953125, -25.02978515625, -22.359375, -19.68896484375, -17.0185546875, -14.34814453125, -11.677734375, -9.00732421875, -6.3369140625, -3.66650390625, -0.99609375, 1.67431640625, 4.3447265625, 7.01513671875, 9.685546875, 12.35595703125, 15.0263671875, 17.69677734375, 20.3671875, 23.03759765625, 25.7080078125, 28.37841796875, 31.048828125, 33.71923828125, 36.3896484375, 39.06005859375, 41.73046875, 44.40087890625, 47.0712890625, 49.74169921875, 52.412109375, 55.08251953125, 57.7529296875, 60.42333984375, 63.09375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 4.0, 1.0, 6.0, 11.0, 11.0, 16.0, 23.0, 24.0, 26.0, 26.0, 35.0, 24.0, 45.0, 36.0, 51.0, 44.0, 53.0, 61.0, 54.0, 45.0, 43.0, 48.0, 43.0, 43.0, 32.0, 26.0, 38.0, 25.0, 25.0, 17.0, 10.0, 11.0, 11.0, 10.0, 4.0, 6.0, 4.0, 4.0, 6.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.078125, -13.520263671875, -12.96240234375, -12.404541015625, -11.8466796875, -11.288818359375, -10.73095703125, -10.173095703125, -9.615234375, -9.057373046875, -8.49951171875, -7.941650390625, -7.3837890625, -6.825927734375, -6.26806640625, -5.710205078125, -5.15234375, -4.594482421875, -4.03662109375, -3.478759765625, -2.9208984375, -2.363037109375, -1.80517578125, -1.247314453125, -0.689453125, -0.131591796875, 0.42626953125, 0.984130859375, 1.5419921875, 2.099853515625, 2.65771484375, 3.215576171875, 3.7734375, 4.331298828125, 4.88916015625, 5.447021484375, 6.0048828125, 6.562744140625, 7.12060546875, 7.678466796875, 8.236328125, 8.794189453125, 9.35205078125, 9.909912109375, 10.4677734375, 11.025634765625, 11.58349609375, 12.141357421875, 12.69921875, 13.257080078125, 13.81494140625, 14.372802734375, 14.9306640625, 15.488525390625, 16.04638671875, 16.604248046875, 17.162109375, 17.719970703125, 18.27783203125, 18.835693359375, 19.3935546875, 19.951416015625, 20.50927734375, 21.067138671875, 21.625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 10.0, 3.0, 8.0, 13.0, 19.0, 26.0, 47.0, 34.0, 67.0, 91.0, 133.0, 209.0, 260.0, 415.0, 754.0, 1286.0, 3227.0, 8906.0, 31249.0, 134359.0, 580993.0, 217826.0, 47587.0, 12868.0, 4135.0, 1656.0, 843.0, 475.0, 293.0, 206.0, 167.0, 99.0, 70.0, 57.0, 45.0, 30.0, 21.0, 18.0, 13.0, 12.0, 10.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-115.4375, -112.0068359375, -108.576171875, -105.1455078125, -101.71484375, -98.2841796875, -94.853515625, -91.4228515625, -87.9921875, -84.5615234375, -81.130859375, -77.7001953125, -74.26953125, -70.8388671875, -67.408203125, -63.9775390625, -60.546875, -57.1162109375, -53.685546875, -50.2548828125, -46.82421875, -43.3935546875, -39.962890625, -36.5322265625, -33.1015625, -29.6708984375, -26.240234375, -22.8095703125, -19.37890625, -15.9482421875, -12.517578125, -9.0869140625, -5.65625, -2.2255859375, 1.205078125, 4.6357421875, 8.06640625, 11.4970703125, 14.927734375, 18.3583984375, 21.7890625, 25.2197265625, 28.650390625, 32.0810546875, 35.51171875, 38.9423828125, 42.373046875, 45.8037109375, 49.234375, 52.6650390625, 56.095703125, 59.5263671875, 62.95703125, 66.3876953125, 69.818359375, 73.2490234375, 76.6796875, 80.1103515625, 83.541015625, 86.9716796875, 90.40234375, 93.8330078125, 97.263671875, 100.6943359375, 104.125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 3.0, 3.0, 5.0, 11.0, 5.0, 14.0, 17.0, 19.0, 21.0, 24.0, 24.0, 35.0, 31.0, 27.0, 44.0, 46.0, 42.0, 50.0, 68.0, 56.0, 51.0, 47.0, 40.0, 35.0, 40.0, 30.0, 37.0, 26.0, 21.0, 20.0, 16.0, 14.0, 12.0, 12.0, 7.0, 9.0, 9.0, 8.0, 7.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-78.125, -75.576171875, -73.02734375, -70.478515625, -67.9296875, -65.380859375, -62.83203125, -60.283203125, -57.734375, -55.185546875, -52.63671875, -50.087890625, -47.5390625, -44.990234375, -42.44140625, -39.892578125, -37.34375, -34.794921875, -32.24609375, -29.697265625, -27.1484375, -24.599609375, -22.05078125, -19.501953125, -16.953125, -14.404296875, -11.85546875, -9.306640625, -6.7578125, -4.208984375, -1.66015625, 0.888671875, 3.4375, 5.986328125, 8.53515625, 11.083984375, 13.6328125, 16.181640625, 18.73046875, 21.279296875, 23.828125, 26.376953125, 28.92578125, 31.474609375, 34.0234375, 36.572265625, 39.12109375, 41.669921875, 44.21875, 46.767578125, 49.31640625, 51.865234375, 54.4140625, 56.962890625, 59.51171875, 62.060546875, 64.609375, 67.158203125, 69.70703125, 72.255859375, 74.8046875, 77.353515625, 79.90234375, 82.451171875, 85.0]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 10.0, 5.0, 8.0, 15.0, 10.0, 12.0, 16.0, 23.0, 45.0, 61.0, 81.0, 143.0, 289.0, 583.0, 1656.0, 6325.0, 48535.0, 909793.0, 69868.0, 7751.0, 1872.0, 662.0, 332.0, 145.0, 98.0, 80.0, 43.0, 30.0, 24.0, 10.0, 11.0, 6.0, 9.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-163.0, -156.86328125, -150.7265625, -144.58984375, -138.453125, -132.31640625, -126.1796875, -120.04296875, -113.90625, -107.76953125, -101.6328125, -95.49609375, -89.359375, -83.22265625, -77.0859375, -70.94921875, -64.8125, -58.67578125, -52.5390625, -46.40234375, -40.265625, -34.12890625, -27.9921875, -21.85546875, -15.71875, -9.58203125, -3.4453125, 2.69140625, 8.828125, 14.96484375, 21.1015625, 27.23828125, 33.375, 39.51171875, 45.6484375, 51.78515625, 57.921875, 64.05859375, 70.1953125, 76.33203125, 82.46875, 88.60546875, 94.7421875, 100.87890625, 107.015625, 113.15234375, 119.2890625, 125.42578125, 131.5625, 137.69921875, 143.8359375, 149.97265625, 156.109375, 162.24609375, 168.3828125, 174.51953125, 180.65625, 186.79296875, 192.9296875, 199.06640625, 205.203125, 211.33984375, 217.4765625, 223.61328125, 229.75]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 4.0, 4.0, 4.0, 4.0, 6.0, 11.0, 15.0, 12.0, 19.0, 34.0, 37.0, 52.0, 62.0, 74.0, 307.0, 101.0, 72.0, 48.0, 37.0, 25.0, 18.0, 18.0, 10.0, 7.0, 4.0, 5.0, 7.0, 2.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01611328125, -0.01560211181640625, -0.0150909423828125, -0.01457977294921875, -0.014068603515625, -0.01355743408203125, -0.0130462646484375, -0.01253509521484375, -0.01202392578125, -0.01151275634765625, -0.0110015869140625, -0.01049041748046875, -0.009979248046875, -0.00946807861328125, -0.0089569091796875, -0.00844573974609375, -0.0079345703125, -0.00742340087890625, -0.0069122314453125, -0.00640106201171875, -0.005889892578125, -0.00537872314453125, -0.0048675537109375, -0.00435638427734375, -0.00384521484375, -0.00333404541015625, -0.0028228759765625, -0.00231170654296875, -0.001800537109375, -0.00128936767578125, -0.0007781982421875, -0.00026702880859375, 0.000244140625, 0.00075531005859375, 0.0012664794921875, 0.00177764892578125, 0.002288818359375, 0.00279998779296875, 0.0033111572265625, 0.00382232666015625, 0.00433349609375, 0.00484466552734375, 0.0053558349609375, 0.00586700439453125, 0.006378173828125, 0.00688934326171875, 0.0074005126953125, 0.00791168212890625, 0.0084228515625, 0.00893402099609375, 0.0094451904296875, 0.00995635986328125, 0.010467529296875, 0.01097869873046875, 0.0114898681640625, 0.01200103759765625, 0.01251220703125, 0.01302337646484375, 0.0135345458984375, 0.01404571533203125, 0.014556884765625, 0.01506805419921875, 0.0155792236328125, 0.01609039306640625, 0.0166015625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 7.0, 14.0, 12.0, 19.0, 37.0, 57.0, 108.0, 214.0, 443.0, 1851.0, 12903.0, 923344.0, 103097.0, 4853.0, 980.0, 304.0, 119.0, 77.0, 37.0, 28.0, 16.0, 14.0, 13.0, 4.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-377.75, -368.25390625, -358.7578125, -349.26171875, -339.765625, -330.26953125, -320.7734375, -311.27734375, -301.78125, -292.28515625, -282.7890625, -273.29296875, -263.796875, -254.30078125, -244.8046875, -235.30859375, -225.8125, -216.31640625, -206.8203125, -197.32421875, -187.828125, -178.33203125, -168.8359375, -159.33984375, -149.84375, -140.34765625, -130.8515625, -121.35546875, -111.859375, -102.36328125, -92.8671875, -83.37109375, -73.875, -64.37890625, -54.8828125, -45.38671875, -35.890625, -26.39453125, -16.8984375, -7.40234375, 2.09375, 11.58984375, 21.0859375, 30.58203125, 40.078125, 49.57421875, 59.0703125, 68.56640625, 78.0625, 87.55859375, 97.0546875, 106.55078125, 116.046875, 125.54296875, 135.0390625, 144.53515625, 154.03125, 163.52734375, 173.0234375, 182.51953125, 192.015625, 201.51171875, 211.0078125, 220.50390625, 230.0]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 4.0, 4.0, 4.0, 6.0, 6.0, 15.0, 16.0, 25.0, 34.0, 38.0, 84.0, 137.0, 217.0, 171.0, 81.0, 50.0, 21.0, 23.0, 12.0, 13.0, 11.0, 6.0, 4.0, 5.0, 4.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-102.875, -100.0546875, -97.234375, -94.4140625, -91.59375, -88.7734375, -85.953125, -83.1328125, -80.3125, -77.4921875, -74.671875, -71.8515625, -69.03125, -66.2109375, -63.390625, -60.5703125, -57.75, -54.9296875, -52.109375, -49.2890625, -46.46875, -43.6484375, -40.828125, -38.0078125, -35.1875, -32.3671875, -29.546875, -26.7265625, -23.90625, -21.0859375, -18.265625, -15.4453125, -12.625, -9.8046875, -6.984375, -4.1640625, -1.34375, 1.4765625, 4.296875, 7.1171875, 9.9375, 12.7578125, 15.578125, 18.3984375, 21.21875, 24.0390625, 26.859375, 29.6796875, 32.5, 35.3203125, 38.140625, 40.9609375, 43.78125, 46.6015625, 49.421875, 52.2421875, 55.0625, 57.8828125, 60.703125, 63.5234375, 66.34375, 69.1640625, 71.984375, 74.8046875, 77.625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 9.0, 9.0, 29.0, 56.0, 117.0, 183.0, 225.0, 178.0, 101.0, 58.0, 26.0, 9.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2286.513916015625, -2236.326171875, -2186.138427734375, -2135.95068359375, -2085.762939453125, -2035.5751953125, -1985.387451171875, -1935.19970703125, -1885.011962890625, -1834.82421875, -1784.636474609375, -1734.44873046875, -1684.260986328125, -1634.0732421875, -1583.885498046875, -1533.69775390625, -1483.510009765625, -1433.322265625, -1383.134521484375, -1332.94677734375, -1282.759033203125, -1232.5712890625, -1182.383544921875, -1132.19580078125, -1082.0079345703125, -1031.8201904296875, -981.6324462890625, -931.4447021484375, -881.2569580078125, -831.0692138671875, -780.8814697265625, -730.6937255859375, -680.5060424804688, -630.3182983398438, -580.1305541992188, -529.9428100585938, -479.75506591796875, -429.56732177734375, -379.3795471191406, -329.1918029785156, -279.0040588378906, -228.81631469726562, -178.62857055664062, -128.44081115722656, -78.25306701660156, -28.065322875976562, 22.1224365234375, 72.3101806640625, 122.4979248046875, 172.6856689453125, 222.8734130859375, 273.0611572265625, 323.2489013671875, 373.4366455078125, 423.6244201660156, 473.8121643066406, 523.9998779296875, 574.1876220703125, 624.3753662109375, 674.5631103515625, 724.7508544921875, 774.9385986328125, 825.1263427734375, 875.3140869140625, 925.5018920898438]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [5.0, 5.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 4.0, 3.0, 9.0, 7.0, 4.0, 15.0, 22.0, 19.0, 18.0, 23.0, 27.0, 25.0, 27.0, 28.0, 40.0, 25.0, 28.0, 35.0, 47.0, 46.0, 37.0, 32.0, 51.0, 47.0, 51.0, 41.0, 36.0, 41.0, 31.0, 18.0, 22.0, 20.0, 14.0, 16.0, 12.0, 11.0, 8.0, 8.0, 13.0, 3.0, 8.0, 7.0, 6.0, 4.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-412.84381103515625, -398.9066467285156, -384.969482421875, -371.0323181152344, -357.09515380859375, -343.157958984375, -329.2207946777344, -315.28363037109375, -301.3464660644531, -287.4093017578125, -273.4721374511719, -259.53497314453125, -245.59779357910156, -231.66062927246094, -217.72344970703125, -203.78628540039062, -189.84912109375, -175.91195678710938, -161.97479248046875, -148.03761291503906, -134.10044860839844, -120.16328430175781, -106.22611236572266, -92.2889404296875, -78.35177612304688, -64.41461181640625, -50.477439880371094, -36.5402717590332, -22.603103637695312, -8.665939331054688, 5.271232604980469, 19.208404541015625, 33.14556884765625, 47.08273696899414, 61.01990509033203, 74.95707702636719, 88.89424133300781, 102.83140563964844, 116.7685775756836, 130.70574951171875, 144.64291381835938, 158.580078125, 172.51724243164062, 186.4544219970703, 200.39158630371094, 214.32875061035156, 228.26593017578125, 242.20309448242188, 256.1402587890625, 270.0774230957031, 284.01458740234375, 297.9517517089844, 311.888916015625, 325.82611083984375, 339.7632751464844, 353.700439453125, 367.6376037597656, 381.57476806640625, 395.5119323730469, 409.4490966796875, 423.38629150390625, 437.32342529296875, 451.2606201171875, 465.1977844238281, 479.13494873046875]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 5.0, 4.0, 9.0, 17.0, 19.0, 33.0, 37.0, 42.0, 70.0, 99.0, 173.0, 290.0, 477.0, 959.0, 2049.0, 4643.0, 12482.0, 37525.0, 188659.0, 3575874.0, 297381.0, 47431.0, 15118.0, 5750.0, 2431.0, 1155.0, 600.0, 344.0, 211.0, 127.0, 79.0, 53.0, 40.0, 32.0, 21.0, 14.0, 11.0, 6.0, 7.0, 2.0, 5.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-173.75, -169.001953125, -164.25390625, -159.505859375, -154.7578125, -150.009765625, -145.26171875, -140.513671875, -135.765625, -131.017578125, -126.26953125, -121.521484375, -116.7734375, -112.025390625, -107.27734375, -102.529296875, -97.78125, -93.033203125, -88.28515625, -83.537109375, -78.7890625, -74.041015625, -69.29296875, -64.544921875, -59.796875, -55.048828125, -50.30078125, -45.552734375, -40.8046875, -36.056640625, -31.30859375, -26.560546875, -21.8125, -17.064453125, -12.31640625, -7.568359375, -2.8203125, 1.927734375, 6.67578125, 11.423828125, 16.171875, 20.919921875, 25.66796875, 30.416015625, 35.1640625, 39.912109375, 44.66015625, 49.408203125, 54.15625, 58.904296875, 63.65234375, 68.400390625, 73.1484375, 77.896484375, 82.64453125, 87.392578125, 92.140625, 96.888671875, 101.63671875, 106.384765625, 111.1328125, 115.880859375, 120.62890625, 125.376953125, 130.125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 6.0, 9.0, 8.0, 3.0, 8.0, 11.0, 21.0, 12.0, 22.0, 23.0, 26.0, 30.0, 40.0, 44.0, 32.0, 32.0, 34.0, 43.0, 43.0, 47.0, 54.0, 46.0, 38.0, 45.0, 41.0, 38.0, 36.0, 40.0, 26.0, 23.0, 25.0, 18.0, 9.0, 10.0, 17.0, 10.0, 5.0, 8.0, 7.0, 2.0, 3.0, 4.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.59375, -14.03515625, -13.4765625, -12.91796875, -12.359375, -11.80078125, -11.2421875, -10.68359375, -10.125, -9.56640625, -9.0078125, -8.44921875, -7.890625, -7.33203125, -6.7734375, -6.21484375, -5.65625, -5.09765625, -4.5390625, -3.98046875, -3.421875, -2.86328125, -2.3046875, -1.74609375, -1.1875, -0.62890625, -0.0703125, 0.48828125, 1.046875, 1.60546875, 2.1640625, 2.72265625, 3.28125, 3.83984375, 4.3984375, 4.95703125, 5.515625, 6.07421875, 6.6328125, 7.19140625, 7.75, 8.30859375, 8.8671875, 9.42578125, 9.984375, 10.54296875, 11.1015625, 11.66015625, 12.21875, 12.77734375, 13.3359375, 13.89453125, 14.453125, 15.01171875, 15.5703125, 16.12890625, 16.6875, 17.24609375, 17.8046875, 18.36328125, 18.921875, 19.48046875, 20.0390625, 20.59765625, 21.15625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 5.0, 5.0, 11.0, 13.0, 13.0, 35.0, 38.0, 42.0, 74.0, 103.0, 152.0, 245.0, 382.0, 676.0, 1231.0, 2406.0, 4920.0, 11309.0, 30880.0, 116416.0, 2563417.0, 1314431.0, 99545.0, 27906.0, 10343.0, 4592.0, 2177.0, 1151.0, 628.0, 400.0, 241.0, 147.0, 104.0, 79.0, 43.0, 30.0, 23.0, 15.0, 16.0, 13.0, 10.0, 7.0, 1.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-145.25, -140.841796875, -136.43359375, -132.025390625, -127.6171875, -123.208984375, -118.80078125, -114.392578125, -109.984375, -105.576171875, -101.16796875, -96.759765625, -92.3515625, -87.943359375, -83.53515625, -79.126953125, -74.71875, -70.310546875, -65.90234375, -61.494140625, -57.0859375, -52.677734375, -48.26953125, -43.861328125, -39.453125, -35.044921875, -30.63671875, -26.228515625, -21.8203125, -17.412109375, -13.00390625, -8.595703125, -4.1875, 0.220703125, 4.62890625, 9.037109375, 13.4453125, 17.853515625, 22.26171875, 26.669921875, 31.078125, 35.486328125, 39.89453125, 44.302734375, 48.7109375, 53.119140625, 57.52734375, 61.935546875, 66.34375, 70.751953125, 75.16015625, 79.568359375, 83.9765625, 88.384765625, 92.79296875, 97.201171875, 101.609375, 106.017578125, 110.42578125, 114.833984375, 119.2421875, 123.650390625, 128.05859375, 132.466796875, 136.875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 6.0, 6.0, 5.0, 7.0, 22.0, 21.0, 33.0, 29.0, 60.0, 72.0, 111.0, 254.0, 673.0, 1779.0, 463.0, 201.0, 111.0, 60.0, 47.0, 27.0, 22.0, 17.0, 8.0, 9.0, 4.0, 13.0, 4.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.4375, -73.10546875, -70.7734375, -68.44140625, -66.109375, -63.77734375, -61.4453125, -59.11328125, -56.78125, -54.44921875, -52.1171875, -49.78515625, -47.453125, -45.12109375, -42.7890625, -40.45703125, -38.125, -35.79296875, -33.4609375, -31.12890625, -28.796875, -26.46484375, -24.1328125, -21.80078125, -19.46875, -17.13671875, -14.8046875, -12.47265625, -10.140625, -7.80859375, -5.4765625, -3.14453125, -0.8125, 1.51953125, 3.8515625, 6.18359375, 8.515625, 10.84765625, 13.1796875, 15.51171875, 17.84375, 20.17578125, 22.5078125, 24.83984375, 27.171875, 29.50390625, 31.8359375, 34.16796875, 36.5, 38.83203125, 41.1640625, 43.49609375, 45.828125, 48.16015625, 50.4921875, 52.82421875, 55.15625, 57.48828125, 59.8203125, 62.15234375, 64.484375, 66.81640625, 69.1484375, 71.48046875, 73.8125]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 14.0, 24.0, 87.0, 211.0, 323.0, 217.0, 92.0, 31.0, 11.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-310.0920104980469, -273.5859680175781, -237.07989501953125, -200.5738525390625, -164.0677947998047, -127.56173706054688, -91.05569458007812, -54.54963684082031, -18.0435791015625, 18.462474822998047, 54.968528747558594, 91.47457885742188, 127.98063659667969, 164.4866943359375, 200.99273681640625, 237.49879455566406, 274.0048522949219, 310.5108947753906, 347.0169677734375, 383.52301025390625, 420.029052734375, 456.5351257324219, 493.0411682128906, 529.5472412109375, 566.0532836914062, 602.559326171875, 639.0653686523438, 675.5714111328125, 712.0775146484375, 748.5835571289062, 785.089599609375, 821.5956420898438, 858.1016845703125, 894.6077270507812, 931.11376953125, 967.619873046875, 1004.1259155273438, 1040.6319580078125, 1077.137939453125, 1113.64404296875, 1150.150146484375, 1186.65625, 1223.1622314453125, 1259.6683349609375, 1296.17431640625, 1332.680419921875, 1369.1865234375, 1405.6925048828125, 1442.198486328125, 1478.70458984375, 1515.2105712890625, 1551.7166748046875, 1588.22265625, 1624.728759765625, 1661.23486328125, 1697.7408447265625, 1734.2469482421875, 1770.7530517578125, 1807.259033203125, 1843.76513671875, 1880.2711181640625, 1916.7772216796875, 1953.283203125, 1989.789306640625, 2026.29541015625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 2.0, 4.0, 4.0, 5.0, 13.0, 11.0, 5.0, 14.0, 16.0, 14.0, 25.0, 29.0, 25.0, 25.0, 29.0, 37.0, 33.0, 30.0, 42.0, 34.0, 43.0, 45.0, 41.0, 48.0, 43.0, 43.0, 40.0, 42.0, 37.0, 35.0, 39.0, 27.0, 24.0, 12.0, 23.0, 8.0, 13.0, 13.0, 8.0, 8.0, 8.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-242.73529052734375, -235.77764892578125, -228.82000732421875, -221.86236572265625, -214.90472412109375, -207.94708251953125, -200.98944091796875, -194.0317840576172, -187.0741424560547, -180.1165008544922, -173.1588592529297, -166.2012176513672, -159.2435760498047, -152.28591918945312, -145.32827758789062, -138.37063598632812, -131.41299438476562, -124.45535278320312, -117.49771118164062, -110.54006958007812, -103.5824203491211, -96.6247787475586, -89.6671371459961, -82.70948791503906, -75.75186157226562, -68.79421997070312, -61.83657455444336, -54.87893295288086, -47.921287536621094, -40.963645935058594, -34.006004333496094, -27.048358917236328, -20.090713500976562, -13.13306999206543, -6.175427436828613, 0.7822151184082031, 7.739858627319336, 14.697502136230469, 21.65514373779297, 28.612789154052734, 35.570430755615234, 42.528072357177734, 49.4857177734375, 56.443359375, 63.4010009765625, 70.358642578125, 77.3162841796875, 84.27393341064453, 91.23157501220703, 98.18921661376953, 105.14685821533203, 112.10450744628906, 119.06214904785156, 126.01979064941406, 132.97743225097656, 139.93507385253906, 146.89271545410156, 153.85035705566406, 160.80799865722656, 167.76564025878906, 174.72328186035156, 181.68093872070312, 188.63858032226562, 195.59622192382812, 202.55386352539062]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 2.0, 8.0, 16.0, 34.0, 33.0, 56.0, 115.0, 168.0, 332.0, 527.0, 1181.0, 2269.0, 4908.0, 11370.0, 28764.0, 78338.0, 222698.0, 380982.0, 201402.0, 70438.0, 25788.0, 10145.0, 4654.0, 2068.0, 1029.0, 566.0, 292.0, 156.0, 88.0, 53.0, 25.0, 13.0, 15.0, 15.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.8125, -77.8681640625, -74.923828125, -71.9794921875, -69.03515625, -66.0908203125, -63.146484375, -60.2021484375, -57.2578125, -54.3134765625, -51.369140625, -48.4248046875, -45.48046875, -42.5361328125, -39.591796875, -36.6474609375, -33.703125, -30.7587890625, -27.814453125, -24.8701171875, -21.92578125, -18.9814453125, -16.037109375, -13.0927734375, -10.1484375, -7.2041015625, -4.259765625, -1.3154296875, 1.62890625, 4.5732421875, 7.517578125, 10.4619140625, 13.40625, 16.3505859375, 19.294921875, 22.2392578125, 25.18359375, 28.1279296875, 31.072265625, 34.0166015625, 36.9609375, 39.9052734375, 42.849609375, 45.7939453125, 48.73828125, 51.6826171875, 54.626953125, 57.5712890625, 60.515625, 63.4599609375, 66.404296875, 69.3486328125, 72.29296875, 75.2373046875, 78.181640625, 81.1259765625, 84.0703125, 87.0146484375, 89.958984375, 92.9033203125, 95.84765625, 98.7919921875, 101.736328125, 104.6806640625, 107.625]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 6.0, 11.0, 13.0, 14.0, 17.0, 17.0, 22.0, 28.0, 27.0, 36.0, 39.0, 25.0, 36.0, 47.0, 54.0, 43.0, 55.0, 41.0, 50.0, 43.0, 61.0, 50.0, 44.0, 32.0, 29.0, 22.0, 20.0, 17.0, 18.0, 17.0, 14.0, 11.0, 11.0, 16.0, 2.0, 0.0, 6.0, 4.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.828125, -21.129150390625, -20.43017578125, -19.731201171875, -19.0322265625, -18.333251953125, -17.63427734375, -16.935302734375, -16.236328125, -15.537353515625, -14.83837890625, -14.139404296875, -13.4404296875, -12.741455078125, -12.04248046875, -11.343505859375, -10.64453125, -9.945556640625, -9.24658203125, -8.547607421875, -7.8486328125, -7.149658203125, -6.45068359375, -5.751708984375, -5.052734375, -4.353759765625, -3.65478515625, -2.955810546875, -2.2568359375, -1.557861328125, -0.85888671875, -0.159912109375, 0.5390625, 1.238037109375, 1.93701171875, 2.635986328125, 3.3349609375, 4.033935546875, 4.73291015625, 5.431884765625, 6.130859375, 6.829833984375, 7.52880859375, 8.227783203125, 8.9267578125, 9.625732421875, 10.32470703125, 11.023681640625, 11.72265625, 12.421630859375, 13.12060546875, 13.819580078125, 14.5185546875, 15.217529296875, 15.91650390625, 16.615478515625, 17.314453125, 18.013427734375, 18.71240234375, 19.411376953125, 20.1103515625, 20.809326171875, 21.50830078125, 22.207275390625, 22.90625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 8.0, 14.0, 4.0, 15.0, 19.0, 14.0, 28.0, 33.0, 41.0, 57.0, 79.0, 103.0, 146.0, 201.0, 297.0, 408.0, 678.0, 1322.0, 2915.0, 9013.0, 38016.0, 213012.0, 583251.0, 156582.0, 29265.0, 7404.0, 2607.0, 1112.0, 599.0, 358.0, 243.0, 173.0, 133.0, 105.0, 88.0, 47.0, 42.0, 27.0, 28.0, 16.0, 15.0, 7.0, 12.0, 8.0, 3.0, 2.0, 6.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-168.375, -163.482421875, -158.58984375, -153.697265625, -148.8046875, -143.912109375, -139.01953125, -134.126953125, -129.234375, -124.341796875, -119.44921875, -114.556640625, -109.6640625, -104.771484375, -99.87890625, -94.986328125, -90.09375, -85.201171875, -80.30859375, -75.416015625, -70.5234375, -65.630859375, -60.73828125, -55.845703125, -50.953125, -46.060546875, -41.16796875, -36.275390625, -31.3828125, -26.490234375, -21.59765625, -16.705078125, -11.8125, -6.919921875, -2.02734375, 2.865234375, 7.7578125, 12.650390625, 17.54296875, 22.435546875, 27.328125, 32.220703125, 37.11328125, 42.005859375, 46.8984375, 51.791015625, 56.68359375, 61.576171875, 66.46875, 71.361328125, 76.25390625, 81.146484375, 86.0390625, 90.931640625, 95.82421875, 100.716796875, 105.609375, 110.501953125, 115.39453125, 120.287109375, 125.1796875, 130.072265625, 134.96484375, 139.857421875, 144.75]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 6.0, 5.0, 6.0, 3.0, 8.0, 7.0, 9.0, 7.0, 22.0, 12.0, 12.0, 26.0, 24.0, 27.0, 32.0, 29.0, 36.0, 43.0, 40.0, 56.0, 49.0, 43.0, 40.0, 69.0, 46.0, 33.0, 42.0, 52.0, 30.0, 32.0, 22.0, 23.0, 16.0, 17.0, 11.0, 17.0, 9.0, 9.0, 9.0, 7.0, 4.0, 3.0, 5.0, 2.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-114.125, -110.26953125, -106.4140625, -102.55859375, -98.703125, -94.84765625, -90.9921875, -87.13671875, -83.28125, -79.42578125, -75.5703125, -71.71484375, -67.859375, -64.00390625, -60.1484375, -56.29296875, -52.4375, -48.58203125, -44.7265625, -40.87109375, -37.015625, -33.16015625, -29.3046875, -25.44921875, -21.59375, -17.73828125, -13.8828125, -10.02734375, -6.171875, -2.31640625, 1.5390625, 5.39453125, 9.25, 13.10546875, 16.9609375, 20.81640625, 24.671875, 28.52734375, 32.3828125, 36.23828125, 40.09375, 43.94921875, 47.8046875, 51.66015625, 55.515625, 59.37109375, 63.2265625, 67.08203125, 70.9375, 74.79296875, 78.6484375, 82.50390625, 86.359375, 90.21484375, 94.0703125, 97.92578125, 101.78125, 105.63671875, 109.4921875, 113.34765625, 117.203125, 121.05859375, 124.9140625, 128.76953125, 132.625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 7.0, 13.0, 11.0, 24.0, 49.0, 96.0, 263.0, 1304.0, 14143.0, 933785.0, 94481.0, 3586.0, 516.0, 156.0, 50.0, 31.0, 16.0, 11.0, 3.0, 2.0, 2.0, 1.0, 1.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-487.5, -475.8203125, -464.140625, -452.4609375, -440.78125, -429.1015625, -417.421875, -405.7421875, -394.0625, -382.3828125, -370.703125, -359.0234375, -347.34375, -335.6640625, -323.984375, -312.3046875, -300.625, -288.9453125, -277.265625, -265.5859375, -253.90625, -242.2265625, -230.546875, -218.8671875, -207.1875, -195.5078125, -183.828125, -172.1484375, -160.46875, -148.7890625, -137.109375, -125.4296875, -113.75, -102.0703125, -90.390625, -78.7109375, -67.03125, -55.3515625, -43.671875, -31.9921875, -20.3125, -8.6328125, 3.046875, 14.7265625, 26.40625, 38.0859375, 49.765625, 61.4453125, 73.125, 84.8046875, 96.484375, 108.1640625, 119.84375, 131.5234375, 143.203125, 154.8828125, 166.5625, 178.2421875, 189.921875, 201.6015625, 213.28125, 224.9609375, 236.640625, 248.3203125, 260.0]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 8.0, 4.0, 4.0, 5.0, 9.0, 9.0, 18.0, 34.0, 56.0, 95.0, 140.0, 195.0, 155.0, 117.0, 55.0, 36.0, 19.0, 15.0, 7.0, 4.0, 3.0, 1.0, 0.0, 4.0, 4.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01995849609375, -0.019283294677734375, -0.01860809326171875, -0.017932891845703125, -0.0172576904296875, -0.016582489013671875, -0.01590728759765625, -0.015232086181640625, -0.014556884765625, -0.013881683349609375, -0.01320648193359375, -0.012531280517578125, -0.0118560791015625, -0.011180877685546875, -0.01050567626953125, -0.009830474853515625, -0.0091552734375, -0.008480072021484375, -0.00780487060546875, -0.007129669189453125, -0.0064544677734375, -0.005779266357421875, -0.00510406494140625, -0.004428863525390625, -0.003753662109375, -0.003078460693359375, -0.00240325927734375, -0.001728057861328125, -0.0010528564453125, -0.000377655029296875, 0.00029754638671875, 0.000972747802734375, 0.00164794921875, 0.002323150634765625, 0.00299835205078125, 0.003673553466796875, 0.0043487548828125, 0.005023956298828125, 0.00569915771484375, 0.006374359130859375, 0.007049560546875, 0.007724761962890625, 0.00839996337890625, 0.009075164794921875, 0.0097503662109375, 0.010425567626953125, 0.01110076904296875, 0.011775970458984375, 0.012451171875, 0.013126373291015625, 0.01380157470703125, 0.014476776123046875, 0.0151519775390625, 0.015827178955078125, 0.01650238037109375, 0.017177581787109375, 0.017852783203125, 0.018527984619140625, 0.01920318603515625, 0.019878387451171875, 0.0205535888671875, 0.021228790283203125, 0.02190399169921875, 0.022579193115234375, 0.02325439453125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 5.0, 10.0, 6.0, 7.0, 15.0, 26.0, 30.0, 63.0, 115.0, 175.0, 345.0, 764.0, 1993.0, 6656.0, 37885.0, 610214.0, 356728.0, 25316.0, 5249.0, 1650.0, 619.0, 283.0, 148.0, 90.0, 57.0, 36.0, 19.0, 9.0, 13.0, 13.0, 7.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-168.0, -163.044921875, -158.08984375, -153.134765625, -148.1796875, -143.224609375, -138.26953125, -133.314453125, -128.359375, -123.404296875, -118.44921875, -113.494140625, -108.5390625, -103.583984375, -98.62890625, -93.673828125, -88.71875, -83.763671875, -78.80859375, -73.853515625, -68.8984375, -63.943359375, -58.98828125, -54.033203125, -49.078125, -44.123046875, -39.16796875, -34.212890625, -29.2578125, -24.302734375, -19.34765625, -14.392578125, -9.4375, -4.482421875, 0.47265625, 5.427734375, 10.3828125, 15.337890625, 20.29296875, 25.248046875, 30.203125, 35.158203125, 40.11328125, 45.068359375, 50.0234375, 54.978515625, 59.93359375, 64.888671875, 69.84375, 74.798828125, 79.75390625, 84.708984375, 89.6640625, 94.619140625, 99.57421875, 104.529296875, 109.484375, 114.439453125, 119.39453125, 124.349609375, 129.3046875, 134.259765625, 139.21484375, 144.169921875, 149.125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 1.0, 4.0, 3.0, 3.0, 7.0, 5.0, 8.0, 20.0, 30.0, 25.0, 34.0, 58.0, 51.0, 70.0, 84.0, 108.0, 103.0, 92.0, 60.0, 67.0, 49.0, 32.0, 24.0, 14.0, 14.0, 10.0, 7.0, 6.0, 3.0, 6.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.5, -81.771484375, -79.04296875, -76.314453125, -73.5859375, -70.857421875, -68.12890625, -65.400390625, -62.671875, -59.943359375, -57.21484375, -54.486328125, -51.7578125, -49.029296875, -46.30078125, -43.572265625, -40.84375, -38.115234375, -35.38671875, -32.658203125, -29.9296875, -27.201171875, -24.47265625, -21.744140625, -19.015625, -16.287109375, -13.55859375, -10.830078125, -8.1015625, -5.373046875, -2.64453125, 0.083984375, 2.8125, 5.541015625, 8.26953125, 10.998046875, 13.7265625, 16.455078125, 19.18359375, 21.912109375, 24.640625, 27.369140625, 30.09765625, 32.826171875, 35.5546875, 38.283203125, 41.01171875, 43.740234375, 46.46875, 49.197265625, 51.92578125, 54.654296875, 57.3828125, 60.111328125, 62.83984375, 65.568359375, 68.296875, 71.025390625, 73.75390625, 76.482421875, 79.2109375, 81.939453125, 84.66796875, 87.396484375, 90.125]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 15.0, 12.0, 37.0, 39.0, 71.0, 98.0, 118.0, 132.0, 124.0, 117.0, 87.0, 64.0, 30.0, 25.0, 11.0, 9.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1019.497802734375, -982.3251342773438, -945.1524658203125, -907.9797973632812, -870.80712890625, -833.634521484375, -796.4618530273438, -759.2891845703125, -722.1165161132812, -684.94384765625, -647.7711791992188, -610.5985107421875, -573.4259033203125, -536.253173828125, -499.08056640625, -461.90789794921875, -424.7352294921875, -387.56256103515625, -350.389892578125, -313.2172546386719, -276.0445861816406, -238.87191772460938, -201.6992645263672, -164.526611328125, -127.35394287109375, -90.18128204345703, -53.00862121582031, -15.835960388183594, 21.336700439453125, 58.509368896484375, 95.68202209472656, 132.85467529296875, 170.02734375, 207.20001220703125, 244.37266540527344, 281.5453186035156, 318.7179870605469, 355.8906555175781, 393.06329345703125, 430.2359619140625, 467.40863037109375, 504.581298828125, 541.7539672851562, 578.9266357421875, 616.0992431640625, 653.27197265625, 690.444580078125, 727.6172485351562, 764.7899169921875, 801.9625854492188, 839.13525390625, 876.3079223632812, 913.4805908203125, 950.6531982421875, 987.8258666992188, 1024.99853515625, 1062.171142578125, 1099.34375, 1136.5164794921875, 1173.6890869140625, 1210.86181640625, 1248.034423828125, 1285.2071533203125, 1322.3797607421875, 1359.552490234375]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 7.0, 5.0, 6.0, 8.0, 14.0, 13.0, 12.0, 19.0, 19.0, 24.0, 20.0, 39.0, 25.0, 24.0, 43.0, 38.0, 51.0, 42.0, 39.0, 33.0, 51.0, 54.0, 48.0, 41.0, 39.0, 49.0, 35.0, 32.0, 24.0, 25.0, 14.0, 14.0, 21.0, 15.0, 8.0, 11.0, 4.0, 10.0, 6.0, 5.0, 7.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-634.297119140625, -613.699951171875, -593.102783203125, -572.505615234375, -551.908447265625, -531.311279296875, -510.714111328125, -490.116943359375, -469.519775390625, -448.922607421875, -428.325439453125, -407.728271484375, -387.131103515625, -366.533935546875, -345.936767578125, -325.339599609375, -304.742431640625, -284.145263671875, -263.548095703125, -242.950927734375, -222.353759765625, -201.756591796875, -181.159423828125, -160.562255859375, -139.965087890625, -119.367919921875, -98.770751953125, -78.173583984375, -57.576416015625, -36.979248046875, -16.382080078125, 4.215087890625, 24.81219482421875, 45.40936279296875, 66.00653076171875, 86.60369873046875, 107.20086669921875, 127.79803466796875, 148.39520263671875, 168.99237060546875, 189.58953857421875, 210.18670654296875, 230.78387451171875, 251.38104248046875, 271.97821044921875, 292.57537841796875, 313.17254638671875, 333.76971435546875, 354.36688232421875, 374.96405029296875, 395.56121826171875, 416.15838623046875, 436.75555419921875, 457.35272216796875, 477.94989013671875, 498.54705810546875, 519.1442260742188, 539.7413940429688, 560.3385620117188, 580.9357299804688, 601.5328979492188, 622.1300659179688, 642.7272338867188, 663.3244018554688, 683.9215698242188]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 5.0, 3.0, 12.0, 9.0, 13.0, 26.0, 32.0, 46.0, 57.0, 95.0, 132.0, 222.0, 319.0, 471.0, 924.0, 1647.0, 3517.0, 10402.0, 86408.0, 4041725.0, 34999.0, 7049.0, 2793.0, 1415.0, 720.0, 424.0, 291.0, 164.0, 116.0, 86.0, 49.0, 33.0, 20.0, 17.0, 15.0, 10.0, 4.0, 7.0, 5.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-244.875, -237.744140625, -230.61328125, -223.482421875, -216.3515625, -209.220703125, -202.08984375, -194.958984375, -187.828125, -180.697265625, -173.56640625, -166.435546875, -159.3046875, -152.173828125, -145.04296875, -137.912109375, -130.78125, -123.650390625, -116.51953125, -109.388671875, -102.2578125, -95.126953125, -87.99609375, -80.865234375, -73.734375, -66.603515625, -59.47265625, -52.341796875, -45.2109375, -38.080078125, -30.94921875, -23.818359375, -16.6875, -9.556640625, -2.42578125, 4.705078125, 11.8359375, 18.966796875, 26.09765625, 33.228515625, 40.359375, 47.490234375, 54.62109375, 61.751953125, 68.8828125, 76.013671875, 83.14453125, 90.275390625, 97.40625, 104.537109375, 111.66796875, 118.798828125, 125.9296875, 133.060546875, 140.19140625, 147.322265625, 154.453125, 161.583984375, 168.71484375, 175.845703125, 182.9765625, 190.107421875, 197.23828125, 204.369140625, 211.5]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 6.0, 5.0, 11.0, 9.0, 11.0, 6.0, 16.0, 13.0, 15.0, 20.0, 33.0, 35.0, 26.0, 39.0, 50.0, 43.0, 31.0, 44.0, 53.0, 53.0, 55.0, 49.0, 52.0, 36.0, 32.0, 46.0, 31.0, 26.0, 31.0, 23.0, 25.0, 16.0, 19.0, 6.0, 14.0, 5.0, 6.0, 4.0, 3.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-30.125, -29.255615234375, -28.38623046875, -27.516845703125, -26.6474609375, -25.778076171875, -24.90869140625, -24.039306640625, -23.169921875, -22.300537109375, -21.43115234375, -20.561767578125, -19.6923828125, -18.822998046875, -17.95361328125, -17.084228515625, -16.21484375, -15.345458984375, -14.47607421875, -13.606689453125, -12.7373046875, -11.867919921875, -10.99853515625, -10.129150390625, -9.259765625, -8.390380859375, -7.52099609375, -6.651611328125, -5.7822265625, -4.912841796875, -4.04345703125, -3.174072265625, -2.3046875, -1.435302734375, -0.56591796875, 0.303466796875, 1.1728515625, 2.042236328125, 2.91162109375, 3.781005859375, 4.650390625, 5.519775390625, 6.38916015625, 7.258544921875, 8.1279296875, 8.997314453125, 9.86669921875, 10.736083984375, 11.60546875, 12.474853515625, 13.34423828125, 14.213623046875, 15.0830078125, 15.952392578125, 16.82177734375, 17.691162109375, 18.560546875, 19.429931640625, 20.29931640625, 21.168701171875, 22.0380859375, 22.907470703125, 23.77685546875, 24.646240234375, 25.515625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 4.0, 4.0, 6.0, 11.0, 6.0, 9.0, 22.0, 42.0, 59.0, 74.0, 135.0, 217.0, 330.0, 592.0, 1066.0, 2138.0, 5032.0, 15138.0, 216759.0, 3918147.0, 22389.0, 6399.0, 2756.0, 1205.0, 706.0, 378.0, 246.0, 130.0, 93.0, 72.0, 48.0, 24.0, 20.0, 9.0, 5.0, 5.0, 3.0, 4.0, 6.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-251.75, -243.9140625, -236.078125, -228.2421875, -220.40625, -212.5703125, -204.734375, -196.8984375, -189.0625, -181.2265625, -173.390625, -165.5546875, -157.71875, -149.8828125, -142.046875, -134.2109375, -126.375, -118.5390625, -110.703125, -102.8671875, -95.03125, -87.1953125, -79.359375, -71.5234375, -63.6875, -55.8515625, -48.015625, -40.1796875, -32.34375, -24.5078125, -16.671875, -8.8359375, -1.0, 6.8359375, 14.671875, 22.5078125, 30.34375, 38.1796875, 46.015625, 53.8515625, 61.6875, 69.5234375, 77.359375, 85.1953125, 93.03125, 100.8671875, 108.703125, 116.5390625, 124.375, 132.2109375, 140.046875, 147.8828125, 155.71875, 163.5546875, 171.390625, 179.2265625, 187.0625, 194.8984375, 202.734375, 210.5703125, 218.40625, 226.2421875, 234.078125, 241.9140625, 249.75]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 1.0, 4.0, 6.0, 3.0, 2.0, 4.0, 11.0, 23.0, 39.0, 144.0, 3327.0, 363.0, 68.0, 27.0, 13.0, 11.0, 8.0, 4.0, 2.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-46.25, -44.8369140625, -43.423828125, -42.0107421875, -40.59765625, -39.1845703125, -37.771484375, -36.3583984375, -34.9453125, -33.5322265625, -32.119140625, -30.7060546875, -29.29296875, -27.8798828125, -26.466796875, -25.0537109375, -23.640625, -22.2275390625, -20.814453125, -19.4013671875, -17.98828125, -16.5751953125, -15.162109375, -13.7490234375, -12.3359375, -10.9228515625, -9.509765625, -8.0966796875, -6.68359375, -5.2705078125, -3.857421875, -2.4443359375, -1.03125, 0.3818359375, 1.794921875, 3.2080078125, 4.62109375, 6.0341796875, 7.447265625, 8.8603515625, 10.2734375, 11.6865234375, 13.099609375, 14.5126953125, 15.92578125, 17.3388671875, 18.751953125, 20.1650390625, 21.578125, 22.9912109375, 24.404296875, 25.8173828125, 27.23046875, 28.6435546875, 30.056640625, 31.4697265625, 32.8828125, 34.2958984375, 35.708984375, 37.1220703125, 38.53515625, 39.9482421875, 41.361328125, 42.7744140625, 44.1875]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 6.0, 7.0, 12.0, 31.0, 52.0, 79.0, 121.0, 154.0, 175.0, 125.0, 80.0, 68.0, 43.0, 23.0, 12.0, 10.0, 6.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-230.63693237304688, -224.88626098632812, -219.13560485839844, -213.3849334716797, -207.63427734375, -201.88360595703125, -196.1329345703125, -190.38226318359375, -184.63160705566406, -178.8809356689453, -173.13027954101562, -167.37960815429688, -161.62893676757812, -155.87828063964844, -150.1276092529297, -144.376953125, -138.62628173828125, -132.8756103515625, -127.12495422363281, -121.37428283691406, -115.62361907958984, -109.87295532226562, -104.12228393554688, -98.37162017822266, -92.62095642089844, -86.87029266357422, -81.11962890625, -75.36895751953125, -69.61829376220703, -63.86763000488281, -58.11696243286133, -52.366294860839844, -46.61564636230469, -40.86498260498047, -35.114315032958984, -29.363649368286133, -23.61298370361328, -17.86231803894043, -12.111652374267578, -6.360984802246094, -0.610321044921875, 5.140344619750977, 10.891010284423828, 16.64167594909668, 22.39234161376953, 28.143007278442383, 33.893672943115234, 39.64434051513672, 45.39500427246094, 51.145668029785156, 56.89633560180664, 62.647003173828125, 68.39766693115234, 74.14833068847656, 79.89900207519531, 85.64966583251953, 91.40032958984375, 97.15099334716797, 102.90165710449219, 108.65232849121094, 114.40299224853516, 120.15365600585938, 125.90432739257812, 131.65499877929688, 137.40565490722656]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 1.0, 6.0, 3.0, 3.0, 5.0, 7.0, 7.0, 14.0, 10.0, 14.0, 12.0, 22.0, 19.0, 19.0, 38.0, 34.0, 31.0, 43.0, 42.0, 32.0, 54.0, 48.0, 32.0, 48.0, 32.0, 43.0, 35.0, 34.0, 42.0, 30.0, 29.0, 30.0, 30.0, 28.0, 29.0, 20.0, 14.0, 16.0, 9.0, 15.0, 7.0, 6.0, 9.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-71.81053161621094, -69.47563171386719, -67.14073181152344, -64.80583953857422, -62.47093963623047, -60.13603973388672, -57.801143646240234, -55.46624755859375, -53.13134765625, -50.79644775390625, -48.461551666259766, -46.12665557861328, -43.79175567626953, -41.45685577392578, -39.1219596862793, -36.78706359863281, -34.45216369628906, -32.11726379394531, -29.782367706298828, -27.44746971130371, -25.112571716308594, -22.777673721313477, -20.44277572631836, -18.107877731323242, -15.772979736328125, -13.438081741333008, -11.10318374633789, -8.768285751342773, -6.433387756347656, -4.098489761352539, -1.7635917663574219, 0.5713062286376953, 2.9062042236328125, 5.24110221862793, 7.576000213623047, 9.910898208618164, 12.245796203613281, 14.580694198608398, 16.915592193603516, 19.250490188598633, 21.58538818359375, 23.920286178588867, 26.255184173583984, 28.5900821685791, 30.92498016357422, 33.25988006591797, 35.59477615356445, 37.92967224121094, 40.26457214355469, 42.59947204589844, 44.93436813354492, 47.269264221191406, 49.604164123535156, 51.939064025878906, 54.27396011352539, 56.608856201171875, 58.943756103515625, 61.278656005859375, 63.61355209350586, 65.94844818115234, 68.2833480834961, 70.61824798583984, 72.95314025878906, 75.28804016113281, 77.62294006347656]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 3.0, 6.0, 19.0, 16.0, 25.0, 38.0, 55.0, 60.0, 123.0, 168.0, 289.0, 460.0, 774.0, 1304.0, 2508.0, 4547.0, 9224.0, 18680.0, 40184.0, 86597.0, 188086.0, 299693.0, 209430.0, 98716.0, 45017.0, 20838.0, 10212.0, 5202.0, 2588.0, 1469.0, 852.0, 499.0, 294.0, 201.0, 125.0, 79.0, 42.0, 35.0, 25.0, 21.0, 22.0, 7.0, 4.0, 4.0, 3.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-74.6875, -72.322265625, -69.95703125, -67.591796875, -65.2265625, -62.861328125, -60.49609375, -58.130859375, -55.765625, -53.400390625, -51.03515625, -48.669921875, -46.3046875, -43.939453125, -41.57421875, -39.208984375, -36.84375, -34.478515625, -32.11328125, -29.748046875, -27.3828125, -25.017578125, -22.65234375, -20.287109375, -17.921875, -15.556640625, -13.19140625, -10.826171875, -8.4609375, -6.095703125, -3.73046875, -1.365234375, 1.0, 3.365234375, 5.73046875, 8.095703125, 10.4609375, 12.826171875, 15.19140625, 17.556640625, 19.921875, 22.287109375, 24.65234375, 27.017578125, 29.3828125, 31.748046875, 34.11328125, 36.478515625, 38.84375, 41.208984375, 43.57421875, 45.939453125, 48.3046875, 50.669921875, 53.03515625, 55.400390625, 57.765625, 60.130859375, 62.49609375, 64.861328125, 67.2265625, 69.591796875, 71.95703125, 74.322265625, 76.6875]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 4.0, 5.0, 9.0, 6.0, 11.0, 17.0, 11.0, 23.0, 16.0, 30.0, 25.0, 32.0, 27.0, 34.0, 33.0, 45.0, 44.0, 49.0, 51.0, 44.0, 59.0, 44.0, 42.0, 34.0, 32.0, 43.0, 39.0, 30.0, 29.0, 26.0, 27.0, 16.0, 17.0, 15.0, 5.0, 5.0, 5.0, 3.0, 7.0, 7.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.640625, -29.7001953125, -28.759765625, -27.8193359375, -26.87890625, -25.9384765625, -24.998046875, -24.0576171875, -23.1171875, -22.1767578125, -21.236328125, -20.2958984375, -19.35546875, -18.4150390625, -17.474609375, -16.5341796875, -15.59375, -14.6533203125, -13.712890625, -12.7724609375, -11.83203125, -10.8916015625, -9.951171875, -9.0107421875, -8.0703125, -7.1298828125, -6.189453125, -5.2490234375, -4.30859375, -3.3681640625, -2.427734375, -1.4873046875, -0.546875, 0.3935546875, 1.333984375, 2.2744140625, 3.21484375, 4.1552734375, 5.095703125, 6.0361328125, 6.9765625, 7.9169921875, 8.857421875, 9.7978515625, 10.73828125, 11.6787109375, 12.619140625, 13.5595703125, 14.5, 15.4404296875, 16.380859375, 17.3212890625, 18.26171875, 19.2021484375, 20.142578125, 21.0830078125, 22.0234375, 22.9638671875, 23.904296875, 24.8447265625, 25.78515625, 26.7255859375, 27.666015625, 28.6064453125, 29.546875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 1.0, 5.0, 5.0, 4.0, 8.0, 15.0, 22.0, 21.0, 35.0, 42.0, 60.0, 84.0, 112.0, 145.0, 180.0, 304.0, 434.0, 600.0, 1133.0, 2515.0, 7574.0, 34773.0, 227292.0, 625027.0, 118147.0, 20317.0, 5005.0, 1854.0, 932.0, 566.0, 355.0, 280.0, 200.0, 135.0, 114.0, 73.0, 47.0, 41.0, 24.0, 28.0, 10.0, 17.0, 9.0, 5.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-174.0, -168.447265625, -162.89453125, -157.341796875, -151.7890625, -146.236328125, -140.68359375, -135.130859375, -129.578125, -124.025390625, -118.47265625, -112.919921875, -107.3671875, -101.814453125, -96.26171875, -90.708984375, -85.15625, -79.603515625, -74.05078125, -68.498046875, -62.9453125, -57.392578125, -51.83984375, -46.287109375, -40.734375, -35.181640625, -29.62890625, -24.076171875, -18.5234375, -12.970703125, -7.41796875, -1.865234375, 3.6875, 9.240234375, 14.79296875, 20.345703125, 25.8984375, 31.451171875, 37.00390625, 42.556640625, 48.109375, 53.662109375, 59.21484375, 64.767578125, 70.3203125, 75.873046875, 81.42578125, 86.978515625, 92.53125, 98.083984375, 103.63671875, 109.189453125, 114.7421875, 120.294921875, 125.84765625, 131.400390625, 136.953125, 142.505859375, 148.05859375, 153.611328125, 159.1640625, 164.716796875, 170.26953125, 175.822265625, 181.375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 7.0, 3.0, 3.0, 9.0, 5.0, 7.0, 14.0, 7.0, 17.0, 24.0, 21.0, 24.0, 33.0, 42.0, 42.0, 33.0, 37.0, 56.0, 46.0, 61.0, 47.0, 38.0, 49.0, 49.0, 45.0, 49.0, 52.0, 33.0, 27.0, 26.0, 21.0, 18.0, 14.0, 9.0, 10.0, 17.0, 3.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-186.625, -181.01953125, -175.4140625, -169.80859375, -164.203125, -158.59765625, -152.9921875, -147.38671875, -141.78125, -136.17578125, -130.5703125, -124.96484375, -119.359375, -113.75390625, -108.1484375, -102.54296875, -96.9375, -91.33203125, -85.7265625, -80.12109375, -74.515625, -68.91015625, -63.3046875, -57.69921875, -52.09375, -46.48828125, -40.8828125, -35.27734375, -29.671875, -24.06640625, -18.4609375, -12.85546875, -7.25, -1.64453125, 3.9609375, 9.56640625, 15.171875, 20.77734375, 26.3828125, 31.98828125, 37.59375, 43.19921875, 48.8046875, 54.41015625, 60.015625, 65.62109375, 71.2265625, 76.83203125, 82.4375, 88.04296875, 93.6484375, 99.25390625, 104.859375, 110.46484375, 116.0703125, 121.67578125, 127.28125, 132.88671875, 138.4921875, 144.09765625, 149.703125, 155.30859375, 160.9140625, 166.51953125, 172.125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 2.0, 2.0, 3.0, 4.0, 3.0, 10.0, 7.0, 15.0, 26.0, 41.0, 68.0, 104.0, 200.0, 364.0, 915.0, 2541.0, 8532.0, 39662.0, 290506.0, 596355.0, 86648.0, 15897.0, 4088.0, 1350.0, 559.0, 269.0, 132.0, 93.0, 56.0, 40.0, 19.0, 15.0, 11.0, 6.0, 6.0, 4.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-86.9375, -84.396484375, -81.85546875, -79.314453125, -76.7734375, -74.232421875, -71.69140625, -69.150390625, -66.609375, -64.068359375, -61.52734375, -58.986328125, -56.4453125, -53.904296875, -51.36328125, -48.822265625, -46.28125, -43.740234375, -41.19921875, -38.658203125, -36.1171875, -33.576171875, -31.03515625, -28.494140625, -25.953125, -23.412109375, -20.87109375, -18.330078125, -15.7890625, -13.248046875, -10.70703125, -8.166015625, -5.625, -3.083984375, -0.54296875, 1.998046875, 4.5390625, 7.080078125, 9.62109375, 12.162109375, 14.703125, 17.244140625, 19.78515625, 22.326171875, 24.8671875, 27.408203125, 29.94921875, 32.490234375, 35.03125, 37.572265625, 40.11328125, 42.654296875, 45.1953125, 47.736328125, 50.27734375, 52.818359375, 55.359375, 57.900390625, 60.44140625, 62.982421875, 65.5234375, 68.064453125, 70.60546875, 73.146484375, 75.6875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 5.0, 7.0, 8.0, 12.0, 9.0, 19.0, 31.0, 35.0, 63.0, 102.0, 155.0, 157.0, 135.0, 93.0, 55.0, 31.0, 20.0, 21.0, 15.0, 7.0, 7.0, 3.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.019500732421875, -0.01901829242706299, -0.018535852432250977, -0.018053412437438965, -0.017570972442626953, -0.01708853244781494, -0.01660609245300293, -0.016123652458190918, -0.015641212463378906, -0.015158772468566895, -0.014676332473754883, -0.014193892478942871, -0.01371145248413086, -0.013229012489318848, -0.012746572494506836, -0.012264132499694824, -0.011781692504882812, -0.0112992525100708, -0.010816812515258789, -0.010334372520446777, -0.009851932525634766, -0.009369492530822754, -0.008887052536010742, -0.00840461254119873, -0.007922172546386719, -0.007439732551574707, -0.006957292556762695, -0.006474852561950684, -0.005992412567138672, -0.00550997257232666, -0.0050275325775146484, -0.004545092582702637, -0.004062652587890625, -0.0035802125930786133, -0.0030977725982666016, -0.00261533260345459, -0.002132892608642578, -0.0016504526138305664, -0.0011680126190185547, -0.000685572624206543, -0.00020313262939453125, 0.00027930736541748047, 0.0007617473602294922, 0.001244187355041504, 0.0017266273498535156, 0.0022090673446655273, 0.002691507339477539, 0.0031739473342895508, 0.0036563873291015625, 0.004138827323913574, 0.004621267318725586, 0.005103707313537598, 0.005586147308349609, 0.006068587303161621, 0.006551027297973633, 0.0070334672927856445, 0.007515907287597656, 0.007998347282409668, 0.00848078727722168, 0.008963227272033691, 0.009445667266845703, 0.009928107261657715, 0.010410547256469727, 0.010892987251281738, 0.01137542724609375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 6.0, 5.0, 5.0, 10.0, 14.0, 18.0, 34.0, 63.0, 102.0, 182.0, 346.0, 775.0, 2101.0, 7936.0, 66185.0, 739724.0, 209037.0, 16555.0, 3358.0, 1077.0, 473.0, 237.0, 138.0, 61.0, 44.0, 28.0, 19.0, 12.0, 6.0, 6.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-132.25, -128.9189453125, -125.587890625, -122.2568359375, -118.92578125, -115.5947265625, -112.263671875, -108.9326171875, -105.6015625, -102.2705078125, -98.939453125, -95.6083984375, -92.27734375, -88.9462890625, -85.615234375, -82.2841796875, -78.953125, -75.6220703125, -72.291015625, -68.9599609375, -65.62890625, -62.2978515625, -58.966796875, -55.6357421875, -52.3046875, -48.9736328125, -45.642578125, -42.3115234375, -38.98046875, -35.6494140625, -32.318359375, -28.9873046875, -25.65625, -22.3251953125, -18.994140625, -15.6630859375, -12.33203125, -9.0009765625, -5.669921875, -2.3388671875, 0.9921875, 4.3232421875, 7.654296875, 10.9853515625, 14.31640625, 17.6474609375, 20.978515625, 24.3095703125, 27.640625, 30.9716796875, 34.302734375, 37.6337890625, 40.96484375, 44.2958984375, 47.626953125, 50.9580078125, 54.2890625, 57.6201171875, 60.951171875, 64.2822265625, 67.61328125, 70.9443359375, 74.275390625, 77.6064453125, 80.9375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 2.0, 8.0, 2.0, 8.0, 14.0, 19.0, 15.0, 42.0, 39.0, 54.0, 73.0, 101.0, 89.0, 97.0, 79.0, 71.0, 78.0, 57.0, 46.0, 35.0, 23.0, 25.0, 10.0, 5.0, 11.0, 1.0, 3.0, 4.0, 0.0, 2.0, 1.0], "bins": [-105.4375, -103.169921875, -100.90234375, -98.634765625, -96.3671875, -94.099609375, -91.83203125, -89.564453125, -87.296875, -85.029296875, -82.76171875, -80.494140625, -78.2265625, -75.958984375, -73.69140625, -71.423828125, -69.15625, -66.888671875, -64.62109375, -62.353515625, -60.0859375, -57.818359375, -55.55078125, -53.283203125, -51.015625, -48.748046875, -46.48046875, -44.212890625, -41.9453125, -39.677734375, -37.41015625, -35.142578125, -32.875, -30.607421875, -28.33984375, -26.072265625, -23.8046875, -21.537109375, -19.26953125, -17.001953125, -14.734375, -12.466796875, -10.19921875, -7.931640625, -5.6640625, -3.396484375, -1.12890625, 1.138671875, 3.40625, 5.673828125, 7.94140625, 10.208984375, 12.4765625, 14.744140625, 17.01171875, 19.279296875, 21.546875, 23.814453125, 26.08203125, 28.349609375, 30.6171875, 32.884765625, 35.15234375, 37.419921875, 39.6875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 19.0, 61.0, 125.0, 191.0, 266.0, 177.0, 81.0, 52.0, 15.0, 8.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-758.7891235351562, -697.4159545898438, -636.0427856445312, -574.6695556640625, -513.29638671875, -451.9232177734375, -390.550048828125, -329.1768493652344, -267.8036804199219, -206.4304962158203, -145.05731201171875, -83.68414306640625, -22.310958862304688, 39.062225341796875, 100.43539428710938, 161.80859375, 223.1817626953125, 284.554931640625, 345.9281311035156, 407.3013000488281, 468.67449951171875, 530.0476684570312, 591.4208374023438, 652.7940673828125, 714.167236328125, 775.5404052734375, 836.91357421875, 898.2867431640625, 959.6599731445312, 1021.0331420898438, 1082.40625, 1143.779541015625, 1205.1527099609375, 1266.52587890625, 1327.8990478515625, 1389.272216796875, 1450.6453857421875, 1512.0185546875, 1573.391845703125, 1634.7650146484375, 1696.13818359375, 1757.5113525390625, 1818.884521484375, 1880.2576904296875, 1941.630859375, 2003.004150390625, 2064.377197265625, 2125.75048828125, 2187.12353515625, 2248.496826171875, 2309.869873046875, 2371.2431640625, 2432.6162109375, 2493.989501953125, 2555.362548828125, 2616.73583984375, 2678.109130859375, 2739.482421875, 2800.85546875, 2862.228759765625, 2923.601806640625, 2984.97509765625, 3046.34814453125, 3107.721435546875, 3169.094482421875]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 4.0, 4.0, 6.0, 2.0, 13.0, 12.0, 4.0, 13.0, 11.0, 19.0, 16.0, 21.0, 18.0, 18.0, 18.0, 30.0, 37.0, 37.0, 61.0, 55.0, 45.0, 43.0, 57.0, 41.0, 38.0, 51.0, 41.0, 32.0, 27.0, 22.0, 32.0, 32.0, 24.0, 19.0, 15.0, 9.0, 15.0, 11.0, 9.0, 9.0, 3.0, 5.0, 9.0, 2.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-660.2056884765625, -637.6907348632812, -615.1758422851562, -592.660888671875, -570.14599609375, -547.6310424804688, -525.1160888671875, -502.6011962890625, -480.0862731933594, -457.57135009765625, -435.0564270019531, -412.54150390625, -390.02655029296875, -367.51165771484375, -344.9967041015625, -322.4817810058594, -299.96685791015625, -277.4519348144531, -254.93701171875, -232.4220733642578, -209.9071502685547, -187.39222717285156, -164.87728881835938, -142.36236572265625, -119.84744262695312, -97.33251953125, -74.81758880615234, -52.30265808105469, -29.787734985351562, -7.2728118896484375, 15.24212646484375, 37.757049560546875, 60.27191162109375, 82.78683471679688, 105.30176544189453, 127.81669616699219, 150.3316192626953, 172.84654235839844, 195.36148071289062, 217.87640380859375, 240.39132690429688, 262.90625, 285.4211730957031, 307.93609619140625, 330.4510498046875, 352.9659423828125, 375.48089599609375, 397.9958190917969, 420.5107421875, 443.0256652832031, 465.54058837890625, 488.0555419921875, 510.5704345703125, 533.0853881835938, 555.600341796875, 578.115234375, 600.630126953125, 623.1450805664062, 645.6599731445312, 668.1749267578125, 690.6898193359375, 713.2047729492188, 735.7197265625, 758.234619140625, 780.7495727539062]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 7.0, 5.0, 7.0, 8.0, 11.0, 11.0, 22.0, 33.0, 50.0, 69.0, 99.0, 164.0, 230.0, 432.0, 814.0, 1783.0, 4160.0, 13403.0, 112088.0, 4006913.0, 39729.0, 8228.0, 3038.0, 1299.0, 667.0, 352.0, 215.0, 146.0, 86.0, 57.0, 43.0, 30.0, 27.0, 18.0, 9.0, 12.0, 6.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-224.875, -218.5078125, -212.140625, -205.7734375, -199.40625, -193.0390625, -186.671875, -180.3046875, -173.9375, -167.5703125, -161.203125, -154.8359375, -148.46875, -142.1015625, -135.734375, -129.3671875, -123.0, -116.6328125, -110.265625, -103.8984375, -97.53125, -91.1640625, -84.796875, -78.4296875, -72.0625, -65.6953125, -59.328125, -52.9609375, -46.59375, -40.2265625, -33.859375, -27.4921875, -21.125, -14.7578125, -8.390625, -2.0234375, 4.34375, 10.7109375, 17.078125, 23.4453125, 29.8125, 36.1796875, 42.546875, 48.9140625, 55.28125, 61.6484375, 68.015625, 74.3828125, 80.75, 87.1171875, 93.484375, 99.8515625, 106.21875, 112.5859375, 118.953125, 125.3203125, 131.6875, 138.0546875, 144.421875, 150.7890625, 157.15625, 163.5234375, 169.890625, 176.2578125, 182.625]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 5.0, 4.0, 8.0, 8.0, 4.0, 17.0, 20.0, 23.0, 24.0, 31.0, 38.0, 40.0, 37.0, 52.0, 45.0, 58.0, 50.0, 55.0, 56.0, 52.0, 44.0, 51.0, 45.0, 43.0, 36.0, 37.0, 26.0, 17.0, 19.0, 12.0, 12.0, 7.0, 3.0, 6.0, 5.0, 3.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.0, -29.87109375, -28.7421875, -27.61328125, -26.484375, -25.35546875, -24.2265625, -23.09765625, -21.96875, -20.83984375, -19.7109375, -18.58203125, -17.453125, -16.32421875, -15.1953125, -14.06640625, -12.9375, -11.80859375, -10.6796875, -9.55078125, -8.421875, -7.29296875, -6.1640625, -5.03515625, -3.90625, -2.77734375, -1.6484375, -0.51953125, 0.609375, 1.73828125, 2.8671875, 3.99609375, 5.125, 6.25390625, 7.3828125, 8.51171875, 9.640625, 10.76953125, 11.8984375, 13.02734375, 14.15625, 15.28515625, 16.4140625, 17.54296875, 18.671875, 19.80078125, 20.9296875, 22.05859375, 23.1875, 24.31640625, 25.4453125, 26.57421875, 27.703125, 28.83203125, 29.9609375, 31.08984375, 32.21875, 33.34765625, 34.4765625, 35.60546875, 36.734375, 37.86328125, 38.9921875, 40.12109375, 41.25]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 4.0, 8.0, 6.0, 9.0, 17.0, 19.0, 26.0, 30.0, 33.0, 45.0, 70.0, 76.0, 132.0, 172.0, 243.0, 373.0, 578.0, 939.0, 1680.0, 3101.0, 6685.0, 17880.0, 96079.0, 3937074.0, 96951.0, 17936.0, 6598.0, 2984.0, 1637.0, 993.0, 602.0, 359.0, 259.0, 162.0, 126.0, 93.0, 72.0, 58.0, 36.0, 28.0, 32.0, 21.0, 9.0, 13.0, 8.0, 13.0, 6.0, 2.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0], "bins": [-153.5, -148.91796875, -144.3359375, -139.75390625, -135.171875, -130.58984375, -126.0078125, -121.42578125, -116.84375, -112.26171875, -107.6796875, -103.09765625, -98.515625, -93.93359375, -89.3515625, -84.76953125, -80.1875, -75.60546875, -71.0234375, -66.44140625, -61.859375, -57.27734375, -52.6953125, -48.11328125, -43.53125, -38.94921875, -34.3671875, -29.78515625, -25.203125, -20.62109375, -16.0390625, -11.45703125, -6.875, -2.29296875, 2.2890625, 6.87109375, 11.453125, 16.03515625, 20.6171875, 25.19921875, 29.78125, 34.36328125, 38.9453125, 43.52734375, 48.109375, 52.69140625, 57.2734375, 61.85546875, 66.4375, 71.01953125, 75.6015625, 80.18359375, 84.765625, 89.34765625, 93.9296875, 98.51171875, 103.09375, 107.67578125, 112.2578125, 116.83984375, 121.421875, 126.00390625, 130.5859375, 135.16796875, 139.75]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 1.0, 3.0, 5.0, 6.0, 6.0, 7.0, 22.0, 32.0, 64.0, 186.0, 3198.0, 387.0, 63.0, 30.0, 20.0, 21.0, 10.0, 4.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-49.625, -48.10693359375, -46.5888671875, -45.07080078125, -43.552734375, -42.03466796875, -40.5166015625, -38.99853515625, -37.48046875, -35.96240234375, -34.4443359375, -32.92626953125, -31.408203125, -29.89013671875, -28.3720703125, -26.85400390625, -25.3359375, -23.81787109375, -22.2998046875, -20.78173828125, -19.263671875, -17.74560546875, -16.2275390625, -14.70947265625, -13.19140625, -11.67333984375, -10.1552734375, -8.63720703125, -7.119140625, -5.60107421875, -4.0830078125, -2.56494140625, -1.046875, 0.47119140625, 1.9892578125, 3.50732421875, 5.025390625, 6.54345703125, 8.0615234375, 9.57958984375, 11.09765625, 12.61572265625, 14.1337890625, 15.65185546875, 17.169921875, 18.68798828125, 20.2060546875, 21.72412109375, 23.2421875, 24.76025390625, 26.2783203125, 27.79638671875, 29.314453125, 30.83251953125, 32.3505859375, 33.86865234375, 35.38671875, 36.90478515625, 38.4228515625, 39.94091796875, 41.458984375, 42.97705078125, 44.4951171875, 46.01318359375, 47.53125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 6.0, 4.0, 1.0, 3.0, 5.0, 7.0, 15.0, 5.0, 10.0, 15.0, 19.0, 28.0, 33.0, 40.0, 57.0, 81.0, 72.0, 87.0, 87.0, 83.0, 75.0, 62.0, 53.0, 38.0, 28.0, 20.0, 21.0, 13.0, 7.0, 13.0, 6.0, 5.0, 3.0, 5.0, 0.0, 1.0, 0.0, 2.0], "bins": [-150.412109375, -147.04037475585938, -143.66864013671875, -140.2969207763672, -136.92518615722656, -133.55345153808594, -130.1817169189453, -126.80998992919922, -123.43826293945312, -120.0665283203125, -116.6948013305664, -113.32306671142578, -109.95133972167969, -106.57960510253906, -103.20787048339844, -99.83614349365234, -96.46440887451172, -93.0926742553711, -89.720947265625, -86.34921264648438, -82.97748565673828, -79.60575103759766, -76.23402404785156, -72.86228942871094, -69.49055480957031, -66.11882019042969, -62.747093200683594, -59.37535858154297, -56.003631591796875, -52.63189697265625, -49.26016616821289, -45.88843536376953, -42.51671600341797, -39.14498519897461, -35.77325439453125, -32.401519775390625, -29.0297908782959, -25.65806007385254, -22.286327362060547, -18.914596557617188, -15.542865753173828, -12.171134948730469, -8.799403190612793, -5.427671432495117, -2.055940628051758, 1.3157901763916016, 4.687522888183594, 8.059253692626953, 11.430984497070312, 14.802715301513672, 18.17444610595703, 21.546178817749023, 24.917909622192383, 28.289640426635742, 31.661373138427734, 35.033103942871094, 38.40483474731445, 41.77656555175781, 45.14829635620117, 48.52002716064453, 51.891761779785156, 55.26348876953125, 58.635223388671875, 62.006954193115234, 65.3786849975586]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 1.0, 6.0, 4.0, 7.0, 6.0, 12.0, 10.0, 7.0, 18.0, 22.0, 11.0, 22.0, 32.0, 29.0, 29.0, 32.0, 40.0, 29.0, 36.0, 57.0, 42.0, 47.0, 44.0, 34.0, 31.0, 45.0, 40.0, 39.0, 31.0, 32.0, 31.0, 19.0, 19.0, 16.0, 20.0, 20.0, 9.0, 14.0, 7.0, 12.0, 5.0, 5.0, 7.0, 4.0, 5.0, 4.0, 3.0, 1.0, 2.0, 3.0, 3.0], "bins": [-85.30018615722656, -82.8665542602539, -80.43292999267578, -77.99929809570312, -75.565673828125, -73.13204193115234, -70.69841003417969, -68.26478576660156, -65.8311538696289, -63.397525787353516, -60.963897705078125, -58.53026580810547, -56.09663772583008, -53.66300964355469, -51.22937774658203, -48.79574966430664, -46.36212158203125, -43.92849349975586, -41.49486541748047, -39.06123352050781, -36.62760543823242, -34.19397735595703, -31.760347366333008, -29.326717376708984, -26.893089294433594, -24.459461212158203, -22.02583122253418, -19.592201232910156, -17.158573150634766, -14.724944114685059, -12.291315078735352, -9.857685089111328, -7.424049377441406, -4.990420341491699, -2.556791305541992, -0.12316226959228516, 2.310466766357422, 4.744095802307129, 7.177724838256836, 9.61135482788086, 12.04498291015625, 14.478611946105957, 16.912240982055664, 19.345870971679688, 21.779499053955078, 24.21312713623047, 26.646757125854492, 29.080387115478516, 31.514015197753906, 33.9476432800293, 36.38127136230469, 38.814903259277344, 41.248531341552734, 43.682159423828125, 46.11579132080078, 48.54941940307617, 50.98304748535156, 53.41667556762695, 55.850303649902344, 58.283935546875, 60.71756362915039, 63.15119171142578, 65.58482360839844, 68.01844787597656, 70.45207977294922]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 4.0, 5.0, 5.0, 13.0, 12.0, 16.0, 33.0, 43.0, 54.0, 94.0, 148.0, 214.0, 355.0, 566.0, 937.0, 1589.0, 2875.0, 5260.0, 9924.0, 19480.0, 40385.0, 84886.0, 173947.0, 271922.0, 217523.0, 111938.0, 52891.0, 25358.0, 12823.0, 6662.0, 3623.0, 2026.0, 1171.0, 652.0, 415.0, 264.0, 154.0, 106.0, 54.0, 47.0, 24.0, 20.0, 18.0, 6.0, 7.0, 4.0, 5.0, 4.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-60.3125, -58.46728515625, -56.6220703125, -54.77685546875, -52.931640625, -51.08642578125, -49.2412109375, -47.39599609375, -45.55078125, -43.70556640625, -41.8603515625, -40.01513671875, -38.169921875, -36.32470703125, -34.4794921875, -32.63427734375, -30.7890625, -28.94384765625, -27.0986328125, -25.25341796875, -23.408203125, -21.56298828125, -19.7177734375, -17.87255859375, -16.02734375, -14.18212890625, -12.3369140625, -10.49169921875, -8.646484375, -6.80126953125, -4.9560546875, -3.11083984375, -1.265625, 0.57958984375, 2.4248046875, 4.27001953125, 6.115234375, 7.96044921875, 9.8056640625, 11.65087890625, 13.49609375, 15.34130859375, 17.1865234375, 19.03173828125, 20.876953125, 22.72216796875, 24.5673828125, 26.41259765625, 28.2578125, 30.10302734375, 31.9482421875, 33.79345703125, 35.638671875, 37.48388671875, 39.3291015625, 41.17431640625, 43.01953125, 44.86474609375, 46.7099609375, 48.55517578125, 50.400390625, 52.24560546875, 54.0908203125, 55.93603515625, 57.78125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 5.0, 5.0, 2.0, 5.0, 11.0, 5.0, 9.0, 13.0, 11.0, 22.0, 21.0, 43.0, 32.0, 34.0, 39.0, 36.0, 55.0, 47.0, 50.0, 55.0, 59.0, 55.0, 58.0, 56.0, 41.0, 47.0, 31.0, 28.0, 32.0, 22.0, 16.0, 16.0, 13.0, 10.0, 5.0, 4.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.125, -31.93408203125, -30.7431640625, -29.55224609375, -28.361328125, -27.17041015625, -25.9794921875, -24.78857421875, -23.59765625, -22.40673828125, -21.2158203125, -20.02490234375, -18.833984375, -17.64306640625, -16.4521484375, -15.26123046875, -14.0703125, -12.87939453125, -11.6884765625, -10.49755859375, -9.306640625, -8.11572265625, -6.9248046875, -5.73388671875, -4.54296875, -3.35205078125, -2.1611328125, -0.97021484375, 0.220703125, 1.41162109375, 2.6025390625, 3.79345703125, 4.984375, 6.17529296875, 7.3662109375, 8.55712890625, 9.748046875, 10.93896484375, 12.1298828125, 13.32080078125, 14.51171875, 15.70263671875, 16.8935546875, 18.08447265625, 19.275390625, 20.46630859375, 21.6572265625, 22.84814453125, 24.0390625, 25.22998046875, 26.4208984375, 27.61181640625, 28.802734375, 29.99365234375, 31.1845703125, 32.37548828125, 33.56640625, 34.75732421875, 35.9482421875, 37.13916015625, 38.330078125, 39.52099609375, 40.7119140625, 41.90283203125, 43.09375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 7.0, 8.0, 3.0, 8.0, 13.0, 25.0, 34.0, 36.0, 48.0, 65.0, 91.0, 111.0, 172.0, 206.0, 279.0, 378.0, 560.0, 835.0, 1585.0, 3878.0, 13260.0, 67999.0, 461103.0, 416212.0, 61331.0, 12139.0, 3677.0, 1628.0, 863.0, 572.0, 352.0, 275.0, 203.0, 152.0, 102.0, 94.0, 68.0, 51.0, 28.0, 21.0, 24.0, 14.0, 16.0, 2.0, 9.0, 7.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-137.375, -132.939453125, -128.50390625, -124.068359375, -119.6328125, -115.197265625, -110.76171875, -106.326171875, -101.890625, -97.455078125, -93.01953125, -88.583984375, -84.1484375, -79.712890625, -75.27734375, -70.841796875, -66.40625, -61.970703125, -57.53515625, -53.099609375, -48.6640625, -44.228515625, -39.79296875, -35.357421875, -30.921875, -26.486328125, -22.05078125, -17.615234375, -13.1796875, -8.744140625, -4.30859375, 0.126953125, 4.5625, 8.998046875, 13.43359375, 17.869140625, 22.3046875, 26.740234375, 31.17578125, 35.611328125, 40.046875, 44.482421875, 48.91796875, 53.353515625, 57.7890625, 62.224609375, 66.66015625, 71.095703125, 75.53125, 79.966796875, 84.40234375, 88.837890625, 93.2734375, 97.708984375, 102.14453125, 106.580078125, 111.015625, 115.451171875, 119.88671875, 124.322265625, 128.7578125, 133.193359375, 137.62890625, 142.064453125, 146.5]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 4.0, 7.0, 4.0, 10.0, 10.0, 15.0, 11.0, 20.0, 23.0, 30.0, 36.0, 31.0, 29.0, 28.0, 50.0, 47.0, 44.0, 52.0, 49.0, 51.0, 35.0, 50.0, 37.0, 54.0, 36.0, 38.0, 27.0, 24.0, 29.0, 23.0, 13.0, 15.0, 23.0, 8.0, 8.0, 4.0, 7.0, 8.0, 6.0, 7.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-140.75, -135.767578125, -130.78515625, -125.802734375, -120.8203125, -115.837890625, -110.85546875, -105.873046875, -100.890625, -95.908203125, -90.92578125, -85.943359375, -80.9609375, -75.978515625, -70.99609375, -66.013671875, -61.03125, -56.048828125, -51.06640625, -46.083984375, -41.1015625, -36.119140625, -31.13671875, -26.154296875, -21.171875, -16.189453125, -11.20703125, -6.224609375, -1.2421875, 3.740234375, 8.72265625, 13.705078125, 18.6875, 23.669921875, 28.65234375, 33.634765625, 38.6171875, 43.599609375, 48.58203125, 53.564453125, 58.546875, 63.529296875, 68.51171875, 73.494140625, 78.4765625, 83.458984375, 88.44140625, 93.423828125, 98.40625, 103.388671875, 108.37109375, 113.353515625, 118.3359375, 123.318359375, 128.30078125, 133.283203125, 138.265625, 143.248046875, 148.23046875, 153.212890625, 158.1953125, 163.177734375, 168.16015625, 173.142578125, 178.125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 7.0, 7.0, 8.0, 15.0, 16.0, 37.0, 44.0, 74.0, 168.0, 373.0, 1073.0, 5022.0, 64096.0, 889191.0, 80774.0, 5701.0, 1168.0, 388.0, 160.0, 77.0, 52.0, 37.0, 21.0, 17.0, 12.0, 2.0, 2.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-109.625, -106.1484375, -102.671875, -99.1953125, -95.71875, -92.2421875, -88.765625, -85.2890625, -81.8125, -78.3359375, -74.859375, -71.3828125, -67.90625, -64.4296875, -60.953125, -57.4765625, -54.0, -50.5234375, -47.046875, -43.5703125, -40.09375, -36.6171875, -33.140625, -29.6640625, -26.1875, -22.7109375, -19.234375, -15.7578125, -12.28125, -8.8046875, -5.328125, -1.8515625, 1.625, 5.1015625, 8.578125, 12.0546875, 15.53125, 19.0078125, 22.484375, 25.9609375, 29.4375, 32.9140625, 36.390625, 39.8671875, 43.34375, 46.8203125, 50.296875, 53.7734375, 57.25, 60.7265625, 64.203125, 67.6796875, 71.15625, 74.6328125, 78.109375, 81.5859375, 85.0625, 88.5390625, 92.015625, 95.4921875, 98.96875, 102.4453125, 105.921875, 109.3984375, 112.875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 4.0, 4.0, 7.0, 7.0, 8.0, 15.0, 17.0, 19.0, 29.0, 26.0, 34.0, 64.0, 85.0, 82.0, 117.0, 101.0, 87.0, 64.0, 57.0, 32.0, 27.0, 22.0, 23.0, 16.0, 10.0, 5.0, 8.0, 7.0, 3.0, 2.0, 8.0, 3.0, 4.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01042938232421875, -0.010128378868103027, -0.009827375411987305, -0.009526371955871582, -0.00922536849975586, -0.008924365043640137, -0.008623361587524414, -0.008322358131408691, -0.008021354675292969, -0.007720351219177246, -0.0074193477630615234, -0.007118344306945801, -0.006817340850830078, -0.0065163373947143555, -0.006215333938598633, -0.00591433048248291, -0.0056133270263671875, -0.005312323570251465, -0.005011320114135742, -0.0047103166580200195, -0.004409313201904297, -0.004108309745788574, -0.0038073062896728516, -0.003506302833557129, -0.0032052993774414062, -0.0029042959213256836, -0.002603292465209961, -0.0023022890090942383, -0.0020012855529785156, -0.001700282096862793, -0.0013992786407470703, -0.0010982751846313477, -0.000797271728515625, -0.0004962682723999023, -0.0001952648162841797, 0.00010573863983154297, 0.0004067420959472656, 0.0007077455520629883, 0.001008749008178711, 0.0013097524642944336, 0.0016107559204101562, 0.001911759376525879, 0.0022127628326416016, 0.0025137662887573242, 0.002814769744873047, 0.0031157732009887695, 0.003416776657104492, 0.003717780113220215, 0.0040187835693359375, 0.00431978702545166, 0.004620790481567383, 0.0049217939376831055, 0.005222797393798828, 0.005523800849914551, 0.0058248043060302734, 0.006125807762145996, 0.006426811218261719, 0.006727814674377441, 0.007028818130493164, 0.007329821586608887, 0.007630825042724609, 0.007931828498840332, 0.008232831954956055, 0.008533835411071777, 0.0088348388671875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 6.0, 1.0, 8.0, 5.0, 13.0, 14.0, 22.0, 31.0, 52.0, 96.0, 162.0, 364.0, 833.0, 2196.0, 9651.0, 113398.0, 836066.0, 74685.0, 7690.0, 1923.0, 688.0, 293.0, 144.0, 86.0, 42.0, 28.0, 16.0, 12.0, 6.0, 11.0, 7.0, 6.0, 2.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-90.25, -87.37890625, -84.5078125, -81.63671875, -78.765625, -75.89453125, -73.0234375, -70.15234375, -67.28125, -64.41015625, -61.5390625, -58.66796875, -55.796875, -52.92578125, -50.0546875, -47.18359375, -44.3125, -41.44140625, -38.5703125, -35.69921875, -32.828125, -29.95703125, -27.0859375, -24.21484375, -21.34375, -18.47265625, -15.6015625, -12.73046875, -9.859375, -6.98828125, -4.1171875, -1.24609375, 1.625, 4.49609375, 7.3671875, 10.23828125, 13.109375, 15.98046875, 18.8515625, 21.72265625, 24.59375, 27.46484375, 30.3359375, 33.20703125, 36.078125, 38.94921875, 41.8203125, 44.69140625, 47.5625, 50.43359375, 53.3046875, 56.17578125, 59.046875, 61.91796875, 64.7890625, 67.66015625, 70.53125, 73.40234375, 76.2734375, 79.14453125, 82.015625, 84.88671875, 87.7578125, 90.62890625, 93.5]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 10.0, 8.0, 21.0, 13.0, 22.0, 28.0, 43.0, 52.0, 76.0, 72.0, 97.0, 101.0, 106.0, 88.0, 64.0, 59.0, 37.0, 29.0, 23.0, 14.0, 13.0, 5.0, 9.0, 8.0, 3.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.8125, -63.0234375, -61.234375, -59.4453125, -57.65625, -55.8671875, -54.078125, -52.2890625, -50.5, -48.7109375, -46.921875, -45.1328125, -43.34375, -41.5546875, -39.765625, -37.9765625, -36.1875, -34.3984375, -32.609375, -30.8203125, -29.03125, -27.2421875, -25.453125, -23.6640625, -21.875, -20.0859375, -18.296875, -16.5078125, -14.71875, -12.9296875, -11.140625, -9.3515625, -7.5625, -5.7734375, -3.984375, -2.1953125, -0.40625, 1.3828125, 3.171875, 4.9609375, 6.75, 8.5390625, 10.328125, 12.1171875, 13.90625, 15.6953125, 17.484375, 19.2734375, 21.0625, 22.8515625, 24.640625, 26.4296875, 28.21875, 30.0078125, 31.796875, 33.5859375, 35.375, 37.1640625, 38.953125, 40.7421875, 42.53125, 44.3203125, 46.109375, 47.8984375, 49.6875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 7.0, 5.0, 8.0, 12.0, 33.0, 55.0, 87.0, 101.0, 162.0, 150.0, 124.0, 99.0, 66.0, 29.0, 24.0, 17.0, 9.0, 7.0, 5.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-992.91943359375, -958.955322265625, -924.9912109375, -891.0270385742188, -857.0629272460938, -823.0988159179688, -789.1346435546875, -755.1705322265625, -721.2064208984375, -687.2423095703125, -653.2781982421875, -619.3140258789062, -585.3499145507812, -551.3858032226562, -517.421630859375, -483.45751953125, -449.493408203125, -415.529296875, -381.5651550292969, -347.60101318359375, -313.63690185546875, -279.67279052734375, -245.70864868164062, -211.74452209472656, -177.7803955078125, -143.81626892089844, -109.85214233398438, -75.88801574707031, -41.92388916015625, -7.9597625732421875, 26.004364013671875, 59.96849060058594, 93.9326171875, 127.89674377441406, 161.86087036132812, 195.8249969482422, 229.78912353515625, 263.75323486328125, 297.7173767089844, 331.6815185546875, 365.6456298828125, 399.6097412109375, 433.5738830566406, 467.53802490234375, 501.50213623046875, 535.4662475585938, 569.430419921875, 603.39453125, 637.358642578125, 671.32275390625, 705.286865234375, 739.2510375976562, 773.2151489257812, 807.1792602539062, 841.1434326171875, 875.1075439453125, 909.0716552734375, 943.0357666015625, 976.9998779296875, 1010.9640502929688, 1044.92822265625, 1078.892333984375, 1112.8564453125, 1146.820556640625, 1180.78466796875]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 0.0, 3.0, 2.0, 0.0, 5.0, 3.0, 7.0, 6.0, 14.0, 13.0, 12.0, 15.0, 19.0, 26.0, 21.0, 24.0, 35.0, 35.0, 37.0, 42.0, 39.0, 36.0, 40.0, 45.0, 60.0, 38.0, 45.0, 49.0, 31.0, 37.0, 30.0, 29.0, 31.0, 18.0, 28.0, 26.0, 18.0, 11.0, 11.0, 13.0, 10.0, 6.0, 10.0, 8.0, 4.0, 3.0, 4.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-631.4794921875, -611.931884765625, -592.3843383789062, -572.8367309570312, -553.2891845703125, -533.7415771484375, -514.1939697265625, -494.6463928222656, -475.09881591796875, -455.5512390136719, -436.003662109375, -416.4560546875, -396.9084777832031, -377.36090087890625, -357.81329345703125, -338.2657165527344, -318.7181396484375, -299.1705627441406, -279.62298583984375, -260.07537841796875, -240.52780151367188, -220.980224609375, -201.43263244628906, -181.88504028320312, -162.33746337890625, -142.78988647460938, -123.24229431152344, -103.69470977783203, -84.14712524414062, -64.59954071044922, -45.05195617675781, -25.504364013671875, -5.95672607421875, 13.590858459472656, 33.13844299316406, 52.68602752685547, 72.23361206054688, 91.78119659423828, 111.32878112792969, 130.87637329101562, 150.4239501953125, 169.97152709960938, 189.5191192626953, 209.06671142578125, 228.61428833007812, 248.161865234375, 267.70947265625, 287.2570495605469, 306.80462646484375, 326.3522033691406, 345.8997802734375, 365.4473876953125, 384.9949645996094, 404.54254150390625, 424.09014892578125, 443.6377258300781, 463.185302734375, 482.7328796386719, 502.28045654296875, 521.8280639648438, 541.3756103515625, 560.9232177734375, 580.4708251953125, 600.0184326171875, 619.5659790039062]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 8.0, 9.0, 11.0, 15.0, 17.0, 29.0, 34.0, 44.0, 60.0, 90.0, 169.0, 187.0, 320.0, 512.0, 846.0, 1501.0, 3113.0, 8558.0, 50595.0, 4077984.0, 36420.0, 7318.0, 2793.0, 1406.0, 816.0, 493.0, 311.0, 197.0, 129.0, 89.0, 58.0, 39.0, 34.0, 29.0, 8.0, 14.0, 10.0, 7.0, 6.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-174.125, -168.5859375, -163.046875, -157.5078125, -151.96875, -146.4296875, -140.890625, -135.3515625, -129.8125, -124.2734375, -118.734375, -113.1953125, -107.65625, -102.1171875, -96.578125, -91.0390625, -85.5, -79.9609375, -74.421875, -68.8828125, -63.34375, -57.8046875, -52.265625, -46.7265625, -41.1875, -35.6484375, -30.109375, -24.5703125, -19.03125, -13.4921875, -7.953125, -2.4140625, 3.125, 8.6640625, 14.203125, 19.7421875, 25.28125, 30.8203125, 36.359375, 41.8984375, 47.4375, 52.9765625, 58.515625, 64.0546875, 69.59375, 75.1328125, 80.671875, 86.2109375, 91.75, 97.2890625, 102.828125, 108.3671875, 113.90625, 119.4453125, 124.984375, 130.5234375, 136.0625, 141.6015625, 147.140625, 152.6796875, 158.21875, 163.7578125, 169.296875, 174.8359375, 180.375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 6.0, 3.0, 6.0, 7.0, 17.0, 14.0, 19.0, 24.0, 42.0, 39.0, 45.0, 43.0, 51.0, 62.0, 58.0, 66.0, 55.0, 56.0, 72.0, 47.0, 60.0, 41.0, 38.0, 36.0, 23.0, 17.0, 21.0, 8.0, 10.0, 5.0, 3.0, 4.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.8125, -41.47265625, -40.1328125, -38.79296875, -37.453125, -36.11328125, -34.7734375, -33.43359375, -32.09375, -30.75390625, -29.4140625, -28.07421875, -26.734375, -25.39453125, -24.0546875, -22.71484375, -21.375, -20.03515625, -18.6953125, -17.35546875, -16.015625, -14.67578125, -13.3359375, -11.99609375, -10.65625, -9.31640625, -7.9765625, -6.63671875, -5.296875, -3.95703125, -2.6171875, -1.27734375, 0.0625, 1.40234375, 2.7421875, 4.08203125, 5.421875, 6.76171875, 8.1015625, 9.44140625, 10.78125, 12.12109375, 13.4609375, 14.80078125, 16.140625, 17.48046875, 18.8203125, 20.16015625, 21.5, 22.83984375, 24.1796875, 25.51953125, 26.859375, 28.19921875, 29.5390625, 30.87890625, 32.21875, 33.55859375, 34.8984375, 36.23828125, 37.578125, 38.91796875, 40.2578125, 41.59765625, 42.9375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 6.0, 5.0, 9.0, 15.0, 17.0, 28.0, 33.0, 42.0, 54.0, 97.0, 140.0, 226.0, 362.0, 586.0, 1110.0, 2343.0, 5757.0, 23481.0, 4074554.0, 68806.0, 9625.0, 3376.0, 1522.0, 783.0, 477.0, 242.0, 201.0, 102.0, 75.0, 51.0, 44.0, 37.0, 16.0, 13.0, 13.0, 10.0, 8.0, 6.0, 1.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-229.5, -222.263671875, -215.02734375, -207.791015625, -200.5546875, -193.318359375, -186.08203125, -178.845703125, -171.609375, -164.373046875, -157.13671875, -149.900390625, -142.6640625, -135.427734375, -128.19140625, -120.955078125, -113.71875, -106.482421875, -99.24609375, -92.009765625, -84.7734375, -77.537109375, -70.30078125, -63.064453125, -55.828125, -48.591796875, -41.35546875, -34.119140625, -26.8828125, -19.646484375, -12.41015625, -5.173828125, 2.0625, 9.298828125, 16.53515625, 23.771484375, 31.0078125, 38.244140625, 45.48046875, 52.716796875, 59.953125, 67.189453125, 74.42578125, 81.662109375, 88.8984375, 96.134765625, 103.37109375, 110.607421875, 117.84375, 125.080078125, 132.31640625, 139.552734375, 146.7890625, 154.025390625, 161.26171875, 168.498046875, 175.734375, 182.970703125, 190.20703125, 197.443359375, 204.6796875, 211.916015625, 219.15234375, 226.388671875, 233.625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 2.0, 2.0, 4.0, 6.0, 6.0, 17.0, 28.0, 85.0, 3571.0, 241.0, 45.0, 21.0, 14.0, 10.0, 2.0, 4.0, 6.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.734375, -30.206298828125, -28.67822265625, -27.150146484375, -25.6220703125, -24.093994140625, -22.56591796875, -21.037841796875, -19.509765625, -17.981689453125, -16.45361328125, -14.925537109375, -13.3974609375, -11.869384765625, -10.34130859375, -8.813232421875, -7.28515625, -5.757080078125, -4.22900390625, -2.700927734375, -1.1728515625, 0.355224609375, 1.88330078125, 3.411376953125, 4.939453125, 6.467529296875, 7.99560546875, 9.523681640625, 11.0517578125, 12.579833984375, 14.10791015625, 15.635986328125, 17.1640625, 18.692138671875, 20.22021484375, 21.748291015625, 23.2763671875, 24.804443359375, 26.33251953125, 27.860595703125, 29.388671875, 30.916748046875, 32.44482421875, 33.972900390625, 35.5009765625, 37.029052734375, 38.55712890625, 40.085205078125, 41.61328125, 43.141357421875, 44.66943359375, 46.197509765625, 47.7255859375, 49.253662109375, 50.78173828125, 52.309814453125, 53.837890625, 55.365966796875, 56.89404296875, 58.422119140625, 59.9501953125, 61.478271484375, 63.00634765625, 64.534423828125, 66.0625]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 3.0, 16.0, 14.0, 26.0, 32.0, 41.0, 89.0, 132.0, 147.0, 124.0, 101.0, 88.0, 52.0, 44.0, 28.0, 19.0, 11.0, 9.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-166.2162322998047, -161.10142517089844, -155.9866180419922, -150.871826171875, -145.75701904296875, -140.6422119140625, -135.52740478515625, -130.41259765625, -125.29779815673828, -120.18299102783203, -115.06819152832031, -109.95338439941406, -104.83857727050781, -99.7237777709961, -94.60897064208984, -89.49417114257812, -84.37936401367188, -79.26455688476562, -74.1497573852539, -69.03495025634766, -63.92014694213867, -58.80534362792969, -53.69053649902344, -48.57573318481445, -43.46092987060547, -38.346126556396484, -33.2313232421875, -28.11651611328125, -23.001712799072266, -17.88690948486328, -12.772104263305664, -7.657299041748047, -2.5424957275390625, 2.5723085403442383, 7.687112808227539, 12.80191707611084, 17.91672134399414, 23.031524658203125, 28.146329879760742, 33.26113510131836, 38.375938415527344, 43.49074172973633, 48.60554504394531, 53.72035217285156, 58.83515548706055, 63.94995880126953, 69.06476593017578, 74.1795654296875, 79.29437255859375, 84.4091796875, 89.52397918701172, 94.63878631591797, 99.75358581542969, 104.86839294433594, 109.98320007324219, 115.09800720214844, 120.21280670166016, 125.3276138305664, 130.44241333007812, 135.55722045898438, 140.67202758789062, 145.78683471679688, 150.90162658691406, 156.0164337158203, 161.13124084472656]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 7.0, 5.0, 3.0, 5.0, 7.0, 15.0, 10.0, 18.0, 26.0, 22.0, 18.0, 25.0, 34.0, 27.0, 41.0, 31.0, 40.0, 30.0, 47.0, 47.0, 36.0, 34.0, 44.0, 35.0, 43.0, 31.0, 32.0, 24.0, 37.0, 24.0, 23.0, 25.0, 22.0, 12.0, 20.0, 20.0, 13.0, 14.0, 8.0, 11.0, 11.0, 8.0, 9.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-68.31822204589844, -66.04344940185547, -63.768680572509766, -61.49391174316406, -59.219139099121094, -56.94437026977539, -54.66960144042969, -52.39482879638672, -50.12005615234375, -47.84528732299805, -45.57051467895508, -43.295745849609375, -41.020973205566406, -38.7462043762207, -36.471435546875, -34.19666290283203, -31.921894073486328, -29.647123336791992, -27.372352600097656, -25.097583770751953, -22.822811126708984, -20.54804229736328, -18.273271560668945, -15.99850082397461, -13.723730087280273, -11.448959350585938, -9.174188613891602, -6.899418830871582, -4.624648094177246, -2.34987735748291, -0.07510757446289062, 2.1996631622314453, 4.474433898925781, 6.749204635620117, 9.023975372314453, 11.298745155334473, 13.573515892028809, 15.848286628723145, 18.123056411743164, 20.3978271484375, 22.672597885131836, 24.947368621826172, 27.222139358520508, 29.496910095214844, 31.771678924560547, 34.046451568603516, 36.32122039794922, 38.59599304199219, 40.87076187133789, 43.145530700683594, 45.42030334472656, 47.695072174072266, 49.969844818115234, 52.24461364746094, 54.519386291503906, 56.79415512084961, 59.06892395019531, 61.343692779541016, 63.618465423583984, 65.89323425292969, 68.16800689697266, 70.44277954101562, 72.71754455566406, 74.99231719970703, 77.26708984375]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 4.0, 2.0, 8.0, 4.0, 3.0, 11.0, 15.0, 21.0, 42.0, 48.0, 66.0, 134.0, 175.0, 352.0, 541.0, 972.0, 1983.0, 3958.0, 8023.0, 17636.0, 40619.0, 96317.0, 219626.0, 329754.0, 185405.0, 79785.0, 33932.0, 14896.0, 6944.0, 3358.0, 1749.0, 936.0, 478.0, 269.0, 190.0, 109.0, 69.0, 58.0, 23.0, 16.0, 15.0, 8.0, 5.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-53.03125, -51.02197265625, -49.0126953125, -47.00341796875, -44.994140625, -42.98486328125, -40.9755859375, -38.96630859375, -36.95703125, -34.94775390625, -32.9384765625, -30.92919921875, -28.919921875, -26.91064453125, -24.9013671875, -22.89208984375, -20.8828125, -18.87353515625, -16.8642578125, -14.85498046875, -12.845703125, -10.83642578125, -8.8271484375, -6.81787109375, -4.80859375, -2.79931640625, -0.7900390625, 1.21923828125, 3.228515625, 5.23779296875, 7.2470703125, 9.25634765625, 11.265625, 13.27490234375, 15.2841796875, 17.29345703125, 19.302734375, 21.31201171875, 23.3212890625, 25.33056640625, 27.33984375, 29.34912109375, 31.3583984375, 33.36767578125, 35.376953125, 37.38623046875, 39.3955078125, 41.40478515625, 43.4140625, 45.42333984375, 47.4326171875, 49.44189453125, 51.451171875, 53.46044921875, 55.4697265625, 57.47900390625, 59.48828125, 61.49755859375, 63.5068359375, 65.51611328125, 67.525390625, 69.53466796875, 71.5439453125, 73.55322265625, 75.5625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 9.0, 3.0, 5.0, 10.0, 13.0, 18.0, 21.0, 34.0, 37.0, 39.0, 33.0, 51.0, 47.0, 43.0, 70.0, 57.0, 58.0, 66.0, 66.0, 50.0, 52.0, 45.0, 39.0, 41.0, 20.0, 17.0, 23.0, 13.0, 7.0, 11.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-48.03125, -46.57958984375, -45.1279296875, -43.67626953125, -42.224609375, -40.77294921875, -39.3212890625, -37.86962890625, -36.41796875, -34.96630859375, -33.5146484375, -32.06298828125, -30.611328125, -29.15966796875, -27.7080078125, -26.25634765625, -24.8046875, -23.35302734375, -21.9013671875, -20.44970703125, -18.998046875, -17.54638671875, -16.0947265625, -14.64306640625, -13.19140625, -11.73974609375, -10.2880859375, -8.83642578125, -7.384765625, -5.93310546875, -4.4814453125, -3.02978515625, -1.578125, -0.12646484375, 1.3251953125, 2.77685546875, 4.228515625, 5.68017578125, 7.1318359375, 8.58349609375, 10.03515625, 11.48681640625, 12.9384765625, 14.39013671875, 15.841796875, 17.29345703125, 18.7451171875, 20.19677734375, 21.6484375, 23.10009765625, 24.5517578125, 26.00341796875, 27.455078125, 28.90673828125, 30.3583984375, 31.81005859375, 33.26171875, 34.71337890625, 36.1650390625, 37.61669921875, 39.068359375, 40.52001953125, 41.9716796875, 43.42333984375, 44.875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 3.0, 7.0, 15.0, 12.0, 10.0, 17.0, 34.0, 41.0, 38.0, 63.0, 117.0, 120.0, 165.0, 213.0, 328.0, 423.0, 628.0, 1008.0, 2049.0, 5430.0, 25014.0, 187664.0, 687610.0, 111912.0, 16977.0, 4198.0, 1625.0, 846.0, 542.0, 376.0, 273.0, 206.0, 145.0, 116.0, 92.0, 58.0, 46.0, 38.0, 26.0, 14.0, 14.0, 17.0, 12.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-136.125, -131.64453125, -127.1640625, -122.68359375, -118.203125, -113.72265625, -109.2421875, -104.76171875, -100.28125, -95.80078125, -91.3203125, -86.83984375, -82.359375, -77.87890625, -73.3984375, -68.91796875, -64.4375, -59.95703125, -55.4765625, -50.99609375, -46.515625, -42.03515625, -37.5546875, -33.07421875, -28.59375, -24.11328125, -19.6328125, -15.15234375, -10.671875, -6.19140625, -1.7109375, 2.76953125, 7.25, 11.73046875, 16.2109375, 20.69140625, 25.171875, 29.65234375, 34.1328125, 38.61328125, 43.09375, 47.57421875, 52.0546875, 56.53515625, 61.015625, 65.49609375, 69.9765625, 74.45703125, 78.9375, 83.41796875, 87.8984375, 92.37890625, 96.859375, 101.33984375, 105.8203125, 110.30078125, 114.78125, 119.26171875, 123.7421875, 128.22265625, 132.703125, 137.18359375, 141.6640625, 146.14453125, 150.625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 3.0, 2.0, 10.0, 7.0, 6.0, 8.0, 13.0, 15.0, 9.0, 23.0, 19.0, 22.0, 36.0, 30.0, 29.0, 32.0, 38.0, 40.0, 38.0, 52.0, 42.0, 40.0, 34.0, 44.0, 47.0, 49.0, 42.0, 29.0, 37.0, 34.0, 14.0, 27.0, 14.0, 21.0, 19.0, 15.0, 13.0, 15.0, 3.0, 8.0, 13.0, 7.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-136.125, -131.38671875, -126.6484375, -121.91015625, -117.171875, -112.43359375, -107.6953125, -102.95703125, -98.21875, -93.48046875, -88.7421875, -84.00390625, -79.265625, -74.52734375, -69.7890625, -65.05078125, -60.3125, -55.57421875, -50.8359375, -46.09765625, -41.359375, -36.62109375, -31.8828125, -27.14453125, -22.40625, -17.66796875, -12.9296875, -8.19140625, -3.453125, 1.28515625, 6.0234375, 10.76171875, 15.5, 20.23828125, 24.9765625, 29.71484375, 34.453125, 39.19140625, 43.9296875, 48.66796875, 53.40625, 58.14453125, 62.8828125, 67.62109375, 72.359375, 77.09765625, 81.8359375, 86.57421875, 91.3125, 96.05078125, 100.7890625, 105.52734375, 110.265625, 115.00390625, 119.7421875, 124.48046875, 129.21875, 133.95703125, 138.6953125, 143.43359375, 148.171875, 152.91015625, 157.6484375, 162.38671875, 167.125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 5.0, 4.0, 4.0, 6.0, 10.0, 17.0, 27.0, 31.0, 59.0, 88.0, 214.0, 490.0, 1574.0, 11380.0, 536901.0, 484364.0, 10929.0, 1558.0, 457.0, 202.0, 98.0, 52.0, 34.0, 18.0, 15.0, 11.0, 8.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-151.0, -147.025390625, -143.05078125, -139.076171875, -135.1015625, -131.126953125, -127.15234375, -123.177734375, -119.203125, -115.228515625, -111.25390625, -107.279296875, -103.3046875, -99.330078125, -95.35546875, -91.380859375, -87.40625, -83.431640625, -79.45703125, -75.482421875, -71.5078125, -67.533203125, -63.55859375, -59.583984375, -55.609375, -51.634765625, -47.66015625, -43.685546875, -39.7109375, -35.736328125, -31.76171875, -27.787109375, -23.8125, -19.837890625, -15.86328125, -11.888671875, -7.9140625, -3.939453125, 0.03515625, 4.009765625, 7.984375, 11.958984375, 15.93359375, 19.908203125, 23.8828125, 27.857421875, 31.83203125, 35.806640625, 39.78125, 43.755859375, 47.73046875, 51.705078125, 55.6796875, 59.654296875, 63.62890625, 67.603515625, 71.578125, 75.552734375, 79.52734375, 83.501953125, 87.4765625, 91.451171875, 95.42578125, 99.400390625, 103.375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 2.0, 4.0, 5.0, 5.0, 24.0, 25.0, 36.0, 42.0, 55.0, 120.0, 167.0, 162.0, 106.0, 77.0, 56.0, 30.0, 17.0, 19.0, 13.0, 13.0, 5.0, 8.0, 4.0, 5.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00804901123046875, -0.007666945457458496, -0.007284879684448242, -0.006902813911437988, -0.006520748138427734, -0.0061386823654174805, -0.0057566165924072266, -0.005374550819396973, -0.004992485046386719, -0.004610419273376465, -0.004228353500366211, -0.003846287727355957, -0.003464221954345703, -0.0030821561813354492, -0.0027000904083251953, -0.0023180246353149414, -0.0019359588623046875, -0.0015538930892944336, -0.0011718273162841797, -0.0007897615432739258, -0.0004076957702636719, -2.562999725341797e-05, 0.00035643577575683594, 0.0007385015487670898, 0.0011205673217773438, 0.0015026330947875977, 0.0018846988677978516, 0.0022667646408081055, 0.0026488304138183594, 0.0030308961868286133, 0.003412961959838867, 0.003795027732849121, 0.004177093505859375, 0.004559159278869629, 0.004941225051879883, 0.005323290824890137, 0.005705356597900391, 0.0060874223709106445, 0.0064694881439208984, 0.006851553916931152, 0.007233619689941406, 0.00761568546295166, 0.007997751235961914, 0.008379817008972168, 0.008761882781982422, 0.009143948554992676, 0.00952601432800293, 0.009908080101013184, 0.010290145874023438, 0.010672211647033691, 0.011054277420043945, 0.0114363431930542, 0.011818408966064453, 0.012200474739074707, 0.012582540512084961, 0.012964606285095215, 0.013346672058105469, 0.013728737831115723, 0.014110803604125977, 0.01449286937713623, 0.014874935150146484, 0.015257000923156738, 0.015639066696166992, 0.016021132469177246, 0.0164031982421875]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 5.0, 5.0, 8.0, 5.0, 11.0, 20.0, 40.0, 52.0, 114.0, 264.0, 549.0, 1391.0, 5416.0, 51156.0, 839494.0, 137224.0, 9574.0, 1989.0, 640.0, 269.0, 155.0, 73.0, 40.0, 27.0, 17.0, 8.0, 9.0, 3.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.625, -67.36328125, -64.1015625, -60.83984375, -57.578125, -54.31640625, -51.0546875, -47.79296875, -44.53125, -41.26953125, -38.0078125, -34.74609375, -31.484375, -28.22265625, -24.9609375, -21.69921875, -18.4375, -15.17578125, -11.9140625, -8.65234375, -5.390625, -2.12890625, 1.1328125, 4.39453125, 7.65625, 10.91796875, 14.1796875, 17.44140625, 20.703125, 23.96484375, 27.2265625, 30.48828125, 33.75, 37.01171875, 40.2734375, 43.53515625, 46.796875, 50.05859375, 53.3203125, 56.58203125, 59.84375, 63.10546875, 66.3671875, 69.62890625, 72.890625, 76.15234375, 79.4140625, 82.67578125, 85.9375, 89.19921875, 92.4609375, 95.72265625, 98.984375, 102.24609375, 105.5078125, 108.76953125, 112.03125, 115.29296875, 118.5546875, 121.81640625, 125.078125, 128.33984375, 131.6015625, 134.86328125, 138.125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 5.0, 4.0, 5.0, 8.0, 10.0, 7.0, 20.0, 22.0, 35.0, 37.0, 42.0, 57.0, 63.0, 74.0, 82.0, 82.0, 74.0, 78.0, 58.0, 42.0, 40.0, 33.0, 32.0, 30.0, 19.0, 12.0, 9.0, 9.0, 3.0, 6.0, 7.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-43.40625, -41.81298828125, -40.2197265625, -38.62646484375, -37.033203125, -35.43994140625, -33.8466796875, -32.25341796875, -30.66015625, -29.06689453125, -27.4736328125, -25.88037109375, -24.287109375, -22.69384765625, -21.1005859375, -19.50732421875, -17.9140625, -16.32080078125, -14.7275390625, -13.13427734375, -11.541015625, -9.94775390625, -8.3544921875, -6.76123046875, -5.16796875, -3.57470703125, -1.9814453125, -0.38818359375, 1.205078125, 2.79833984375, 4.3916015625, 5.98486328125, 7.578125, 9.17138671875, 10.7646484375, 12.35791015625, 13.951171875, 15.54443359375, 17.1376953125, 18.73095703125, 20.32421875, 21.91748046875, 23.5107421875, 25.10400390625, 26.697265625, 28.29052734375, 29.8837890625, 31.47705078125, 33.0703125, 34.66357421875, 36.2568359375, 37.85009765625, 39.443359375, 41.03662109375, 42.6298828125, 44.22314453125, 45.81640625, 47.40966796875, 49.0029296875, 50.59619140625, 52.189453125, 53.78271484375, 55.3759765625, 56.96923828125, 58.5625]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 13.0, 41.0, 174.0, 419.0, 258.0, 67.0, 15.0, 10.0, 4.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1573.348876953125, -1488.7479248046875, -1404.14697265625, -1319.546142578125, -1234.9451904296875, -1150.34423828125, -1065.743408203125, -981.1424560546875, -896.54150390625, -811.9405517578125, -727.3396606445312, -642.73876953125, -558.1378173828125, -473.5368957519531, -388.93597412109375, -304.3350830078125, -219.734130859375, -135.13320922851562, -50.53228759765625, 34.068634033203125, 118.6695556640625, 203.27047729492188, 287.87139892578125, 372.4722900390625, 457.0732421875, 541.6741943359375, 626.2750854492188, 710.8759765625, 795.4769287109375, 880.077880859375, 964.6787719726562, 1049.2796630859375, 1133.88037109375, 1218.4813232421875, 1303.082275390625, 1387.68310546875, 1472.2840576171875, 1556.885009765625, 1641.48583984375, 1726.0867919921875, 1810.687744140625, 1895.2886962890625, 1979.8896484375, 2064.490478515625, 2149.09130859375, 2233.6923828125, 2318.293212890625, 2402.89404296875, 2487.4951171875, 2572.095947265625, 2656.697021484375, 2741.2978515625, 2825.89892578125, 2910.499755859375, 2995.1005859375, 3079.70166015625, 3164.302490234375, 3248.9033203125, 3333.50439453125, 3418.105224609375, 3502.7060546875, 3587.30712890625, 3671.907958984375, 3756.5087890625, 3841.10986328125]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 6.0, 7.0, 6.0, 6.0, 6.0, 12.0, 14.0, 10.0, 8.0, 13.0, 34.0, 18.0, 30.0, 24.0, 32.0, 38.0, 37.0, 47.0, 47.0, 64.0, 64.0, 45.0, 55.0, 34.0, 51.0, 42.0, 33.0, 31.0, 30.0, 24.0, 20.0, 15.0, 14.0, 12.0, 9.0, 6.0, 18.0, 11.0, 6.0, 4.0, 8.0, 6.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-665.8525390625, -644.0042724609375, -622.1559448242188, -600.3076782226562, -578.4594116210938, -556.611083984375, -534.7628173828125, -512.91455078125, -491.0662536621094, -469.21795654296875, -447.36968994140625, -425.5213928222656, -403.673095703125, -381.8248291015625, -359.9765319824219, -338.12823486328125, -316.27996826171875, -294.4316711425781, -272.5834045410156, -250.735107421875, -228.88682556152344, -207.03854370117188, -185.19024658203125, -163.3419647216797, -141.49368286132812, -119.64540100097656, -97.79711151123047, -75.94882202148438, -54.10054016113281, -32.25225830078125, -10.403961181640625, 11.444320678710938, 33.2926025390625, 55.14088821411133, 76.98917388916016, 98.83746337890625, 120.68574523925781, 142.53402709960938, 164.38232421875, 186.23060607910156, 208.07888793945312, 229.9271697998047, 251.77545166015625, 273.6237487792969, 295.4720458984375, 317.3203125, 339.1686096191406, 361.01690673828125, 382.86517333984375, 404.7134704589844, 426.5617370605469, 448.4100341796875, 470.25830078125, 492.1065979003906, 513.9548950195312, 535.8031616210938, 557.6514892578125, 579.499755859375, 601.3480834960938, 623.1963500976562, 645.0446166992188, 666.8929443359375, 688.7412109375, 710.5894775390625, 732.437744140625]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 8.0, 9.0, 8.0, 11.0, 18.0, 16.0, 31.0, 37.0, 53.0, 78.0, 111.0, 151.0, 234.0, 299.0, 481.0, 656.0, 874.0, 1307.0, 2059.0, 3323.0, 6516.0, 15383.0, 66812.0, 3951291.0, 106775.0, 19382.0, 7422.0, 3844.0, 2289.0, 1540.0, 1011.0, 713.0, 501.0, 343.0, 210.0, 139.0, 109.0, 75.0, 56.0, 28.0, 20.0, 24.0, 7.0, 12.0, 6.0, 4.0, 3.0, 8.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-102.375, -99.029296875, -95.68359375, -92.337890625, -88.9921875, -85.646484375, -82.30078125, -78.955078125, -75.609375, -72.263671875, -68.91796875, -65.572265625, -62.2265625, -58.880859375, -55.53515625, -52.189453125, -48.84375, -45.498046875, -42.15234375, -38.806640625, -35.4609375, -32.115234375, -28.76953125, -25.423828125, -22.078125, -18.732421875, -15.38671875, -12.041015625, -8.6953125, -5.349609375, -2.00390625, 1.341796875, 4.6875, 8.033203125, 11.37890625, 14.724609375, 18.0703125, 21.416015625, 24.76171875, 28.107421875, 31.453125, 34.798828125, 38.14453125, 41.490234375, 44.8359375, 48.181640625, 51.52734375, 54.873046875, 58.21875, 61.564453125, 64.91015625, 68.255859375, 71.6015625, 74.947265625, 78.29296875, 81.638671875, 84.984375, 88.330078125, 91.67578125, 95.021484375, 98.3671875, 101.712890625, 105.05859375, 108.404296875, 111.75]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 3.0, 2.0, 0.0, 2.0, 9.0, 12.0, 11.0, 16.0, 23.0, 39.0, 41.0, 45.0, 48.0, 52.0, 69.0, 61.0, 75.0, 86.0, 76.0, 62.0, 64.0, 45.0, 31.0, 33.0, 37.0, 16.0, 13.0, 8.0, 11.0, 5.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.125, -41.51416015625, -39.9033203125, -38.29248046875, -36.681640625, -35.07080078125, -33.4599609375, -31.84912109375, -30.23828125, -28.62744140625, -27.0166015625, -25.40576171875, -23.794921875, -22.18408203125, -20.5732421875, -18.96240234375, -17.3515625, -15.74072265625, -14.1298828125, -12.51904296875, -10.908203125, -9.29736328125, -7.6865234375, -6.07568359375, -4.46484375, -2.85400390625, -1.2431640625, 0.36767578125, 1.978515625, 3.58935546875, 5.2001953125, 6.81103515625, 8.421875, 10.03271484375, 11.6435546875, 13.25439453125, 14.865234375, 16.47607421875, 18.0869140625, 19.69775390625, 21.30859375, 22.91943359375, 24.5302734375, 26.14111328125, 27.751953125, 29.36279296875, 30.9736328125, 32.58447265625, 34.1953125, 35.80615234375, 37.4169921875, 39.02783203125, 40.638671875, 42.24951171875, 43.8603515625, 45.47119140625, 47.08203125, 48.69287109375, 50.3037109375, 51.91455078125, 53.525390625, 55.13623046875, 56.7470703125, 58.35791015625, 59.96875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 9.0, 3.0, 11.0, 25.0, 21.0, 33.0, 43.0, 70.0, 83.0, 121.0, 217.0, 341.0, 492.0, 868.0, 1453.0, 2680.0, 5226.0, 12571.0, 42613.0, 3848548.0, 234037.0, 26205.0, 9161.0, 4125.0, 2175.0, 1203.0, 707.0, 443.0, 258.0, 155.0, 124.0, 84.0, 56.0, 37.0, 27.0, 16.0, 11.0, 9.0, 9.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-148.5, -144.236328125, -139.97265625, -135.708984375, -131.4453125, -127.181640625, -122.91796875, -118.654296875, -114.390625, -110.126953125, -105.86328125, -101.599609375, -97.3359375, -93.072265625, -88.80859375, -84.544921875, -80.28125, -76.017578125, -71.75390625, -67.490234375, -63.2265625, -58.962890625, -54.69921875, -50.435546875, -46.171875, -41.908203125, -37.64453125, -33.380859375, -29.1171875, -24.853515625, -20.58984375, -16.326171875, -12.0625, -7.798828125, -3.53515625, 0.728515625, 4.9921875, 9.255859375, 13.51953125, 17.783203125, 22.046875, 26.310546875, 30.57421875, 34.837890625, 39.1015625, 43.365234375, 47.62890625, 51.892578125, 56.15625, 60.419921875, 64.68359375, 68.947265625, 73.2109375, 77.474609375, 81.73828125, 86.001953125, 90.265625, 94.529296875, 98.79296875, 103.056640625, 107.3203125, 111.583984375, 115.84765625, 120.111328125, 124.375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 6.0, 6.0, 2.0, 10.0, 10.0, 16.0, 13.0, 29.0, 52.0, 183.0, 3153.0, 354.0, 97.0, 38.0, 23.0, 17.0, 13.0, 13.0, 8.0, 7.0, 4.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-61.5, -59.67333984375, -57.8466796875, -56.02001953125, -54.193359375, -52.36669921875, -50.5400390625, -48.71337890625, -46.88671875, -45.06005859375, -43.2333984375, -41.40673828125, -39.580078125, -37.75341796875, -35.9267578125, -34.10009765625, -32.2734375, -30.44677734375, -28.6201171875, -26.79345703125, -24.966796875, -23.14013671875, -21.3134765625, -19.48681640625, -17.66015625, -15.83349609375, -14.0068359375, -12.18017578125, -10.353515625, -8.52685546875, -6.7001953125, -4.87353515625, -3.046875, -1.22021484375, 0.6064453125, 2.43310546875, 4.259765625, 6.08642578125, 7.9130859375, 9.73974609375, 11.56640625, 13.39306640625, 15.2197265625, 17.04638671875, 18.873046875, 20.69970703125, 22.5263671875, 24.35302734375, 26.1796875, 28.00634765625, 29.8330078125, 31.65966796875, 33.486328125, 35.31298828125, 37.1396484375, 38.96630859375, 40.79296875, 42.61962890625, 44.4462890625, 46.27294921875, 48.099609375, 49.92626953125, 51.7529296875, 53.57958984375, 55.40625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0, 6.0, 6.0, 8.0, 9.0, 8.0, 8.0, 19.0, 14.0, 23.0, 35.0, 40.0, 66.0, 50.0, 69.0, 84.0, 85.0, 80.0, 74.0, 76.0, 56.0, 40.0, 41.0, 18.0, 30.0, 14.0, 9.0, 7.0, 6.0, 6.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 5.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-182.44300842285156, -177.17477416992188, -171.9065399169922, -166.6383056640625, -161.3700714111328, -156.10183715820312, -150.83360290527344, -145.56536865234375, -140.297119140625, -135.0288848876953, -129.76065063476562, -124.49241638183594, -119.22418212890625, -113.95594787597656, -108.68770599365234, -103.41947174072266, -98.1512451171875, -92.88301086425781, -87.61477661132812, -82.34654235839844, -77.07830810546875, -71.81007385253906, -66.54183197021484, -61.273597717285156, -56.00536346435547, -50.73712921142578, -45.468894958496094, -40.20065689086914, -34.93242263793945, -29.664188385009766, -24.395952224731445, -19.127716064453125, -13.859466552734375, -8.591231346130371, -3.322996139526367, 1.9452390670776367, 7.213474273681641, 12.481708526611328, 17.74994468688965, 23.01818084716797, 28.286415100097656, 33.554649353027344, 38.82288360595703, 44.091121673583984, 49.35935592651367, 54.62759017944336, 59.89582824707031, 65.1640625, 70.43229675292969, 75.70053100585938, 80.96876525878906, 86.23699951171875, 91.50523376464844, 96.77346801757812, 102.04170989990234, 107.30994415283203, 112.57817840576172, 117.8464126586914, 123.1146469116211, 128.3828887939453, 133.651123046875, 138.9193572998047, 144.18759155273438, 149.45582580566406, 154.72406005859375]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 8.0, 9.0, 11.0, 13.0, 16.0, 17.0, 22.0, 19.0, 23.0, 27.0, 32.0, 25.0, 28.0, 32.0, 42.0, 51.0, 42.0, 56.0, 37.0, 42.0, 44.0, 50.0, 48.0, 38.0, 39.0, 32.0, 33.0, 26.0, 19.0, 17.0, 12.0, 18.0, 11.0, 12.0, 8.0, 6.0, 10.0, 8.0, 5.0, 3.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-126.29916381835938, -121.89496612548828, -117.49076843261719, -113.0865707397461, -108.682373046875, -104.27818298339844, -99.87398529052734, -95.46978759765625, -91.06558990478516, -86.66139221191406, -82.25719451904297, -77.85299682617188, -73.44880676269531, -69.04460144042969, -64.64041137695312, -60.23621368408203, -55.83201599121094, -51.427818298339844, -47.02362060546875, -42.61942672729492, -38.21522903442383, -33.811031341552734, -29.406835556030273, -25.002639770507812, -20.59844207763672, -16.194244384765625, -11.790048599243164, -7.385851860046387, -2.9816551208496094, 1.4225425720214844, 5.826738357543945, 10.230934143066406, 14.635147094726562, 19.039344787597656, 23.443540573120117, 27.847736358642578, 32.25193405151367, 36.656131744384766, 41.060325622558594, 45.46452331542969, 49.86872100830078, 54.272918701171875, 58.67711639404297, 63.0813102722168, 67.48550415039062, 71.88970947265625, 76.29389953613281, 80.6980972290039, 85.102294921875, 89.5064926147461, 93.91069030761719, 98.31488800048828, 102.71908569335938, 107.12327575683594, 111.52747344970703, 115.93167114257812, 120.33586883544922, 124.74006652832031, 129.14425659179688, 133.5484619140625, 137.95265197753906, 142.3568572998047, 146.76104736328125, 151.16525268554688, 155.56944274902344]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 6.0, 2.0, 2.0, 9.0, 8.0, 20.0, 17.0, 27.0, 62.0, 72.0, 147.0, 278.0, 461.0, 864.0, 1788.0, 3796.0, 8571.0, 20612.0, 51494.0, 133696.0, 330232.0, 299389.0, 117840.0, 46089.0, 18345.0, 7912.0, 3400.0, 1615.0, 843.0, 426.0, 216.0, 138.0, 68.0, 45.0, 22.0, 14.0, 13.0, 8.0, 7.0, 3.0, 1.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-87.9375, -84.8984375, -81.859375, -78.8203125, -75.78125, -72.7421875, -69.703125, -66.6640625, -63.625, -60.5859375, -57.546875, -54.5078125, -51.46875, -48.4296875, -45.390625, -42.3515625, -39.3125, -36.2734375, -33.234375, -30.1953125, -27.15625, -24.1171875, -21.078125, -18.0390625, -15.0, -11.9609375, -8.921875, -5.8828125, -2.84375, 0.1953125, 3.234375, 6.2734375, 9.3125, 12.3515625, 15.390625, 18.4296875, 21.46875, 24.5078125, 27.546875, 30.5859375, 33.625, 36.6640625, 39.703125, 42.7421875, 45.78125, 48.8203125, 51.859375, 54.8984375, 57.9375, 60.9765625, 64.015625, 67.0546875, 70.09375, 73.1328125, 76.171875, 79.2109375, 82.25, 85.2890625, 88.328125, 91.3671875, 94.40625, 97.4453125, 100.484375, 103.5234375, 106.5625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 3.0, 3.0, 15.0, 11.0, 10.0, 23.0, 27.0, 32.0, 37.0, 29.0, 46.0, 44.0, 44.0, 52.0, 62.0, 67.0, 74.0, 53.0, 55.0, 57.0, 54.0, 42.0, 37.0, 24.0, 17.0, 19.0, 13.0, 11.0, 9.0, 8.0, 8.0, 5.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.78125, -39.30859375, -37.8359375, -36.36328125, -34.890625, -33.41796875, -31.9453125, -30.47265625, -29.0, -27.52734375, -26.0546875, -24.58203125, -23.109375, -21.63671875, -20.1640625, -18.69140625, -17.21875, -15.74609375, -14.2734375, -12.80078125, -11.328125, -9.85546875, -8.3828125, -6.91015625, -5.4375, -3.96484375, -2.4921875, -1.01953125, 0.453125, 1.92578125, 3.3984375, 4.87109375, 6.34375, 7.81640625, 9.2890625, 10.76171875, 12.234375, 13.70703125, 15.1796875, 16.65234375, 18.125, 19.59765625, 21.0703125, 22.54296875, 24.015625, 25.48828125, 26.9609375, 28.43359375, 29.90625, 31.37890625, 32.8515625, 34.32421875, 35.796875, 37.26953125, 38.7421875, 40.21484375, 41.6875, 43.16015625, 44.6328125, 46.10546875, 47.578125, 49.05078125, 50.5234375, 51.99609375, 53.46875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 7.0, 8.0, 9.0, 7.0, 20.0, 28.0, 42.0, 61.0, 103.0, 143.0, 237.0, 437.0, 885.0, 2388.0, 12912.0, 200301.0, 773738.0, 48838.0, 5517.0, 1386.0, 621.0, 308.0, 185.0, 112.0, 97.0, 57.0, 37.0, 30.0, 16.0, 13.0, 7.0, 5.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-267.75, -259.453125, -251.15625, -242.859375, -234.5625, -226.265625, -217.96875, -209.671875, -201.375, -193.078125, -184.78125, -176.484375, -168.1875, -159.890625, -151.59375, -143.296875, -135.0, -126.703125, -118.40625, -110.109375, -101.8125, -93.515625, -85.21875, -76.921875, -68.625, -60.328125, -52.03125, -43.734375, -35.4375, -27.140625, -18.84375, -10.546875, -2.25, 6.046875, 14.34375, 22.640625, 30.9375, 39.234375, 47.53125, 55.828125, 64.125, 72.421875, 80.71875, 89.015625, 97.3125, 105.609375, 113.90625, 122.203125, 130.5, 138.796875, 147.09375, 155.390625, 163.6875, 171.984375, 180.28125, 188.578125, 196.875, 205.171875, 213.46875, 221.765625, 230.0625, 238.359375, 246.65625, 254.953125, 263.25]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 5.0, 6.0, 5.0, 8.0, 10.0, 15.0, 15.0, 19.0, 27.0, 24.0, 33.0, 29.0, 26.0, 42.0, 47.0, 49.0, 52.0, 49.0, 53.0, 44.0, 60.0, 56.0, 52.0, 35.0, 40.0, 29.0, 23.0, 41.0, 25.0, 13.0, 14.0, 21.0, 11.0, 5.0, 5.0, 9.0, 4.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-165.375, -160.01171875, -154.6484375, -149.28515625, -143.921875, -138.55859375, -133.1953125, -127.83203125, -122.46875, -117.10546875, -111.7421875, -106.37890625, -101.015625, -95.65234375, -90.2890625, -84.92578125, -79.5625, -74.19921875, -68.8359375, -63.47265625, -58.109375, -52.74609375, -47.3828125, -42.01953125, -36.65625, -31.29296875, -25.9296875, -20.56640625, -15.203125, -9.83984375, -4.4765625, 0.88671875, 6.25, 11.61328125, 16.9765625, 22.33984375, 27.703125, 33.06640625, 38.4296875, 43.79296875, 49.15625, 54.51953125, 59.8828125, 65.24609375, 70.609375, 75.97265625, 81.3359375, 86.69921875, 92.0625, 97.42578125, 102.7890625, 108.15234375, 113.515625, 118.87890625, 124.2421875, 129.60546875, 134.96875, 140.33203125, 145.6953125, 151.05859375, 156.421875, 161.78515625, 167.1484375, 172.51171875, 177.875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 5.0, 4.0, 8.0, 4.0, 21.0, 23.0, 43.0, 53.0, 60.0, 145.0, 241.0, 463.0, 1141.0, 3827.0, 20005.0, 220300.0, 725354.0, 64551.0, 8596.0, 2081.0, 786.0, 354.0, 173.0, 98.0, 71.0, 38.0, 37.0, 16.0, 8.0, 12.0, 9.0, 14.0, 4.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-81.75, -79.3642578125, -76.978515625, -74.5927734375, -72.20703125, -69.8212890625, -67.435546875, -65.0498046875, -62.6640625, -60.2783203125, -57.892578125, -55.5068359375, -53.12109375, -50.7353515625, -48.349609375, -45.9638671875, -43.578125, -41.1923828125, -38.806640625, -36.4208984375, -34.03515625, -31.6494140625, -29.263671875, -26.8779296875, -24.4921875, -22.1064453125, -19.720703125, -17.3349609375, -14.94921875, -12.5634765625, -10.177734375, -7.7919921875, -5.40625, -3.0205078125, -0.634765625, 1.7509765625, 4.13671875, 6.5224609375, 8.908203125, 11.2939453125, 13.6796875, 16.0654296875, 18.451171875, 20.8369140625, 23.22265625, 25.6083984375, 27.994140625, 30.3798828125, 32.765625, 35.1513671875, 37.537109375, 39.9228515625, 42.30859375, 44.6943359375, 47.080078125, 49.4658203125, 51.8515625, 54.2373046875, 56.623046875, 59.0087890625, 61.39453125, 63.7802734375, 66.166015625, 68.5517578125, 70.9375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 2.0, 5.0, 6.0, 6.0, 5.0, 8.0, 7.0, 18.0, 9.0, 32.0, 29.0, 45.0, 61.0, 76.0, 128.0, 121.0, 107.0, 91.0, 61.0, 41.0, 38.0, 33.0, 14.0, 11.0, 7.0, 3.0, 8.0, 9.0, 2.0, 5.0, 4.0, 1.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.013336181640625, -0.01298224925994873, -0.012628316879272461, -0.012274384498596191, -0.011920452117919922, -0.011566519737243652, -0.011212587356567383, -0.010858654975891113, -0.010504722595214844, -0.010150790214538574, -0.009796857833862305, -0.009442925453186035, -0.009088993072509766, -0.008735060691833496, -0.008381128311157227, -0.008027195930480957, -0.0076732635498046875, -0.007319331169128418, -0.0069653987884521484, -0.006611466407775879, -0.006257534027099609, -0.00590360164642334, -0.00554966926574707, -0.005195736885070801, -0.004841804504394531, -0.004487872123718262, -0.004133939743041992, -0.0037800073623657227, -0.003426074981689453, -0.0030721426010131836, -0.002718210220336914, -0.0023642778396606445, -0.002010345458984375, -0.0016564130783081055, -0.001302480697631836, -0.0009485483169555664, -0.0005946159362792969, -0.00024068355560302734, 0.00011324882507324219, 0.0004671812057495117, 0.0008211135864257812, 0.0011750459671020508, 0.0015289783477783203, 0.0018829107284545898, 0.0022368431091308594, 0.002590775489807129, 0.0029447078704833984, 0.003298640251159668, 0.0036525726318359375, 0.004006505012512207, 0.0043604373931884766, 0.004714369773864746, 0.005068302154541016, 0.005422234535217285, 0.005776166915893555, 0.006130099296569824, 0.006484031677246094, 0.006837964057922363, 0.007191896438598633, 0.007545828819274902, 0.007899761199951172, 0.008253693580627441, 0.008607625961303711, 0.00896155834197998, 0.00931549072265625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 6.0, 7.0, 6.0, 14.0, 18.0, 22.0, 30.0, 36.0, 78.0, 117.0, 217.0, 390.0, 914.0, 2572.0, 12098.0, 176433.0, 793476.0, 53175.0, 5908.0, 1641.0, 615.0, 308.0, 183.0, 103.0, 69.0, 30.0, 30.0, 20.0, 14.0, 4.0, 3.0, 7.0, 2.0, 0.0, 3.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-95.625, -92.75390625, -89.8828125, -87.01171875, -84.140625, -81.26953125, -78.3984375, -75.52734375, -72.65625, -69.78515625, -66.9140625, -64.04296875, -61.171875, -58.30078125, -55.4296875, -52.55859375, -49.6875, -46.81640625, -43.9453125, -41.07421875, -38.203125, -35.33203125, -32.4609375, -29.58984375, -26.71875, -23.84765625, -20.9765625, -18.10546875, -15.234375, -12.36328125, -9.4921875, -6.62109375, -3.75, -0.87890625, 1.9921875, 4.86328125, 7.734375, 10.60546875, 13.4765625, 16.34765625, 19.21875, 22.08984375, 24.9609375, 27.83203125, 30.703125, 33.57421875, 36.4453125, 39.31640625, 42.1875, 45.05859375, 47.9296875, 50.80078125, 53.671875, 56.54296875, 59.4140625, 62.28515625, 65.15625, 68.02734375, 70.8984375, 73.76953125, 76.640625, 79.51171875, 82.3828125, 85.25390625, 88.125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 6.0, 7.0, 13.0, 12.0, 15.0, 20.0, 30.0, 42.0, 66.0, 67.0, 87.0, 104.0, 104.0, 87.0, 84.0, 64.0, 62.0, 43.0, 25.0, 8.0, 16.0, 15.0, 7.0, 8.0, 8.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.03125, -49.94677734375, -47.8623046875, -45.77783203125, -43.693359375, -41.60888671875, -39.5244140625, -37.43994140625, -35.35546875, -33.27099609375, -31.1865234375, -29.10205078125, -27.017578125, -24.93310546875, -22.8486328125, -20.76416015625, -18.6796875, -16.59521484375, -14.5107421875, -12.42626953125, -10.341796875, -8.25732421875, -6.1728515625, -4.08837890625, -2.00390625, 0.08056640625, 2.1650390625, 4.24951171875, 6.333984375, 8.41845703125, 10.5029296875, 12.58740234375, 14.671875, 16.75634765625, 18.8408203125, 20.92529296875, 23.009765625, 25.09423828125, 27.1787109375, 29.26318359375, 31.34765625, 33.43212890625, 35.5166015625, 37.60107421875, 39.685546875, 41.77001953125, 43.8544921875, 45.93896484375, 48.0234375, 50.10791015625, 52.1923828125, 54.27685546875, 56.361328125, 58.44580078125, 60.5302734375, 62.61474609375, 64.69921875, 66.78369140625, 68.8681640625, 70.95263671875, 73.037109375, 75.12158203125, 77.2060546875, 79.29052734375, 81.375]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 7.0, 6.0, 14.0, 20.0, 51.0, 88.0, 147.0, 185.0, 168.0, 123.0, 83.0, 54.0, 22.0, 17.0, 10.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-927.8832397460938, -883.736328125, -839.5894775390625, -795.4425659179688, -751.295654296875, -707.1488037109375, -663.0018920898438, -618.85498046875, -574.7081298828125, -530.5612182617188, -486.41436767578125, -442.2674560546875, -398.1205749511719, -353.97369384765625, -309.8267822265625, -265.6799011230469, -221.53302001953125, -177.38613891601562, -133.23924255371094, -89.09234619140625, -44.945465087890625, -0.798583984375, 43.34832763671875, 87.49520874023438, 131.64208984375, 175.78897094726562, 219.9358673095703, 264.082763671875, 308.2296447753906, 352.37652587890625, 396.5234375, 440.6703186035156, 484.817138671875, 528.9640502929688, 573.1109008789062, 617.2578125, 661.4046630859375, 705.5515747070312, 749.698486328125, 793.8453369140625, 837.9922485351562, 882.13916015625, 926.2860107421875, 970.4329223632812, 1014.579833984375, 1058.7266845703125, 1102.87353515625, 1147.0205078125, 1191.1673583984375, 1235.314208984375, 1279.461181640625, 1323.6080322265625, 1367.7548828125, 1411.90185546875, 1456.0487060546875, 1500.195556640625, 1544.342529296875, 1588.4893798828125, 1632.6363525390625, 1676.783203125, 1720.9300537109375, 1765.076904296875, 1809.223876953125, 1853.3707275390625, 1897.517578125]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 1.0, 5.0, 7.0, 6.0, 6.0, 12.0, 19.0, 18.0, 23.0, 22.0, 23.0, 29.0, 49.0, 38.0, 42.0, 42.0, 63.0, 61.0, 65.0, 50.0, 56.0, 41.0, 44.0, 46.0, 37.0, 28.0, 26.0, 24.0, 29.0, 23.0, 16.0, 13.0, 8.0, 7.0, 5.0, 8.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-674.2063598632812, -649.893310546875, -625.5802001953125, -601.2671508789062, -576.9541015625, -552.6409912109375, -528.3279418945312, -504.014892578125, -479.7018127441406, -455.38873291015625, -431.07568359375, -406.7626037597656, -382.44952392578125, -358.136474609375, -333.8233947753906, -309.51031494140625, -285.197265625, -260.8841857910156, -236.57113647460938, -212.258056640625, -187.9449920654297, -163.63192749023438, -139.31884765625, -115.00578308105469, -90.69271850585938, -66.37965393066406, -42.06658172607422, -17.753509521484375, 6.5595550537109375, 30.87261962890625, 55.185699462890625, 79.49876403808594, 103.811767578125, 128.1248321533203, 152.43789672851562, 176.7509765625, 201.0640411376953, 225.37710571289062, 249.690185546875, 274.00323486328125, 298.3163146972656, 322.62939453125, 346.94244384765625, 371.2555236816406, 395.568603515625, 419.88165283203125, 444.1947326660156, 468.5078125, 492.82086181640625, 517.1339111328125, 541.447021484375, 565.7600708007812, 590.0731201171875, 614.38623046875, 638.6992797851562, 663.0123291015625, 687.325439453125, 711.6384887695312, 735.9515991210938, 760.2646484375, 784.5776977539062, 808.8907470703125, 833.203857421875, 857.5169067382812, 881.8299560546875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 5.0, 7.0, 16.0, 21.0, 38.0, 47.0, 70.0, 107.0, 154.0, 293.0, 448.0, 803.0, 1358.0, 2422.0, 4423.0, 8436.0, 17816.0, 43649.0, 170145.0, 2509608.0, 1253836.0, 114122.0, 35093.0, 15161.0, 7335.0, 3898.0, 2091.0, 1201.0, 682.0, 353.0, 245.0, 133.0, 103.0, 53.0, 46.0, 20.0, 21.0, 7.0, 12.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.9375, -68.7802734375, -66.623046875, -64.4658203125, -62.30859375, -60.1513671875, -57.994140625, -55.8369140625, -53.6796875, -51.5224609375, -49.365234375, -47.2080078125, -45.05078125, -42.8935546875, -40.736328125, -38.5791015625, -36.421875, -34.2646484375, -32.107421875, -29.9501953125, -27.79296875, -25.6357421875, -23.478515625, -21.3212890625, -19.1640625, -17.0068359375, -14.849609375, -12.6923828125, -10.53515625, -8.3779296875, -6.220703125, -4.0634765625, -1.90625, 0.2509765625, 2.408203125, 4.5654296875, 6.72265625, 8.8798828125, 11.037109375, 13.1943359375, 15.3515625, 17.5087890625, 19.666015625, 21.8232421875, 23.98046875, 26.1376953125, 28.294921875, 30.4521484375, 32.609375, 34.7666015625, 36.923828125, 39.0810546875, 41.23828125, 43.3955078125, 45.552734375, 47.7099609375, 49.8671875, 52.0244140625, 54.181640625, 56.3388671875, 58.49609375, 60.6533203125, 62.810546875, 64.9677734375, 67.125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 7.0, 6.0, 7.0, 9.0, 14.0, 15.0, 15.0, 22.0, 29.0, 28.0, 32.0, 37.0, 29.0, 37.0, 41.0, 52.0, 39.0, 57.0, 51.0, 41.0, 64.0, 43.0, 41.0, 44.0, 45.0, 33.0, 31.0, 24.0, 25.0, 16.0, 14.0, 11.0, 11.0, 9.0, 5.0, 3.0, 3.0, 6.0, 2.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.53125, -33.42724609375, -32.3232421875, -31.21923828125, -30.115234375, -29.01123046875, -27.9072265625, -26.80322265625, -25.69921875, -24.59521484375, -23.4912109375, -22.38720703125, -21.283203125, -20.17919921875, -19.0751953125, -17.97119140625, -16.8671875, -15.76318359375, -14.6591796875, -13.55517578125, -12.451171875, -11.34716796875, -10.2431640625, -9.13916015625, -8.03515625, -6.93115234375, -5.8271484375, -4.72314453125, -3.619140625, -2.51513671875, -1.4111328125, -0.30712890625, 0.796875, 1.90087890625, 3.0048828125, 4.10888671875, 5.212890625, 6.31689453125, 7.4208984375, 8.52490234375, 9.62890625, 10.73291015625, 11.8369140625, 12.94091796875, 14.044921875, 15.14892578125, 16.2529296875, 17.35693359375, 18.4609375, 19.56494140625, 20.6689453125, 21.77294921875, 22.876953125, 23.98095703125, 25.0849609375, 26.18896484375, 27.29296875, 28.39697265625, 29.5009765625, 30.60498046875, 31.708984375, 32.81298828125, 33.9169921875, 35.02099609375, 36.125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 4.0, 8.0, 10.0, 11.0, 29.0, 41.0, 43.0, 61.0, 139.0, 242.0, 565.0, 1718.0, 6564.0, 32137.0, 421781.0, 3642319.0, 71948.0, 12074.0, 2874.0, 902.0, 345.0, 179.0, 114.0, 57.0, 33.0, 23.0, 21.0, 15.0, 7.0, 9.0, 5.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-238.375, -231.96875, -225.5625, -219.15625, -212.75, -206.34375, -199.9375, -193.53125, -187.125, -180.71875, -174.3125, -167.90625, -161.5, -155.09375, -148.6875, -142.28125, -135.875, -129.46875, -123.0625, -116.65625, -110.25, -103.84375, -97.4375, -91.03125, -84.625, -78.21875, -71.8125, -65.40625, -59.0, -52.59375, -46.1875, -39.78125, -33.375, -26.96875, -20.5625, -14.15625, -7.75, -1.34375, 5.0625, 11.46875, 17.875, 24.28125, 30.6875, 37.09375, 43.5, 49.90625, 56.3125, 62.71875, 69.125, 75.53125, 81.9375, 88.34375, 94.75, 101.15625, 107.5625, 113.96875, 120.375, 126.78125, 133.1875, 139.59375, 146.0, 152.40625, 158.8125, 165.21875, 171.625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 3.0, 2.0, 7.0, 8.0, 15.0, 14.0, 11.0, 27.0, 24.0, 38.0, 61.0, 75.0, 152.0, 418.0, 1338.0, 1189.0, 349.0, 125.0, 69.0, 41.0, 26.0, 20.0, 17.0, 18.0, 10.0, 4.0, 4.0, 5.0, 3.0, 0.0, 0.0, 0.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-111.4375, -106.3544921875, -101.271484375, -96.1884765625, -91.10546875, -86.0224609375, -80.939453125, -75.8564453125, -70.7734375, -65.6904296875, -60.607421875, -55.5244140625, -50.44140625, -45.3583984375, -40.275390625, -35.1923828125, -30.109375, -25.0263671875, -19.943359375, -14.8603515625, -9.77734375, -4.6943359375, 0.388671875, 5.4716796875, 10.5546875, 15.6376953125, 20.720703125, 25.8037109375, 30.88671875, 35.9697265625, 41.052734375, 46.1357421875, 51.21875, 56.3017578125, 61.384765625, 66.4677734375, 71.55078125, 76.6337890625, 81.716796875, 86.7998046875, 91.8828125, 96.9658203125, 102.048828125, 107.1318359375, 112.21484375, 117.2978515625, 122.380859375, 127.4638671875, 132.546875, 137.6298828125, 142.712890625, 147.7958984375, 152.87890625, 157.9619140625, 163.044921875, 168.1279296875, 173.2109375, 178.2939453125, 183.376953125, 188.4599609375, 193.54296875, 198.6259765625, 203.708984375, 208.7919921875, 213.875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 5.0, 5.0, 8.0, 6.0, 7.0, 9.0, 19.0, 59.0, 90.0, 161.0, 202.0, 182.0, 115.0, 57.0, 28.0, 20.0, 7.0, 5.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1903.1878662109375, -1859.8245849609375, -1816.461181640625, -1773.097900390625, -1729.734619140625, -1686.371337890625, -1643.008056640625, -1599.6446533203125, -1556.2813720703125, -1512.9180908203125, -1469.5546875, -1426.19140625, -1382.828125, -1339.46484375, -1296.1015625, -1252.7381591796875, -1209.3748779296875, -1166.0115966796875, -1122.648193359375, -1079.284912109375, -1035.921630859375, -992.558349609375, -949.1950073242188, -905.8316650390625, -862.4683837890625, -819.1051025390625, -775.7417602539062, -732.37841796875, -689.01513671875, -645.65185546875, -602.2885131835938, -558.9251708984375, -515.5618286132812, -472.1985168457031, -428.835205078125, -385.4718933105469, -342.10858154296875, -298.7452697753906, -255.3819580078125, -212.01864624023438, -168.65533447265625, -125.29202270507812, -81.9287109375, -38.565399169921875, 4.79791259765625, 48.161224365234375, 91.5245361328125, 134.88784790039062, 178.25115966796875, 221.61447143554688, 264.977783203125, 308.3410949707031, 351.70440673828125, 395.0677185058594, 438.4310302734375, 481.7943420410156, 525.1576538085938, 568.52099609375, 611.88427734375, 655.24755859375, 698.6109008789062, 741.9742431640625, 785.3375244140625, 828.7008056640625, 872.0641479492188]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 5.0, 7.0, 12.0, 14.0, 15.0, 13.0, 19.0, 30.0, 27.0, 49.0, 48.0, 46.0, 58.0, 47.0, 60.0, 74.0, 75.0, 62.0, 47.0, 55.0, 37.0, 41.0, 37.0, 31.0, 25.0, 18.0, 20.0, 12.0, 9.0, 7.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-707.8894653320312, -684.757080078125, -661.6246948242188, -638.4923095703125, -615.35986328125, -592.2274780273438, -569.0950927734375, -545.9627075195312, -522.830322265625, -499.69793701171875, -476.5655517578125, -453.4331359863281, -430.3007507324219, -407.1683654785156, -384.03594970703125, -360.903564453125, -337.77117919921875, -314.6387939453125, -291.50640869140625, -268.3739929199219, -245.24160766601562, -222.10922241210938, -198.97682189941406, -175.84442138671875, -152.7120361328125, -129.57965087890625, -106.44725036621094, -83.31485748291016, -60.182464599609375, -37.050071716308594, -13.917678833007812, 9.2147216796875, 32.34716796875, 55.47956085205078, 78.61195373535156, 101.74434661865234, 124.87673950195312, 148.00912475585938, 171.1415252685547, 194.27392578125, 217.40631103515625, 240.5386962890625, 263.67108154296875, 286.8034973144531, 309.9358825683594, 333.0682678222656, 356.20068359375, 379.33306884765625, 402.4654541015625, 425.59783935546875, 448.730224609375, 471.8626403808594, 494.9950256347656, 518.12744140625, 541.2598266601562, 564.3922119140625, 587.5245971679688, 610.656982421875, 633.7893676757812, 656.9217529296875, 680.05419921875, 703.1865844726562, 726.3189697265625, 749.4513549804688, 772.583740234375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 7.0, 14.0, 19.0, 28.0, 43.0, 59.0, 107.0, 175.0, 299.0, 510.0, 890.0, 1769.0, 3388.0, 7198.0, 16091.0, 39352.0, 108506.0, 339984.0, 347554.0, 110761.0, 40463.0, 16564.0, 7341.0, 3499.0, 1719.0, 971.0, 515.0, 288.0, 178.0, 103.0, 60.0, 27.0, 29.0, 16.0, 14.0, 4.0, 6.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-107.8125, -104.642578125, -101.47265625, -98.302734375, -95.1328125, -91.962890625, -88.79296875, -85.623046875, -82.453125, -79.283203125, -76.11328125, -72.943359375, -69.7734375, -66.603515625, -63.43359375, -60.263671875, -57.09375, -53.923828125, -50.75390625, -47.583984375, -44.4140625, -41.244140625, -38.07421875, -34.904296875, -31.734375, -28.564453125, -25.39453125, -22.224609375, -19.0546875, -15.884765625, -12.71484375, -9.544921875, -6.375, -3.205078125, -0.03515625, 3.134765625, 6.3046875, 9.474609375, 12.64453125, 15.814453125, 18.984375, 22.154296875, 25.32421875, 28.494140625, 31.6640625, 34.833984375, 38.00390625, 41.173828125, 44.34375, 47.513671875, 50.68359375, 53.853515625, 57.0234375, 60.193359375, 63.36328125, 66.533203125, 69.703125, 72.873046875, 76.04296875, 79.212890625, 82.3828125, 85.552734375, 88.72265625, 91.892578125, 95.0625]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 5.0, 4.0, 8.0, 12.0, 8.0, 14.0, 13.0, 22.0, 30.0, 23.0, 34.0, 41.0, 33.0, 35.0, 37.0, 52.0, 45.0, 50.0, 56.0, 52.0, 57.0, 51.0, 52.0, 44.0, 49.0, 38.0, 23.0, 22.0, 19.0, 13.0, 11.0, 13.0, 13.0, 8.0, 3.0, 3.0, 3.0, 7.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.40625, -38.1044921875, -36.802734375, -35.5009765625, -34.19921875, -32.8974609375, -31.595703125, -30.2939453125, -28.9921875, -27.6904296875, -26.388671875, -25.0869140625, -23.78515625, -22.4833984375, -21.181640625, -19.8798828125, -18.578125, -17.2763671875, -15.974609375, -14.6728515625, -13.37109375, -12.0693359375, -10.767578125, -9.4658203125, -8.1640625, -6.8623046875, -5.560546875, -4.2587890625, -2.95703125, -1.6552734375, -0.353515625, 0.9482421875, 2.25, 3.5517578125, 4.853515625, 6.1552734375, 7.45703125, 8.7587890625, 10.060546875, 11.3623046875, 12.6640625, 13.9658203125, 15.267578125, 16.5693359375, 17.87109375, 19.1728515625, 20.474609375, 21.7763671875, 23.078125, 24.3798828125, 25.681640625, 26.9833984375, 28.28515625, 29.5869140625, 30.888671875, 32.1904296875, 33.4921875, 34.7939453125, 36.095703125, 37.3974609375, 38.69921875, 40.0009765625, 41.302734375, 42.6044921875, 43.90625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 5.0, 6.0, 5.0, 3.0, 12.0, 14.0, 13.0, 23.0, 29.0, 65.0, 72.0, 95.0, 152.0, 235.0, 413.0, 746.0, 1791.0, 5794.0, 38569.0, 775233.0, 204524.0, 14795.0, 3338.0, 1241.0, 524.0, 318.0, 164.0, 121.0, 91.0, 60.0, 34.0, 18.0, 17.0, 13.0, 12.0, 1.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-310.0, -300.24609375, -290.4921875, -280.73828125, -270.984375, -261.23046875, -251.4765625, -241.72265625, -231.96875, -222.21484375, -212.4609375, -202.70703125, -192.953125, -183.19921875, -173.4453125, -163.69140625, -153.9375, -144.18359375, -134.4296875, -124.67578125, -114.921875, -105.16796875, -95.4140625, -85.66015625, -75.90625, -66.15234375, -56.3984375, -46.64453125, -36.890625, -27.13671875, -17.3828125, -7.62890625, 2.125, 11.87890625, 21.6328125, 31.38671875, 41.140625, 50.89453125, 60.6484375, 70.40234375, 80.15625, 89.91015625, 99.6640625, 109.41796875, 119.171875, 128.92578125, 138.6796875, 148.43359375, 158.1875, 167.94140625, 177.6953125, 187.44921875, 197.203125, 206.95703125, 216.7109375, 226.46484375, 236.21875, 245.97265625, 255.7265625, 265.48046875, 275.234375, 284.98828125, 294.7421875, 304.49609375, 314.25]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 6.0, 3.0, 3.0, 7.0, 10.0, 17.0, 21.0, 30.0, 32.0, 50.0, 53.0, 64.0, 81.0, 85.0, 83.0, 89.0, 84.0, 61.0, 58.0, 50.0, 34.0, 28.0, 24.0, 6.0, 12.0, 4.0, 5.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-298.0, -287.5625, -277.125, -266.6875, -256.25, -245.8125, -235.375, -224.9375, -214.5, -204.0625, -193.625, -183.1875, -172.75, -162.3125, -151.875, -141.4375, -131.0, -120.5625, -110.125, -99.6875, -89.25, -78.8125, -68.375, -57.9375, -47.5, -37.0625, -26.625, -16.1875, -5.75, 4.6875, 15.125, 25.5625, 36.0, 46.4375, 56.875, 67.3125, 77.75, 88.1875, 98.625, 109.0625, 119.5, 129.9375, 140.375, 150.8125, 161.25, 171.6875, 182.125, 192.5625, 203.0, 213.4375, 223.875, 234.3125, 244.75, 255.1875, 265.625, 276.0625, 286.5, 296.9375, 307.375, 317.8125, 328.25, 338.6875, 349.125, 359.5625, 370.0]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 0.0, 6.0, 7.0, 13.0, 23.0, 32.0, 61.0, 133.0, 262.0, 740.0, 4035.0, 115524.0, 911565.0, 13901.0, 1504.0, 400.0, 158.0, 84.0, 45.0, 22.0, 13.0, 10.0, 5.0, 4.0, 3.0, 3.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-239.5, -233.236328125, -226.97265625, -220.708984375, -214.4453125, -208.181640625, -201.91796875, -195.654296875, -189.390625, -183.126953125, -176.86328125, -170.599609375, -164.3359375, -158.072265625, -151.80859375, -145.544921875, -139.28125, -133.017578125, -126.75390625, -120.490234375, -114.2265625, -107.962890625, -101.69921875, -95.435546875, -89.171875, -82.908203125, -76.64453125, -70.380859375, -64.1171875, -57.853515625, -51.58984375, -45.326171875, -39.0625, -32.798828125, -26.53515625, -20.271484375, -14.0078125, -7.744140625, -1.48046875, 4.783203125, 11.046875, 17.310546875, 23.57421875, 29.837890625, 36.1015625, 42.365234375, 48.62890625, 54.892578125, 61.15625, 67.419921875, 73.68359375, 79.947265625, 86.2109375, 92.474609375, 98.73828125, 105.001953125, 111.265625, 117.529296875, 123.79296875, 130.056640625, 136.3203125, 142.583984375, 148.84765625, 155.111328125, 161.375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 11.0, 9.0, 8.0, 20.0, 22.0, 33.0, 74.0, 130.0, 248.0, 182.0, 102.0, 56.0, 31.0, 29.0, 17.0, 10.0, 5.0, 7.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.034027099609375, -0.033251047134399414, -0.03247499465942383, -0.03169894218444824, -0.030922889709472656, -0.03014683723449707, -0.029370784759521484, -0.0285947322845459, -0.027818679809570312, -0.027042627334594727, -0.02626657485961914, -0.025490522384643555, -0.02471446990966797, -0.023938417434692383, -0.023162364959716797, -0.02238631248474121, -0.021610260009765625, -0.02083420753479004, -0.020058155059814453, -0.019282102584838867, -0.01850605010986328, -0.017729997634887695, -0.01695394515991211, -0.016177892684936523, -0.015401840209960938, -0.014625787734985352, -0.013849735260009766, -0.01307368278503418, -0.012297630310058594, -0.011521577835083008, -0.010745525360107422, -0.009969472885131836, -0.00919342041015625, -0.008417367935180664, -0.007641315460205078, -0.006865262985229492, -0.006089210510253906, -0.00531315803527832, -0.004537105560302734, -0.0037610530853271484, -0.0029850006103515625, -0.0022089481353759766, -0.0014328956604003906, -0.0006568431854248047, 0.00011920928955078125, 0.0008952617645263672, 0.0016713142395019531, 0.002447366714477539, 0.003223419189453125, 0.003999471664428711, 0.004775524139404297, 0.005551576614379883, 0.006327629089355469, 0.007103681564331055, 0.00787973403930664, 0.008655786514282227, 0.009431838989257812, 0.010207891464233398, 0.010983943939208984, 0.01175999641418457, 0.012536048889160156, 0.013312101364135742, 0.014088153839111328, 0.014864206314086914, 0.0156402587890625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 1.0, 4.0, 5.0, 9.0, 5.0, 5.0, 13.0, 12.0, 13.0, 22.0, 31.0, 57.0, 75.0, 143.0, 211.0, 397.0, 782.0, 1752.0, 5732.0, 30631.0, 606141.0, 370997.0, 23358.0, 4876.0, 1664.0, 680.0, 347.0, 232.0, 123.0, 66.0, 53.0, 34.0, 18.0, 12.0, 11.0, 4.0, 6.0, 10.0, 7.0, 3.0, 5.0, 2.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-99.9375, -96.70703125, -93.4765625, -90.24609375, -87.015625, -83.78515625, -80.5546875, -77.32421875, -74.09375, -70.86328125, -67.6328125, -64.40234375, -61.171875, -57.94140625, -54.7109375, -51.48046875, -48.25, -45.01953125, -41.7890625, -38.55859375, -35.328125, -32.09765625, -28.8671875, -25.63671875, -22.40625, -19.17578125, -15.9453125, -12.71484375, -9.484375, -6.25390625, -3.0234375, 0.20703125, 3.4375, 6.66796875, 9.8984375, 13.12890625, 16.359375, 19.58984375, 22.8203125, 26.05078125, 29.28125, 32.51171875, 35.7421875, 38.97265625, 42.203125, 45.43359375, 48.6640625, 51.89453125, 55.125, 58.35546875, 61.5859375, 64.81640625, 68.046875, 71.27734375, 74.5078125, 77.73828125, 80.96875, 84.19921875, 87.4296875, 90.66015625, 93.890625, 97.12109375, 100.3515625, 103.58203125, 106.8125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 9.0, 10.0, 8.0, 16.0, 13.0, 14.0, 29.0, 29.0, 37.0, 60.0, 62.0, 81.0, 91.0, 78.0, 73.0, 86.0, 57.0, 62.0, 36.0, 35.0, 19.0, 21.0, 16.0, 10.0, 9.0, 9.0, 6.0, 7.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-67.25, -65.107421875, -62.96484375, -60.822265625, -58.6796875, -56.537109375, -54.39453125, -52.251953125, -50.109375, -47.966796875, -45.82421875, -43.681640625, -41.5390625, -39.396484375, -37.25390625, -35.111328125, -32.96875, -30.826171875, -28.68359375, -26.541015625, -24.3984375, -22.255859375, -20.11328125, -17.970703125, -15.828125, -13.685546875, -11.54296875, -9.400390625, -7.2578125, -5.115234375, -2.97265625, -0.830078125, 1.3125, 3.455078125, 5.59765625, 7.740234375, 9.8828125, 12.025390625, 14.16796875, 16.310546875, 18.453125, 20.595703125, 22.73828125, 24.880859375, 27.0234375, 29.166015625, 31.30859375, 33.451171875, 35.59375, 37.736328125, 39.87890625, 42.021484375, 44.1640625, 46.306640625, 48.44921875, 50.591796875, 52.734375, 54.876953125, 57.01953125, 59.162109375, 61.3046875, 63.447265625, 65.58984375, 67.732421875, 69.875]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 0.0, 2.0, 2.0, 8.0, 11.0, 14.0, 36.0, 36.0, 79.0, 110.0, 171.0, 184.0, 131.0, 91.0, 64.0, 30.0, 17.0, 10.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1598.992919921875, -1557.2374267578125, -1515.48193359375, -1473.7264404296875, -1431.970947265625, -1390.215576171875, -1348.4599609375, -1306.70458984375, -1264.9490966796875, -1223.193603515625, -1181.4381103515625, -1139.6826171875, -1097.9271240234375, -1056.171630859375, -1014.4161987304688, -972.6607666015625, -930.9052124023438, -889.1497192382812, -847.3942260742188, -805.6387939453125, -763.88330078125, -722.1278076171875, -680.372314453125, -638.6168212890625, -596.861328125, -555.1058349609375, -513.350341796875, -471.5948791503906, -429.83941650390625, -388.08392333984375, -346.32843017578125, -304.5729675292969, -262.8175048828125, -221.06202697753906, -179.30654907226562, -137.55105590820312, -95.79557800292969, -54.04010009765625, -12.28460693359375, 29.470855712890625, 71.22634887695312, 112.98182678222656, 154.7373046875, 196.4927978515625, 238.24827575683594, 280.0037536621094, 321.7592468261719, 363.51470947265625, 405.27020263671875, 447.02569580078125, 488.7811584472656, 530.53662109375, 572.2921142578125, 614.047607421875, 655.8031005859375, 697.55859375, 739.3140869140625, 781.069580078125, 822.8250732421875, 864.58056640625, 906.3359985351562, 948.0914916992188, 989.8469848632812, 1031.6024169921875, 1073.35791015625]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 10.0, 35.0, 31.0, 52.0, 62.0, 84.0, 122.0, 147.0, 128.0, 98.0, 78.0, 55.0, 46.0, 23.0, 21.0, 11.0, 6.0, 0.0, 0.0, 2.0], "bins": [-2914.99560546875, -2858.640380859375, -2802.285400390625, -2745.93017578125, -2689.574951171875, -2633.219970703125, -2576.86474609375, -2520.509521484375, -2464.154541015625, -2407.79931640625, -2351.4443359375, -2295.089111328125, -2238.73388671875, -2182.37890625, -2126.023681640625, -2069.66845703125, -2013.313232421875, -1956.9581298828125, -1900.6029052734375, -1844.247802734375, -1787.8927001953125, -1731.5374755859375, -1675.182373046875, -1618.8271484375, -1562.47216796875, -1506.1170654296875, -1449.7618408203125, -1393.40673828125, -1337.0516357421875, -1280.6964111328125, -1224.34130859375, -1167.986083984375, -1111.6309814453125, -1055.27587890625, -998.9207153320312, -942.5655517578125, -886.2103881835938, -829.855224609375, -773.5001220703125, -717.1449584960938, -660.789794921875, -604.4346313476562, -548.0795288085938, -491.724365234375, -435.36920166015625, -379.0140686035156, -322.658935546875, -266.30377197265625, -209.94866943359375, -153.59352111816406, -97.2383804321289, -40.88323974609375, 15.471908569335938, 71.82705688476562, 128.18218994140625, 184.537353515625, 240.89248657226562, 297.24761962890625, 353.602783203125, 409.9579162597656, 466.31304931640625, 522.668212890625, 579.0233154296875, 635.3785400390625, 691.733642578125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 7.0, 3.0, 5.0, 8.0, 8.0, 23.0, 29.0, 42.0, 57.0, 144.0, 248.0, 525.0, 1284.0, 3677.0, 12412.0, 64139.0, 3662844.0, 408067.0, 29314.0, 7451.0, 2364.0, 873.0, 380.0, 171.0, 83.0, 44.0, 28.0, 22.0, 12.0, 9.0, 4.0, 2.0, 3.0, 2.0], "bins": [-239.5, -234.3798828125, -229.259765625, -224.1396484375, -219.01953125, -213.8994140625, -208.779296875, -203.6591796875, -198.5390625, -193.4189453125, -188.298828125, -183.1787109375, -178.05859375, -172.9384765625, -167.818359375, -162.6982421875, -157.578125, -152.4580078125, -147.337890625, -142.2177734375, -137.09765625, -131.9775390625, -126.857421875, -121.7373046875, -116.6171875, -111.4970703125, -106.376953125, -101.2568359375, -96.13671875, -91.0166015625, -85.896484375, -80.7763671875, -75.65625, -70.5361328125, -65.416015625, -60.2958984375, -55.17578125, -50.0556640625, -44.935546875, -39.8154296875, -34.6953125, -29.5751953125, -24.455078125, -19.3349609375, -14.21484375, -9.0947265625, -3.974609375, 1.1455078125, 6.265625, 11.3857421875, 16.505859375, 21.6259765625, 26.74609375, 31.8662109375, 36.986328125, 42.1064453125, 47.2265625, 52.3466796875, 57.466796875, 62.5869140625, 67.70703125, 72.8271484375, 77.947265625, 83.0673828125, 88.1875]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 6.0, 18.0, 45.0, 92.0, 149.0, 216.0, 210.0, 157.0, 64.0, 35.0, 16.0, 8.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-243.25, -238.056640625, -232.86328125, -227.669921875, -222.4765625, -217.283203125, -212.08984375, -206.896484375, -201.703125, -196.509765625, -191.31640625, -186.123046875, -180.9296875, -175.736328125, -170.54296875, -165.349609375, -160.15625, -154.962890625, -149.76953125, -144.576171875, -139.3828125, -134.189453125, -128.99609375, -123.802734375, -118.609375, -113.416015625, -108.22265625, -103.029296875, -97.8359375, -92.642578125, -87.44921875, -82.255859375, -77.0625, -71.869140625, -66.67578125, -61.482421875, -56.2890625, -51.095703125, -45.90234375, -40.708984375, -35.515625, -30.322265625, -25.12890625, -19.935546875, -14.7421875, -9.548828125, -4.35546875, 0.837890625, 6.03125, 11.224609375, 16.41796875, 21.611328125, 26.8046875, 31.998046875, 37.19140625, 42.384765625, 47.578125, 52.771484375, 57.96484375, 63.158203125, 68.3515625, 73.544921875, 78.73828125, 83.931640625, 89.125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 10.0, 6.0, 9.0, 13.0, 24.0, 29.0, 46.0, 71.0, 137.0, 220.0, 361.0, 692.0, 1518.0, 3637.0, 10120.0, 33427.0, 187780.0, 3698228.0, 202974.0, 36602.0, 11210.0, 3984.0, 1578.0, 722.0, 359.0, 196.0, 123.0, 59.0, 49.0, 31.0, 18.0, 23.0, 16.0, 5.0, 1.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-214.25, -208.6875, -203.125, -197.5625, -192.0, -186.4375, -180.875, -175.3125, -169.75, -164.1875, -158.625, -153.0625, -147.5, -141.9375, -136.375, -130.8125, -125.25, -119.6875, -114.125, -108.5625, -103.0, -97.4375, -91.875, -86.3125, -80.75, -75.1875, -69.625, -64.0625, -58.5, -52.9375, -47.375, -41.8125, -36.25, -30.6875, -25.125, -19.5625, -14.0, -8.4375, -2.875, 2.6875, 8.25, 13.8125, 19.375, 24.9375, 30.5, 36.0625, 41.625, 47.1875, 52.75, 58.3125, 63.875, 69.4375, 75.0, 80.5625, 86.125, 91.6875, 97.25, 102.8125, 108.375, 113.9375, 119.5, 125.0625, 130.625, 136.1875, 141.75]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 5.0, 9.0, 7.0, 9.0, 18.0, 24.0, 48.0, 52.0, 98.0, 237.0, 775.0, 1681.0, 618.0, 204.0, 78.0, 55.0, 36.0, 23.0, 23.0, 15.0, 13.0, 14.0, 5.0, 7.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-219.25, -213.396484375, -207.54296875, -201.689453125, -195.8359375, -189.982421875, -184.12890625, -178.275390625, -172.421875, -166.568359375, -160.71484375, -154.861328125, -149.0078125, -143.154296875, -137.30078125, -131.447265625, -125.59375, -119.740234375, -113.88671875, -108.033203125, -102.1796875, -96.326171875, -90.47265625, -84.619140625, -78.765625, -72.912109375, -67.05859375, -61.205078125, -55.3515625, -49.498046875, -43.64453125, -37.791015625, -31.9375, -26.083984375, -20.23046875, -14.376953125, -8.5234375, -2.669921875, 3.18359375, 9.037109375, 14.890625, 20.744140625, 26.59765625, 32.451171875, 38.3046875, 44.158203125, 50.01171875, 55.865234375, 61.71875, 67.572265625, 73.42578125, 79.279296875, 85.1328125, 90.986328125, 96.83984375, 102.693359375, 108.546875, 114.400390625, 120.25390625, 126.107421875, 131.9609375, 137.814453125, 143.66796875, 149.521484375, 155.375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 4.0, 8.0, 8.0, 11.0, 21.0, 34.0, 61.0, 113.0, 188.0, 209.0, 140.0, 84.0, 61.0, 23.0, 18.0, 13.0, 5.0, 4.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1800.4676513671875, -1758.6907958984375, -1716.9140625, -1675.13720703125, -1633.3603515625, -1591.58349609375, -1549.8067626953125, -1508.0299072265625, -1466.253173828125, -1424.476318359375, -1382.6995849609375, -1340.9227294921875, -1299.1458740234375, -1257.369140625, -1215.59228515625, -1173.8154296875, -1132.03857421875, -1090.26171875, -1048.4849853515625, -1006.7081298828125, -964.9312744140625, -923.1544799804688, -881.377685546875, -839.600830078125, -797.8240356445312, -756.0472412109375, -714.2703857421875, -672.4935913085938, -630.716796875, -588.93994140625, -547.1631469726562, -505.3863220214844, -463.609375, -421.8325500488281, -380.05572509765625, -338.2789306640625, -296.5021057128906, -254.72528076171875, -212.94847106933594, -171.17166137695312, -129.39483642578125, -87.6180191040039, -45.84120178222656, -4.064384460449219, 37.712432861328125, 79.4892578125, 121.26606750488281, 163.04287719726562, 204.8197021484375, 246.59652709960938, 288.37335205078125, 330.150146484375, 371.9269714355469, 413.70379638671875, 455.4805908203125, 497.2574157714844, 539.0342407226562, 580.81103515625, 622.587890625, 664.3646850585938, 706.1414794921875, 747.9183349609375, 789.6951293945312, 831.471923828125, 873.248779296875]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 3.0, 3.0, 3.0, 6.0, 8.0, 14.0, 15.0, 22.0, 18.0, 23.0, 27.0, 33.0, 42.0, 57.0, 55.0, 59.0, 70.0, 64.0, 63.0, 62.0, 42.0, 49.0, 48.0, 43.0, 33.0, 29.0, 29.0, 14.0, 19.0, 15.0, 15.0, 9.0, 9.0, 7.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-703.7635498046875, -680.7233276367188, -657.68310546875, -634.6429443359375, -611.6027221679688, -588.5625, -565.5223388671875, -542.4821166992188, -519.44189453125, -496.40167236328125, -473.3614807128906, -450.3212890625, -427.28106689453125, -404.2408447265625, -381.2006530761719, -358.16046142578125, -335.1202392578125, -312.08001708984375, -289.0398254394531, -265.9996337890625, -242.95941162109375, -219.91920471191406, -196.87899780273438, -173.8387908935547, -150.798583984375, -127.75837707519531, -104.71817016601562, -81.67796325683594, -58.63775634765625, -35.59754943847656, -12.557342529296875, 10.482864379882812, 33.5230712890625, 56.56327819824219, 79.60348510742188, 102.64369201660156, 125.68389892578125, 148.72410583496094, 171.76431274414062, 194.8045196533203, 217.8447265625, 240.8849334716797, 263.9251403808594, 286.96533203125, 310.00555419921875, 333.0457763671875, 356.0859680175781, 379.12615966796875, 402.1663818359375, 425.20660400390625, 448.2467956542969, 471.2869873046875, 494.32720947265625, 517.367431640625, 540.4075927734375, 563.4478149414062, 586.488037109375, 609.5282592773438, 632.5684814453125, 655.608642578125, 678.6488647460938, 701.6890869140625, 724.729248046875, 747.7694702148438, 770.8096923828125]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 7.0, 8.0, 13.0, 13.0, 22.0, 26.0, 41.0, 51.0, 77.0, 120.0, 222.0, 411.0, 694.0, 1324.0, 2745.0, 6421.0, 15894.0, 42569.0, 135572.0, 441416.0, 276089.0, 78751.0, 26974.0, 10404.0, 4316.0, 1980.0, 983.0, 535.0, 330.0, 184.0, 128.0, 67.0, 46.0, 33.0, 30.0, 19.0, 6.0, 10.0, 7.0, 8.0, 3.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-130.875, -126.8818359375, -122.888671875, -118.8955078125, -114.90234375, -110.9091796875, -106.916015625, -102.9228515625, -98.9296875, -94.9365234375, -90.943359375, -86.9501953125, -82.95703125, -78.9638671875, -74.970703125, -70.9775390625, -66.984375, -62.9912109375, -58.998046875, -55.0048828125, -51.01171875, -47.0185546875, -43.025390625, -39.0322265625, -35.0390625, -31.0458984375, -27.052734375, -23.0595703125, -19.06640625, -15.0732421875, -11.080078125, -7.0869140625, -3.09375, 0.8994140625, 4.892578125, 8.8857421875, 12.87890625, 16.8720703125, 20.865234375, 24.8583984375, 28.8515625, 32.8447265625, 36.837890625, 40.8310546875, 44.82421875, 48.8173828125, 52.810546875, 56.8037109375, 60.796875, 64.7900390625, 68.783203125, 72.7763671875, 76.76953125, 80.7626953125, 84.755859375, 88.7490234375, 92.7421875, 96.7353515625, 100.728515625, 104.7216796875, 108.71484375, 112.7080078125, 116.701171875, 120.6943359375, 124.6875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 3.0, 6.0, 15.0, 19.0, 27.0, 42.0, 56.0, 74.0, 83.0, 97.0, 103.0, 124.0, 97.0, 80.0, 53.0, 45.0, 34.0, 18.0, 24.0, 9.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-146.875, -143.724609375, -140.57421875, -137.423828125, -134.2734375, -131.123046875, -127.97265625, -124.822265625, -121.671875, -118.521484375, -115.37109375, -112.220703125, -109.0703125, -105.919921875, -102.76953125, -99.619140625, -96.46875, -93.318359375, -90.16796875, -87.017578125, -83.8671875, -80.716796875, -77.56640625, -74.416015625, -71.265625, -68.115234375, -64.96484375, -61.814453125, -58.6640625, -55.513671875, -52.36328125, -49.212890625, -46.0625, -42.912109375, -39.76171875, -36.611328125, -33.4609375, -30.310546875, -27.16015625, -24.009765625, -20.859375, -17.708984375, -14.55859375, -11.408203125, -8.2578125, -5.107421875, -1.95703125, 1.193359375, 4.34375, 7.494140625, 10.64453125, 13.794921875, 16.9453125, 20.095703125, 23.24609375, 26.396484375, 29.546875, 32.697265625, 35.84765625, 38.998046875, 42.1484375, 45.298828125, 48.44921875, 51.599609375, 54.75]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 5.0, 5.0, 15.0, 18.0, 18.0, 24.0, 46.0, 45.0, 81.0, 90.0, 158.0, 196.0, 394.0, 681.0, 1279.0, 2732.0, 7633.0, 28625.0, 183294.0, 700896.0, 94050.0, 18161.0, 5443.0, 2136.0, 984.0, 531.0, 329.0, 208.0, 126.0, 96.0, 74.0, 54.0, 36.0, 29.0, 9.0, 16.0, 8.0, 10.0, 10.0, 6.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-205.0, -198.013671875, -191.02734375, -184.041015625, -177.0546875, -170.068359375, -163.08203125, -156.095703125, -149.109375, -142.123046875, -135.13671875, -128.150390625, -121.1640625, -114.177734375, -107.19140625, -100.205078125, -93.21875, -86.232421875, -79.24609375, -72.259765625, -65.2734375, -58.287109375, -51.30078125, -44.314453125, -37.328125, -30.341796875, -23.35546875, -16.369140625, -9.3828125, -2.396484375, 4.58984375, 11.576171875, 18.5625, 25.548828125, 32.53515625, 39.521484375, 46.5078125, 53.494140625, 60.48046875, 67.466796875, 74.453125, 81.439453125, 88.42578125, 95.412109375, 102.3984375, 109.384765625, 116.37109375, 123.357421875, 130.34375, 137.330078125, 144.31640625, 151.302734375, 158.2890625, 165.275390625, 172.26171875, 179.248046875, 186.234375, 193.220703125, 200.20703125, 207.193359375, 214.1796875, 221.166015625, 228.15234375, 235.138671875, 242.125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 2.0, 5.0, 1.0, 9.0, 11.0, 9.0, 14.0, 40.0, 41.0, 55.0, 57.0, 77.0, 101.0, 103.0, 92.0, 83.0, 72.0, 70.0, 55.0, 39.0, 27.0, 20.0, 8.0, 6.0, 3.0, 4.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-363.0, -350.74609375, -338.4921875, -326.23828125, -313.984375, -301.73046875, -289.4765625, -277.22265625, -264.96875, -252.71484375, -240.4609375, -228.20703125, -215.953125, -203.69921875, -191.4453125, -179.19140625, -166.9375, -154.68359375, -142.4296875, -130.17578125, -117.921875, -105.66796875, -93.4140625, -81.16015625, -68.90625, -56.65234375, -44.3984375, -32.14453125, -19.890625, -7.63671875, 4.6171875, 16.87109375, 29.125, 41.37890625, 53.6328125, 65.88671875, 78.140625, 90.39453125, 102.6484375, 114.90234375, 127.15625, 139.41015625, 151.6640625, 163.91796875, 176.171875, 188.42578125, 200.6796875, 212.93359375, 225.1875, 237.44140625, 249.6953125, 261.94921875, 274.203125, 286.45703125, 298.7109375, 310.96484375, 323.21875, 335.47265625, 347.7265625, 359.98046875, 372.234375, 384.48828125, 396.7421875, 408.99609375, 421.25]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 2.0, 6.0, 11.0, 15.0, 21.0, 30.0, 58.0, 194.0, 837.0, 7051.0, 876779.0, 158910.0, 3637.0, 675.0, 174.0, 74.0, 26.0, 16.0, 10.0, 11.0, 6.0, 1.0, 5.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-384.25, -374.1015625, -363.953125, -353.8046875, -343.65625, -333.5078125, -323.359375, -313.2109375, -303.0625, -292.9140625, -282.765625, -272.6171875, -262.46875, -252.3203125, -242.171875, -232.0234375, -221.875, -211.7265625, -201.578125, -191.4296875, -181.28125, -171.1328125, -160.984375, -150.8359375, -140.6875, -130.5390625, -120.390625, -110.2421875, -100.09375, -89.9453125, -79.796875, -69.6484375, -59.5, -49.3515625, -39.203125, -29.0546875, -18.90625, -8.7578125, 1.390625, 11.5390625, 21.6875, 31.8359375, 41.984375, 52.1328125, 62.28125, 72.4296875, 82.578125, 92.7265625, 102.875, 113.0234375, 123.171875, 133.3203125, 143.46875, 153.6171875, 163.765625, 173.9140625, 184.0625, 194.2109375, 204.359375, 214.5078125, 224.65625, 234.8046875, 244.953125, 255.1015625, 265.25]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 4.0, 8.0, 10.0, 16.0, 14.0, 35.0, 47.0, 92.0, 137.0, 225.0, 176.0, 94.0, 45.0, 37.0, 23.0, 13.0, 10.0, 4.0, 10.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.036834716796875, -0.03592681884765625, -0.0350189208984375, -0.03411102294921875, -0.033203125, -0.03229522705078125, -0.0313873291015625, -0.03047943115234375, -0.029571533203125, -0.02866363525390625, -0.0277557373046875, -0.02684783935546875, -0.02593994140625, -0.02503204345703125, -0.0241241455078125, -0.02321624755859375, -0.022308349609375, -0.02140045166015625, -0.0204925537109375, -0.01958465576171875, -0.0186767578125, -0.01776885986328125, -0.0168609619140625, -0.01595306396484375, -0.015045166015625, -0.01413726806640625, -0.0132293701171875, -0.01232147216796875, -0.01141357421875, -0.01050567626953125, -0.0095977783203125, -0.00868988037109375, -0.007781982421875, -0.00687408447265625, -0.0059661865234375, -0.00505828857421875, -0.004150390625, -0.00324249267578125, -0.0023345947265625, -0.00142669677734375, -0.000518798828125, 0.00038909912109375, 0.0012969970703125, 0.00220489501953125, 0.00311279296875, 0.00402069091796875, 0.0049285888671875, 0.00583648681640625, 0.006744384765625, 0.00765228271484375, 0.0085601806640625, 0.00946807861328125, 0.0103759765625, 0.01128387451171875, 0.0121917724609375, 0.01309967041015625, 0.014007568359375, 0.01491546630859375, 0.0158233642578125, 0.01673126220703125, 0.01763916015625, 0.01854705810546875, 0.0194549560546875, 0.02036285400390625, 0.021270751953125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 1.0, 2.0, 6.0, 9.0, 12.0, 22.0, 31.0, 45.0, 90.0, 235.0, 703.0, 3599.0, 115778.0, 914658.0, 11323.0, 1333.0, 380.0, 144.0, 69.0, 43.0, 19.0, 17.0, 11.0, 6.0, 5.0, 5.0, 0.0, 4.0, 1.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-276.25, -268.177734375, -260.10546875, -252.033203125, -243.9609375, -235.888671875, -227.81640625, -219.744140625, -211.671875, -203.599609375, -195.52734375, -187.455078125, -179.3828125, -171.310546875, -163.23828125, -155.166015625, -147.09375, -139.021484375, -130.94921875, -122.876953125, -114.8046875, -106.732421875, -98.66015625, -90.587890625, -82.515625, -74.443359375, -66.37109375, -58.298828125, -50.2265625, -42.154296875, -34.08203125, -26.009765625, -17.9375, -9.865234375, -1.79296875, 6.279296875, 14.3515625, 22.423828125, 30.49609375, 38.568359375, 46.640625, 54.712890625, 62.78515625, 70.857421875, 78.9296875, 87.001953125, 95.07421875, 103.146484375, 111.21875, 119.291015625, 127.36328125, 135.435546875, 143.5078125, 151.580078125, 159.65234375, 167.724609375, 175.796875, 183.869140625, 191.94140625, 200.013671875, 208.0859375, 216.158203125, 224.23046875, 232.302734375, 240.375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 5.0, 16.0, 23.0, 48.0, 76.0, 136.0, 216.0, 224.0, 127.0, 66.0, 31.0, 19.0, 13.0, 5.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-282.0, -276.1240234375, -270.248046875, -264.3720703125, -258.49609375, -252.6201171875, -246.744140625, -240.8681640625, -234.9921875, -229.1162109375, -223.240234375, -217.3642578125, -211.48828125, -205.6123046875, -199.736328125, -193.8603515625, -187.984375, -182.1083984375, -176.232421875, -170.3564453125, -164.48046875, -158.6044921875, -152.728515625, -146.8525390625, -140.9765625, -135.1005859375, -129.224609375, -123.3486328125, -117.47265625, -111.5966796875, -105.720703125, -99.8447265625, -93.96875, -88.0927734375, -82.216796875, -76.3408203125, -70.46484375, -64.5888671875, -58.712890625, -52.8369140625, -46.9609375, -41.0849609375, -35.208984375, -29.3330078125, -23.45703125, -17.5810546875, -11.705078125, -5.8291015625, 0.046875, 5.9228515625, 11.798828125, 17.6748046875, 23.55078125, 29.4267578125, 35.302734375, 41.1787109375, 47.0546875, 52.9306640625, 58.806640625, 64.6826171875, 70.55859375, 76.4345703125, 82.310546875, 88.1865234375, 94.0625]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 3.0, 5.0, 17.0, 22.0, 44.0, 65.0, 119.0, 161.0, 204.0, 120.0, 85.0, 77.0, 26.0, 15.0, 20.0, 8.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1758.501953125, -1710.1318359375, -1661.7615966796875, -1613.3914794921875, -1565.0213623046875, -1516.6512451171875, -1468.281005859375, -1419.910888671875, -1371.540771484375, -1323.170654296875, -1274.8004150390625, -1226.4302978515625, -1178.0601806640625, -1129.6900634765625, -1081.31982421875, -1032.94970703125, -984.5795288085938, -936.2093505859375, -887.8392333984375, -839.4690551757812, -791.0989379882812, -742.728759765625, -694.358642578125, -645.9884643554688, -597.6182861328125, -549.2481079101562, -500.87799072265625, -452.5078125, -404.1376953125, -355.76751708984375, -307.3973693847656, -259.0272216796875, -210.6571044921875, -162.28695678710938, -113.91680145263672, -65.54664611816406, -17.176498413085938, 31.193649291992188, 79.56381225585938, 127.9339599609375, 176.30410766601562, 224.67425537109375, 273.0444030761719, 321.41455078125, 369.78472900390625, 418.15484619140625, 466.5250244140625, 514.8951416015625, 563.2653198242188, 611.635498046875, 660.005615234375, 708.3757934570312, 756.7459106445312, 805.1160888671875, 853.4862060546875, 901.8563842773438, 950.2265625, 998.5967407226562, 1046.9669189453125, 1095.3370361328125, 1143.7071533203125, 1192.0772705078125, 1240.447509765625, 1288.817626953125, 1337.187744140625]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 10.0, 9.0, 16.0, 12.0, 24.0, 31.0, 37.0, 42.0, 72.0, 77.0, 92.0, 94.0, 111.0, 72.0, 68.0, 55.0, 50.0, 31.0, 25.0, 24.0, 19.0, 15.0, 7.0, 8.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1902.5157470703125, -1856.0445556640625, -1809.5733642578125, -1763.102294921875, -1716.631103515625, -1670.159912109375, -1623.688720703125, -1577.217529296875, -1530.746337890625, -1484.275146484375, -1437.803955078125, -1391.332763671875, -1344.8616943359375, -1298.3905029296875, -1251.9193115234375, -1205.4481201171875, -1158.97705078125, -1112.505859375, -1066.03466796875, -1019.5635375976562, -973.0924072265625, -926.6212158203125, -880.1500244140625, -833.6788330078125, -787.2077026367188, -740.7365112304688, -694.265380859375, -647.794189453125, -601.322998046875, -554.8518676757812, -508.38067626953125, -461.9095153808594, -415.4383544921875, -368.9671936035156, -322.49603271484375, -276.02484130859375, -229.55368041992188, -183.08251953125, -136.611328125, -90.14016723632812, -43.66900634765625, 2.8021621704101562, 49.27333068847656, 95.7445068359375, 142.21566772460938, 188.68682861328125, 235.15802001953125, 281.6291809082031, 328.100341796875, 374.5715026855469, 421.04266357421875, 467.51385498046875, 513.9849853515625, 560.4561767578125, 606.9273681640625, 653.3985595703125, 699.8696899414062, 746.3408813476562, 792.81201171875, 839.283203125, 885.75439453125, 932.2255249023438, 978.6967163085938, 1025.1678466796875, 1071.6390380859375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 3.0, 1.0, 6.0, 4.0, 0.0, 3.0, 9.0, 10.0, 4.0, 6.0, 14.0, 12.0, 13.0, 15.0, 24.0, 36.0, 63.0, 116.0, 251.0, 707.0, 2206.0, 7928.0, 42408.0, 1162027.0, 2884914.0, 74601.0, 12481.0, 3598.0, 1452.0, 711.0, 348.0, 164.0, 89.0, 31.0, 13.0, 13.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-229.125, -223.8115234375, -218.498046875, -213.1845703125, -207.87109375, -202.5576171875, -197.244140625, -191.9306640625, -186.6171875, -181.3037109375, -175.990234375, -170.6767578125, -165.36328125, -160.0498046875, -154.736328125, -149.4228515625, -144.109375, -138.7958984375, -133.482421875, -128.1689453125, -122.85546875, -117.5419921875, -112.228515625, -106.9150390625, -101.6015625, -96.2880859375, -90.974609375, -85.6611328125, -80.34765625, -75.0341796875, -69.720703125, -64.4072265625, -59.09375, -53.7802734375, -48.466796875, -43.1533203125, -37.83984375, -32.5263671875, -27.212890625, -21.8994140625, -16.5859375, -11.2724609375, -5.958984375, -0.6455078125, 4.66796875, 9.9814453125, 15.294921875, 20.6083984375, 25.921875, 31.2353515625, 36.548828125, 41.8623046875, 47.17578125, 52.4892578125, 57.802734375, 63.1162109375, 68.4296875, 73.7431640625, 79.056640625, 84.3701171875, 89.68359375, 94.9970703125, 100.310546875, 105.6240234375, 110.9375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 10.0, 16.0, 50.0, 125.0, 183.0, 248.0, 206.0, 116.0, 44.0, 13.0, 4.0, 2.0, 2.0], "bins": [-380.0, -373.26123046875, -366.5224609375, -359.78369140625, -353.044921875, -346.30615234375, -339.5673828125, -332.82861328125, -326.08984375, -319.35107421875, -312.6123046875, -305.87353515625, -299.134765625, -292.39599609375, -285.6572265625, -278.91845703125, -272.1796875, -265.44091796875, -258.7021484375, -251.96337890625, -245.224609375, -238.48583984375, -231.7470703125, -225.00830078125, -218.26953125, -211.53076171875, -204.7919921875, -198.05322265625, -191.314453125, -184.57568359375, -177.8369140625, -171.09814453125, -164.359375, -157.62060546875, -150.8818359375, -144.14306640625, -137.404296875, -130.66552734375, -123.9267578125, -117.18798828125, -110.44921875, -103.71044921875, -96.9716796875, -90.23291015625, -83.494140625, -76.75537109375, -70.0166015625, -63.27783203125, -56.5390625, -49.80029296875, -43.0615234375, -36.32275390625, -29.583984375, -22.84521484375, -16.1064453125, -9.36767578125, -2.62890625, 4.10986328125, 10.8486328125, 17.58740234375, 24.326171875, 31.06494140625, 37.8037109375, 44.54248046875, 51.28125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 8.0, 4.0, 4.0, 7.0, 12.0, 14.0, 18.0, 32.0, 42.0, 55.0, 109.0, 181.0, 301.0, 584.0, 1294.0, 3150.0, 8987.0, 32498.0, 199753.0, 3430377.0, 438389.0, 54815.0, 14409.0, 5072.0, 2081.0, 935.0, 494.0, 286.0, 133.0, 88.0, 49.0, 29.0, 26.0, 17.0, 10.0, 11.0, 2.0, 7.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-161.375, -155.740234375, -150.10546875, -144.470703125, -138.8359375, -133.201171875, -127.56640625, -121.931640625, -116.296875, -110.662109375, -105.02734375, -99.392578125, -93.7578125, -88.123046875, -82.48828125, -76.853515625, -71.21875, -65.583984375, -59.94921875, -54.314453125, -48.6796875, -43.044921875, -37.41015625, -31.775390625, -26.140625, -20.505859375, -14.87109375, -9.236328125, -3.6015625, 2.033203125, 7.66796875, 13.302734375, 18.9375, 24.572265625, 30.20703125, 35.841796875, 41.4765625, 47.111328125, 52.74609375, 58.380859375, 64.015625, 69.650390625, 75.28515625, 80.919921875, 86.5546875, 92.189453125, 97.82421875, 103.458984375, 109.09375, 114.728515625, 120.36328125, 125.998046875, 131.6328125, 137.267578125, 142.90234375, 148.537109375, 154.171875, 159.806640625, 165.44140625, 171.076171875, 176.7109375, 182.345703125, 187.98046875, 193.615234375, 199.25]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 2.0, 2.0, 6.0, 10.0, 13.0, 9.0, 22.0, 23.0, 31.0, 45.0, 76.0, 94.0, 190.0, 370.0, 778.0, 998.0, 618.0, 290.0, 151.0, 96.0, 57.0, 47.0, 35.0, 30.0, 19.0, 13.0, 10.0, 12.0, 8.0, 5.0, 2.0, 4.0, 5.0, 2.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-203.75, -197.44921875, -191.1484375, -184.84765625, -178.546875, -172.24609375, -165.9453125, -159.64453125, -153.34375, -147.04296875, -140.7421875, -134.44140625, -128.140625, -121.83984375, -115.5390625, -109.23828125, -102.9375, -96.63671875, -90.3359375, -84.03515625, -77.734375, -71.43359375, -65.1328125, -58.83203125, -52.53125, -46.23046875, -39.9296875, -33.62890625, -27.328125, -21.02734375, -14.7265625, -8.42578125, -2.125, 4.17578125, 10.4765625, 16.77734375, 23.078125, 29.37890625, 35.6796875, 41.98046875, 48.28125, 54.58203125, 60.8828125, 67.18359375, 73.484375, 79.78515625, 86.0859375, 92.38671875, 98.6875, 104.98828125, 111.2890625, 117.58984375, 123.890625, 130.19140625, 136.4921875, 142.79296875, 149.09375, 155.39453125, 161.6953125, 167.99609375, 174.296875, 180.59765625, 186.8984375, 193.19921875, 199.5]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 6.0, 9.0, 26.0, 69.0, 170.0, 305.0, 250.0, 105.0, 27.0, 18.0, 7.0, 8.0, 0.0, 3.0, 4.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1206.462890625, -1117.5601806640625, -1028.657470703125, -939.7546997070312, -850.8519897460938, -761.9492797851562, -673.0465087890625, -584.143798828125, -495.2410888671875, -406.33837890625, -317.4356384277344, -228.53289794921875, -139.63018798828125, -50.72747802734375, 38.17529296875, 127.0780029296875, 215.980712890625, 304.8834228515625, 393.7861633300781, 482.68890380859375, 571.5916137695312, 660.4943237304688, 749.3970947265625, 838.2998046875, 927.2025146484375, 1016.105224609375, 1105.0079345703125, 1193.91064453125, 1282.8134765625, 1371.716064453125, 1460.618896484375, 1549.5216064453125, 1638.42431640625, 1727.3270263671875, 1816.229736328125, 1905.132568359375, 1994.03515625, 2082.93798828125, 2171.8408203125, 2260.743408203125, 2349.64599609375, 2438.548828125, 2527.451416015625, 2616.354248046875, 2705.2568359375, 2794.15966796875, 2883.0625, 2971.965087890625, 3060.867919921875, 3149.770751953125, 3238.67333984375, 3327.576171875, 3416.478759765625, 3505.381591796875, 3594.2841796875, 3683.18701171875, 3772.08984375, 3860.99267578125, 3949.895263671875, 4038.798095703125, 4127.70068359375, 4216.603515625, 4305.50634765625, 4394.4091796875, 4483.3115234375]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 16.0, 30.0, 42.0, 50.0, 83.0, 99.0, 117.0, 111.0, 109.0, 112.0, 78.0, 57.0, 35.0, 17.0, 25.0, 15.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1464.210205078125, -1400.0552978515625, -1335.900390625, -1271.7454833984375, -1207.590576171875, -1143.435546875, -1079.2806396484375, -1015.125732421875, -950.9708251953125, -886.81591796875, -822.6610107421875, -758.5060424804688, -694.3511352539062, -630.1962280273438, -566.041259765625, -501.8863525390625, -437.7314453125, -373.5765380859375, -309.4216003417969, -245.2666778564453, -181.11175537109375, -116.95684814453125, -52.801910400390625, 11.35302734375, 75.5079345703125, 139.66285705566406, 203.81777954101562, 267.97271728515625, 332.12762451171875, 396.28253173828125, 460.4374694824219, 524.5924072265625, 588.747314453125, 652.9022216796875, 717.05712890625, 781.2120971679688, 845.3670043945312, 909.5219116210938, 973.6768798828125, 1037.831787109375, 1101.9866943359375, 1166.1416015625, 1230.2965087890625, 1294.451416015625, 1358.6064453125, 1422.76123046875, 1486.916259765625, 1551.0711669921875, 1615.22607421875, 1679.3809814453125, 1743.535888671875, 1807.6907958984375, 1871.845703125, 1936.000732421875, 2000.1556396484375, 2064.310546875, 2128.46533203125, 2192.620361328125, 2256.775146484375, 2320.93017578125, 2385.0849609375, 2449.239990234375, 2513.394775390625, 2577.5498046875, 2641.704833984375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 5.0, 3.0, 5.0, 16.0, 16.0, 20.0, 46.0, 78.0, 103.0, 213.0, 438.0, 898.0, 1846.0, 4439.0, 11952.0, 36559.0, 123193.0, 418709.0, 318595.0, 88664.0, 27233.0, 9122.0, 3469.0, 1444.0, 656.0, 387.0, 195.0, 97.0, 61.0, 36.0, 15.0, 19.0, 9.0, 6.0, 3.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-148.0, -143.044921875, -138.08984375, -133.134765625, -128.1796875, -123.224609375, -118.26953125, -113.314453125, -108.359375, -103.404296875, -98.44921875, -93.494140625, -88.5390625, -83.583984375, -78.62890625, -73.673828125, -68.71875, -63.763671875, -58.80859375, -53.853515625, -48.8984375, -43.943359375, -38.98828125, -34.033203125, -29.078125, -24.123046875, -19.16796875, -14.212890625, -9.2578125, -4.302734375, 0.65234375, 5.607421875, 10.5625, 15.517578125, 20.47265625, 25.427734375, 30.3828125, 35.337890625, 40.29296875, 45.248046875, 50.203125, 55.158203125, 60.11328125, 65.068359375, 70.0234375, 74.978515625, 79.93359375, 84.888671875, 89.84375, 94.798828125, 99.75390625, 104.708984375, 109.6640625, 114.619140625, 119.57421875, 124.529296875, 129.484375, 134.439453125, 139.39453125, 144.349609375, 149.3046875, 154.259765625, 159.21484375, 164.169921875, 169.125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 8.0, 9.0, 10.0, 13.0, 22.0, 22.0, 35.0, 39.0, 50.0, 63.0, 77.0, 82.0, 71.0, 91.0, 73.0, 65.0, 74.0, 43.0, 36.0, 32.0, 27.0, 25.0, 17.0, 12.0, 2.0, 2.0, 7.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-119.3125, -116.6552734375, -113.998046875, -111.3408203125, -108.68359375, -106.0263671875, -103.369140625, -100.7119140625, -98.0546875, -95.3974609375, -92.740234375, -90.0830078125, -87.42578125, -84.7685546875, -82.111328125, -79.4541015625, -76.796875, -74.1396484375, -71.482421875, -68.8251953125, -66.16796875, -63.5107421875, -60.853515625, -58.1962890625, -55.5390625, -52.8818359375, -50.224609375, -47.5673828125, -44.91015625, -42.2529296875, -39.595703125, -36.9384765625, -34.28125, -31.6240234375, -28.966796875, -26.3095703125, -23.65234375, -20.9951171875, -18.337890625, -15.6806640625, -13.0234375, -10.3662109375, -7.708984375, -5.0517578125, -2.39453125, 0.2626953125, 2.919921875, 5.5771484375, 8.234375, 10.8916015625, 13.548828125, 16.2060546875, 18.86328125, 21.5205078125, 24.177734375, 26.8349609375, 29.4921875, 32.1494140625, 34.806640625, 37.4638671875, 40.12109375, 42.7783203125, 45.435546875, 48.0927734375, 50.75]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 4.0, 2.0, 6.0, 1.0, 4.0, 5.0, 5.0, 7.0, 14.0, 15.0, 26.0, 34.0, 39.0, 60.0, 93.0, 123.0, 211.0, 343.0, 527.0, 904.0, 1632.0, 3643.0, 13583.0, 113976.0, 807769.0, 86826.0, 11555.0, 3425.0, 1554.0, 781.0, 471.0, 290.0, 206.0, 147.0, 97.0, 49.0, 35.0, 33.0, 15.0, 13.0, 7.0, 8.0, 2.0, 2.0, 10.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-371.75, -360.29296875, -348.8359375, -337.37890625, -325.921875, -314.46484375, -303.0078125, -291.55078125, -280.09375, -268.63671875, -257.1796875, -245.72265625, -234.265625, -222.80859375, -211.3515625, -199.89453125, -188.4375, -176.98046875, -165.5234375, -154.06640625, -142.609375, -131.15234375, -119.6953125, -108.23828125, -96.78125, -85.32421875, -73.8671875, -62.41015625, -50.953125, -39.49609375, -28.0390625, -16.58203125, -5.125, 6.33203125, 17.7890625, 29.24609375, 40.703125, 52.16015625, 63.6171875, 75.07421875, 86.53125, 97.98828125, 109.4453125, 120.90234375, 132.359375, 143.81640625, 155.2734375, 166.73046875, 178.1875, 189.64453125, 201.1015625, 212.55859375, 224.015625, 235.47265625, 246.9296875, 258.38671875, 269.84375, 281.30078125, 292.7578125, 304.21484375, 315.671875, 327.12890625, 338.5859375, 350.04296875, 361.5]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 1.0, 2.0, 11.0, 5.0, 15.0, 11.0, 17.0, 19.0, 25.0, 43.0, 49.0, 56.0, 70.0, 60.0, 80.0, 81.0, 74.0, 86.0, 68.0, 52.0, 51.0, 39.0, 30.0, 23.0, 8.0, 10.0, 7.0, 8.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-256.25, -242.17578125, -228.1015625, -214.02734375, -199.953125, -185.87890625, -171.8046875, -157.73046875, -143.65625, -129.58203125, -115.5078125, -101.43359375, -87.359375, -73.28515625, -59.2109375, -45.13671875, -31.0625, -16.98828125, -2.9140625, 11.16015625, 25.234375, 39.30859375, 53.3828125, 67.45703125, 81.53125, 95.60546875, 109.6796875, 123.75390625, 137.828125, 151.90234375, 165.9765625, 180.05078125, 194.125, 208.19921875, 222.2734375, 236.34765625, 250.421875, 264.49609375, 278.5703125, 292.64453125, 306.71875, 320.79296875, 334.8671875, 348.94140625, 363.015625, 377.08984375, 391.1640625, 405.23828125, 419.3125, 433.38671875, 447.4609375, 461.53515625, 475.609375, 489.68359375, 503.7578125, 517.83203125, 531.90625, 545.98046875, 560.0546875, 574.12890625, 588.203125, 602.27734375, 616.3515625, 630.42578125, 644.5]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 6.0, 5.0, 8.0, 10.0, 10.0, 8.0, 20.0, 33.0, 30.0, 52.0, 83.0, 146.0, 273.0, 561.0, 1333.0, 4748.0, 36824.0, 804700.0, 182850.0, 12510.0, 2537.0, 855.0, 388.0, 212.0, 106.0, 68.0, 43.0, 31.0, 26.0, 21.0, 11.0, 6.0, 4.0, 10.0, 2.0, 2.0, 2.0, 2.0, 3.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-123.0625, -119.1884765625, -115.314453125, -111.4404296875, -107.56640625, -103.6923828125, -99.818359375, -95.9443359375, -92.0703125, -88.1962890625, -84.322265625, -80.4482421875, -76.57421875, -72.7001953125, -68.826171875, -64.9521484375, -61.078125, -57.2041015625, -53.330078125, -49.4560546875, -45.58203125, -41.7080078125, -37.833984375, -33.9599609375, -30.0859375, -26.2119140625, -22.337890625, -18.4638671875, -14.58984375, -10.7158203125, -6.841796875, -2.9677734375, 0.90625, 4.7802734375, 8.654296875, 12.5283203125, 16.40234375, 20.2763671875, 24.150390625, 28.0244140625, 31.8984375, 35.7724609375, 39.646484375, 43.5205078125, 47.39453125, 51.2685546875, 55.142578125, 59.0166015625, 62.890625, 66.7646484375, 70.638671875, 74.5126953125, 78.38671875, 82.2607421875, 86.134765625, 90.0087890625, 93.8828125, 97.7568359375, 101.630859375, 105.5048828125, 109.37890625, 113.2529296875, 117.126953125, 121.0009765625, 124.875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 5.0, 4.0, 5.0, 2.0, 10.0, 7.0, 11.0, 11.0, 21.0, 10.0, 24.0, 26.0, 32.0, 46.0, 54.0, 88.0, 156.0, 124.0, 76.0, 62.0, 52.0, 42.0, 32.0, 28.0, 17.0, 14.0, 8.0, 5.0, 7.0, 9.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0189056396484375, -0.01833033561706543, -0.01775503158569336, -0.01717972755432129, -0.01660442352294922, -0.01602911949157715, -0.015453815460205078, -0.014878511428833008, -0.014303207397460938, -0.013727903366088867, -0.013152599334716797, -0.012577295303344727, -0.012001991271972656, -0.011426687240600586, -0.010851383209228516, -0.010276079177856445, -0.009700775146484375, -0.009125471115112305, -0.008550167083740234, -0.007974863052368164, -0.007399559020996094, -0.0068242549896240234, -0.006248950958251953, -0.005673646926879883, -0.0050983428955078125, -0.004523038864135742, -0.003947734832763672, -0.0033724308013916016, -0.0027971267700195312, -0.002221822738647461, -0.0016465187072753906, -0.0010712146759033203, -0.00049591064453125, 7.939338684082031e-05, 0.0006546974182128906, 0.001230001449584961, 0.0018053054809570312, 0.0023806095123291016, 0.002955913543701172, 0.003531217575073242, 0.0041065216064453125, 0.004681825637817383, 0.005257129669189453, 0.0058324337005615234, 0.006407737731933594, 0.006983041763305664, 0.007558345794677734, 0.008133649826049805, 0.008708953857421875, 0.009284257888793945, 0.009859561920166016, 0.010434865951538086, 0.011010169982910156, 0.011585474014282227, 0.012160778045654297, 0.012736082077026367, 0.013311386108398438, 0.013886690139770508, 0.014461994171142578, 0.015037298202514648, 0.015612602233886719, 0.01618790626525879, 0.01676321029663086, 0.01733851432800293, 0.017913818359375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 8.0, 7.0, 9.0, 5.0, 14.0, 12.0, 29.0, 26.0, 30.0, 44.0, 63.0, 112.0, 160.0, 212.0, 333.0, 627.0, 1038.0, 2113.0, 5039.0, 17127.0, 110832.0, 766445.0, 116680.0, 17515.0, 5080.0, 2156.0, 1039.0, 625.0, 397.0, 240.0, 134.0, 128.0, 72.0, 43.0, 41.0, 26.0, 23.0, 15.0, 10.0, 12.0, 11.0, 8.0, 3.0, 5.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-83.375, -80.810546875, -78.24609375, -75.681640625, -73.1171875, -70.552734375, -67.98828125, -65.423828125, -62.859375, -60.294921875, -57.73046875, -55.166015625, -52.6015625, -50.037109375, -47.47265625, -44.908203125, -42.34375, -39.779296875, -37.21484375, -34.650390625, -32.0859375, -29.521484375, -26.95703125, -24.392578125, -21.828125, -19.263671875, -16.69921875, -14.134765625, -11.5703125, -9.005859375, -6.44140625, -3.876953125, -1.3125, 1.251953125, 3.81640625, 6.380859375, 8.9453125, 11.509765625, 14.07421875, 16.638671875, 19.203125, 21.767578125, 24.33203125, 26.896484375, 29.4609375, 32.025390625, 34.58984375, 37.154296875, 39.71875, 42.283203125, 44.84765625, 47.412109375, 49.9765625, 52.541015625, 55.10546875, 57.669921875, 60.234375, 62.798828125, 65.36328125, 67.927734375, 70.4921875, 73.056640625, 75.62109375, 78.185546875, 80.75]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 7.0, 6.0, 8.0, 8.0, 10.0, 12.0, 15.0, 17.0, 22.0, 34.0, 52.0, 65.0, 80.0, 102.0, 78.0, 102.0, 89.0, 57.0, 73.0, 45.0, 36.0, 20.0, 27.0, 9.0, 13.0, 4.0, 5.0, 5.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.75, -74.0966796875, -71.443359375, -68.7900390625, -66.13671875, -63.4833984375, -60.830078125, -58.1767578125, -55.5234375, -52.8701171875, -50.216796875, -47.5634765625, -44.91015625, -42.2568359375, -39.603515625, -36.9501953125, -34.296875, -31.6435546875, -28.990234375, -26.3369140625, -23.68359375, -21.0302734375, -18.376953125, -15.7236328125, -13.0703125, -10.4169921875, -7.763671875, -5.1103515625, -2.45703125, 0.1962890625, 2.849609375, 5.5029296875, 8.15625, 10.8095703125, 13.462890625, 16.1162109375, 18.76953125, 21.4228515625, 24.076171875, 26.7294921875, 29.3828125, 32.0361328125, 34.689453125, 37.3427734375, 39.99609375, 42.6494140625, 45.302734375, 47.9560546875, 50.609375, 53.2626953125, 55.916015625, 58.5693359375, 61.22265625, 63.8759765625, 66.529296875, 69.1826171875, 71.8359375, 74.4892578125, 77.142578125, 79.7958984375, 82.44921875, 85.1025390625, 87.755859375, 90.4091796875, 93.0625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 3.0, 5.0, 12.0, 34.0, 85.0, 119.0, 312.0, 232.0, 112.0, 49.0, 27.0, 12.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3038.5537109375, -2958.27294921875, -2877.992431640625, -2797.7119140625, -2717.43115234375, -2637.150390625, -2556.869873046875, -2476.58935546875, -2396.30859375, -2316.02783203125, -2235.747314453125, -2155.466796875, -2075.18603515625, -1994.9053955078125, -1914.624755859375, -1834.3441162109375, -1754.0634765625, -1673.7828369140625, -1593.502197265625, -1513.2215576171875, -1432.94091796875, -1352.6602783203125, -1272.379638671875, -1192.0989990234375, -1111.818359375, -1031.5377197265625, -951.257080078125, -870.9764404296875, -790.69580078125, -710.4151611328125, -630.134521484375, -549.8538818359375, -469.5732421875, -389.2926025390625, -309.011962890625, -228.7313232421875, -148.45068359375, -68.1700439453125, 12.110595703125, 92.3912353515625, 172.671875, 252.9525146484375, 333.233154296875, 413.5137939453125, 493.79443359375, 574.0750732421875, 654.355712890625, 734.6363525390625, 814.9169921875, 895.1976318359375, 975.478271484375, 1055.7589111328125, 1136.03955078125, 1216.3201904296875, 1296.600830078125, 1376.8814697265625, 1457.162109375, 1537.4427490234375, 1617.723388671875, 1698.0040283203125, 1778.28466796875, 1858.5653076171875, 1938.845947265625, 2019.1265869140625, 2099.4072265625]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 4.0, 3.0, 6.0, 3.0, 12.0, 9.0, 16.0, 14.0, 20.0, 22.0, 25.0, 21.0, 39.0, 32.0, 40.0, 49.0, 58.0, 70.0, 75.0, 63.0, 60.0, 57.0, 30.0, 38.0, 25.0, 39.0, 27.0, 28.0, 24.0, 16.0, 12.0, 13.0, 10.0, 10.0, 4.0, 4.0, 5.0, 4.0, 2.0, 3.0, 6.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1015.4004516601562, -983.4732666015625, -951.5460815429688, -919.618896484375, -887.6917114257812, -855.7645263671875, -823.8372802734375, -791.91015625, -759.98291015625, -728.0557250976562, -696.1285400390625, -664.2013549804688, -632.274169921875, -600.3469848632812, -568.4197998046875, -536.4925537109375, -504.5654296875, -472.63824462890625, -440.7110595703125, -408.78387451171875, -376.856689453125, -344.92950439453125, -313.0022888183594, -281.0751037597656, -249.14791870117188, -217.22073364257812, -185.29354858398438, -153.36634826660156, -121.43916320800781, -89.51197814941406, -57.58477783203125, -25.6575927734375, 6.2696533203125, 38.196842193603516, 70.12403106689453, 102.05122375488281, 133.97840881347656, 165.9055938720703, 197.83279418945312, 229.75997924804688, 261.6871643066406, 293.6143493652344, 325.5415344238281, 357.46875, 389.39593505859375, 421.3231201171875, 453.25030517578125, 485.177490234375, 517.1046752929688, 549.0318603515625, 580.9590454101562, 612.88623046875, 644.8134155273438, 676.7406005859375, 708.6678466796875, 740.594970703125, 772.522216796875, 804.4494018554688, 836.3765869140625, 868.3037719726562, 900.23095703125, 932.1581420898438, 964.0853271484375, 996.0125732421875, 1027.939697265625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 4.0, 4.0, 12.0, 16.0, 30.0, 40.0, 83.0, 226.0, 735.0, 3696.0, 33426.0, 3163148.0, 967924.0, 20333.0, 3388.0, 840.0, 253.0, 74.0, 33.0, 11.0, 7.0, 2.0, 2.0], "bins": [-386.0, -378.701171875, -371.40234375, -364.103515625, -356.8046875, -349.505859375, -342.20703125, -334.908203125, -327.609375, -320.310546875, -313.01171875, -305.712890625, -298.4140625, -291.115234375, -283.81640625, -276.517578125, -269.21875, -261.919921875, -254.62109375, -247.322265625, -240.0234375, -232.724609375, -225.42578125, -218.126953125, -210.828125, -203.529296875, -196.23046875, -188.931640625, -181.6328125, -174.333984375, -167.03515625, -159.736328125, -152.4375, -145.138671875, -137.83984375, -130.541015625, -123.2421875, -115.943359375, -108.64453125, -101.345703125, -94.046875, -86.748046875, -79.44921875, -72.150390625, -64.8515625, -57.552734375, -50.25390625, -42.955078125, -35.65625, -28.357421875, -21.05859375, -13.759765625, -6.4609375, 0.837890625, 8.13671875, 15.435546875, 22.734375, 30.033203125, 37.33203125, 44.630859375, 51.9296875, 59.228515625, 66.52734375, 73.826171875, 81.125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 6.0, 7.0, 12.0, 11.0, 19.0, 42.0, 73.0, 115.0, 108.0, 141.0, 146.0, 113.0, 71.0, 59.0, 43.0, 23.0, 11.0, 13.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-240.0, -235.26904296875, -230.5380859375, -225.80712890625, -221.076171875, -216.34521484375, -211.6142578125, -206.88330078125, -202.15234375, -197.42138671875, -192.6904296875, -187.95947265625, -183.228515625, -178.49755859375, -173.7666015625, -169.03564453125, -164.3046875, -159.57373046875, -154.8427734375, -150.11181640625, -145.380859375, -140.64990234375, -135.9189453125, -131.18798828125, -126.45703125, -121.72607421875, -116.9951171875, -112.26416015625, -107.533203125, -102.80224609375, -98.0712890625, -93.34033203125, -88.609375, -83.87841796875, -79.1474609375, -74.41650390625, -69.685546875, -64.95458984375, -60.2236328125, -55.49267578125, -50.76171875, -46.03076171875, -41.2998046875, -36.56884765625, -31.837890625, -27.10693359375, -22.3759765625, -17.64501953125, -12.9140625, -8.18310546875, -3.4521484375, 1.27880859375, 6.009765625, 10.74072265625, 15.4716796875, 20.20263671875, 24.93359375, 29.66455078125, 34.3955078125, 39.12646484375, 43.857421875, 48.58837890625, 53.3193359375, 58.05029296875, 62.78125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 4.0, 6.0, 17.0, 16.0, 26.0, 35.0, 59.0, 87.0, 162.0, 246.0, 463.0, 975.0, 2029.0, 4637.0, 11213.0, 32437.0, 144504.0, 2911225.0, 962918.0, 85576.0, 23094.0, 8120.0, 3217.0, 1476.0, 751.0, 389.0, 239.0, 130.0, 79.0, 49.0, 29.0, 23.0, 11.0, 10.0, 9.0, 3.0, 2.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-152.25, -147.146484375, -142.04296875, -136.939453125, -131.8359375, -126.732421875, -121.62890625, -116.525390625, -111.421875, -106.318359375, -101.21484375, -96.111328125, -91.0078125, -85.904296875, -80.80078125, -75.697265625, -70.59375, -65.490234375, -60.38671875, -55.283203125, -50.1796875, -45.076171875, -39.97265625, -34.869140625, -29.765625, -24.662109375, -19.55859375, -14.455078125, -9.3515625, -4.248046875, 0.85546875, 5.958984375, 11.0625, 16.166015625, 21.26953125, 26.373046875, 31.4765625, 36.580078125, 41.68359375, 46.787109375, 51.890625, 56.994140625, 62.09765625, 67.201171875, 72.3046875, 77.408203125, 82.51171875, 87.615234375, 92.71875, 97.822265625, 102.92578125, 108.029296875, 113.1328125, 118.236328125, 123.33984375, 128.443359375, 133.546875, 138.650390625, 143.75390625, 148.857421875, 153.9609375, 159.064453125, 164.16796875, 169.271484375, 174.375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 3.0, 7.0, 9.0, 11.0, 17.0, 19.0, 17.0, 24.0, 50.0, 72.0, 128.0, 262.0, 649.0, 1148.0, 839.0, 334.0, 152.0, 117.0, 64.0, 39.0, 26.0, 28.0, 17.0, 7.0, 3.0, 7.0, 9.0, 4.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-215.125, -207.876953125, -200.62890625, -193.380859375, -186.1328125, -178.884765625, -171.63671875, -164.388671875, -157.140625, -149.892578125, -142.64453125, -135.396484375, -128.1484375, -120.900390625, -113.65234375, -106.404296875, -99.15625, -91.908203125, -84.66015625, -77.412109375, -70.1640625, -62.916015625, -55.66796875, -48.419921875, -41.171875, -33.923828125, -26.67578125, -19.427734375, -12.1796875, -4.931640625, 2.31640625, 9.564453125, 16.8125, 24.060546875, 31.30859375, 38.556640625, 45.8046875, 53.052734375, 60.30078125, 67.548828125, 74.796875, 82.044921875, 89.29296875, 96.541015625, 103.7890625, 111.037109375, 118.28515625, 125.533203125, 132.78125, 140.029296875, 147.27734375, 154.525390625, 161.7734375, 169.021484375, 176.26953125, 183.517578125, 190.765625, 198.013671875, 205.26171875, 212.509765625, 219.7578125, 227.005859375, 234.25390625, 241.501953125, 248.75]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 12.0, 37.0, 74.0, 138.0, 253.0, 246.0, 126.0, 47.0, 34.0, 8.0, 6.0, 5.0, 4.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1746.4625244140625, -1676.0208740234375, -1605.5791015625, -1535.137451171875, -1464.69580078125, -1394.2540283203125, -1323.8123779296875, -1253.37060546875, -1182.928955078125, -1112.4873046875, -1042.0455322265625, -971.6038818359375, -901.1621704101562, -830.720458984375, -760.27880859375, -689.8370971679688, -619.3953857421875, -548.9536743164062, -478.5119934082031, -408.0703125, -337.62860107421875, -267.1868896484375, -196.74520874023438, -126.30352783203125, -55.86181640625, 14.579879760742188, 85.02157592773438, 155.46327209472656, 225.90496826171875, 296.3466796875, 366.7883605957031, 437.23004150390625, 507.671875, 578.1135864257812, 648.5552978515625, 718.9969482421875, 789.4386596679688, 859.88037109375, 930.322021484375, 1000.7637329101562, 1071.2054443359375, 1141.6470947265625, 1212.0888671875, 1282.530517578125, 1352.97216796875, 1423.4139404296875, 1493.8555908203125, 1564.29736328125, 1634.739013671875, 1705.1806640625, 1775.6224365234375, 1846.0640869140625, 1916.505859375, 1986.947509765625, 2057.38916015625, 2127.830810546875, 2198.2724609375, 2268.714111328125, 2339.15576171875, 2409.59765625, 2480.039306640625, 2550.48095703125, 2620.922607421875, 2691.3642578125, 2761.80615234375]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 3.0, 1.0, 7.0, 8.0, 9.0, 17.0, 27.0, 24.0, 25.0, 33.0, 41.0, 39.0, 46.0, 65.0, 56.0, 49.0, 75.0, 59.0, 69.0, 51.0, 41.0, 52.0, 37.0, 29.0, 28.0, 21.0, 25.0, 15.0, 10.0, 15.0, 7.0, 6.0, 5.0, 9.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-943.9989013671875, -911.0428466796875, -878.0867919921875, -845.1307373046875, -812.1746826171875, -779.2186279296875, -746.2625732421875, -713.3065185546875, -680.3504638671875, -647.3944091796875, -614.4383544921875, -581.4822998046875, -548.5262451171875, -515.5701904296875, -482.6141357421875, -449.6580810546875, -416.7020263671875, -383.7459716796875, -350.7899169921875, -317.8338623046875, -284.8778076171875, -251.9217529296875, -218.9656982421875, -186.0096435546875, -153.0535888671875, -120.0975341796875, -87.1414794921875, -54.1854248046875, -21.2293701171875, 11.7266845703125, 44.6827392578125, 77.6387939453125, 110.5947265625, 143.55078125, 176.5068359375, 209.462890625, 242.4189453125, 275.375, 308.3310546875, 341.287109375, 374.2431640625, 407.19921875, 440.1552734375, 473.111328125, 506.0673828125, 539.0234375, 571.9794921875, 604.935546875, 637.8916015625, 670.84765625, 703.8037109375, 736.759765625, 769.7158203125, 802.671875, 835.6279296875, 868.583984375, 901.5400390625, 934.49609375, 967.4521484375, 1000.408203125, 1033.3642578125, 1066.3203125, 1099.2763671875, 1132.232421875, 1165.1884765625]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 1.0, 6.0, 6.0, 5.0, 6.0, 10.0, 15.0, 19.0, 54.0, 99.0, 217.0, 426.0, 1111.0, 2791.0, 9175.0, 36339.0, 185909.0, 609054.0, 158706.0, 31884.0, 8317.0, 2623.0, 960.0, 415.0, 199.0, 93.0, 50.0, 29.0, 19.0, 9.0, 6.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-209.625, -202.9609375, -196.296875, -189.6328125, -182.96875, -176.3046875, -169.640625, -162.9765625, -156.3125, -149.6484375, -142.984375, -136.3203125, -129.65625, -122.9921875, -116.328125, -109.6640625, -103.0, -96.3359375, -89.671875, -83.0078125, -76.34375, -69.6796875, -63.015625, -56.3515625, -49.6875, -43.0234375, -36.359375, -29.6953125, -23.03125, -16.3671875, -9.703125, -3.0390625, 3.625, 10.2890625, 16.953125, 23.6171875, 30.28125, 36.9453125, 43.609375, 50.2734375, 56.9375, 63.6015625, 70.265625, 76.9296875, 83.59375, 90.2578125, 96.921875, 103.5859375, 110.25, 116.9140625, 123.578125, 130.2421875, 136.90625, 143.5703125, 150.234375, 156.8984375, 163.5625, 170.2265625, 176.890625, 183.5546875, 190.21875, 196.8828125, 203.546875, 210.2109375, 216.875]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 3.0, 7.0, 15.0, 16.0, 13.0, 19.0, 22.0, 36.0, 28.0, 45.0, 53.0, 58.0, 56.0, 58.0, 59.0, 61.0, 76.0, 60.0, 58.0, 42.0, 34.0, 32.0, 39.0, 28.0, 23.0, 27.0, 12.0, 9.0, 7.0, 6.0, 5.0, 3.0, 1.0, 2.0], "bins": [-108.9375, -106.521484375, -104.10546875, -101.689453125, -99.2734375, -96.857421875, -94.44140625, -92.025390625, -89.609375, -87.193359375, -84.77734375, -82.361328125, -79.9453125, -77.529296875, -75.11328125, -72.697265625, -70.28125, -67.865234375, -65.44921875, -63.033203125, -60.6171875, -58.201171875, -55.78515625, -53.369140625, -50.953125, -48.537109375, -46.12109375, -43.705078125, -41.2890625, -38.873046875, -36.45703125, -34.041015625, -31.625, -29.208984375, -26.79296875, -24.376953125, -21.9609375, -19.544921875, -17.12890625, -14.712890625, -12.296875, -9.880859375, -7.46484375, -5.048828125, -2.6328125, -0.216796875, 2.19921875, 4.615234375, 7.03125, 9.447265625, 11.86328125, 14.279296875, 16.6953125, 19.111328125, 21.52734375, 23.943359375, 26.359375, 28.775390625, 31.19140625, 33.607421875, 36.0234375, 38.439453125, 40.85546875, 43.271484375, 45.6875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 5.0, 7.0, 10.0, 18.0, 18.0, 21.0, 43.0, 51.0, 84.0, 145.0, 222.0, 393.0, 716.0, 1528.0, 4176.0, 18580.0, 252121.0, 726955.0, 33189.0, 6088.0, 2067.0, 886.0, 477.0, 281.0, 176.0, 91.0, 50.0, 55.0, 32.0, 23.0, 23.0, 5.0, 7.0, 6.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-290.0, -277.98828125, -265.9765625, -253.96484375, -241.953125, -229.94140625, -217.9296875, -205.91796875, -193.90625, -181.89453125, -169.8828125, -157.87109375, -145.859375, -133.84765625, -121.8359375, -109.82421875, -97.8125, -85.80078125, -73.7890625, -61.77734375, -49.765625, -37.75390625, -25.7421875, -13.73046875, -1.71875, 10.29296875, 22.3046875, 34.31640625, 46.328125, 58.33984375, 70.3515625, 82.36328125, 94.375, 106.38671875, 118.3984375, 130.41015625, 142.421875, 154.43359375, 166.4453125, 178.45703125, 190.46875, 202.48046875, 214.4921875, 226.50390625, 238.515625, 250.52734375, 262.5390625, 274.55078125, 286.5625, 298.57421875, 310.5859375, 322.59765625, 334.609375, 346.62109375, 358.6328125, 370.64453125, 382.65625, 394.66796875, 406.6796875, 418.69140625, 430.703125, 442.71484375, 454.7265625, 466.73828125, 478.75]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 8.0, 12.0, 8.0, 15.0, 17.0, 26.0, 29.0, 42.0, 47.0, 67.0, 74.0, 62.0, 90.0, 89.0, 81.0, 71.0, 53.0, 48.0, 45.0, 39.0, 27.0, 15.0, 13.0, 9.0, 7.0, 8.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-246.125, -234.326171875, -222.52734375, -210.728515625, -198.9296875, -187.130859375, -175.33203125, -163.533203125, -151.734375, -139.935546875, -128.13671875, -116.337890625, -104.5390625, -92.740234375, -80.94140625, -69.142578125, -57.34375, -45.544921875, -33.74609375, -21.947265625, -10.1484375, 1.650390625, 13.44921875, 25.248046875, 37.046875, 48.845703125, 60.64453125, 72.443359375, 84.2421875, 96.041015625, 107.83984375, 119.638671875, 131.4375, 143.236328125, 155.03515625, 166.833984375, 178.6328125, 190.431640625, 202.23046875, 214.029296875, 225.828125, 237.626953125, 249.42578125, 261.224609375, 273.0234375, 284.822265625, 296.62109375, 308.419921875, 320.21875, 332.017578125, 343.81640625, 355.615234375, 367.4140625, 379.212890625, 391.01171875, 402.810546875, 414.609375, 426.408203125, 438.20703125, 450.005859375, 461.8046875, 473.603515625, 485.40234375, 497.201171875, 509.0]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 1.0, 2.0, 3.0, 6.0, 8.0, 8.0, 4.0, 10.0, 8.0, 10.0, 14.0, 16.0, 20.0, 29.0, 48.0, 69.0, 103.0, 154.0, 313.0, 720.0, 2179.0, 12709.0, 325375.0, 685933.0, 16626.0, 2532.0, 792.0, 338.0, 178.0, 104.0, 68.0, 37.0, 26.0, 26.0, 16.0, 13.0, 13.0, 4.0, 9.0, 9.0, 6.0, 4.0, 4.0, 4.0, 1.0, 4.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0], "bins": [-170.5, -165.63671875, -160.7734375, -155.91015625, -151.046875, -146.18359375, -141.3203125, -136.45703125, -131.59375, -126.73046875, -121.8671875, -117.00390625, -112.140625, -107.27734375, -102.4140625, -97.55078125, -92.6875, -87.82421875, -82.9609375, -78.09765625, -73.234375, -68.37109375, -63.5078125, -58.64453125, -53.78125, -48.91796875, -44.0546875, -39.19140625, -34.328125, -29.46484375, -24.6015625, -19.73828125, -14.875, -10.01171875, -5.1484375, -0.28515625, 4.578125, 9.44140625, 14.3046875, 19.16796875, 24.03125, 28.89453125, 33.7578125, 38.62109375, 43.484375, 48.34765625, 53.2109375, 58.07421875, 62.9375, 67.80078125, 72.6640625, 77.52734375, 82.390625, 87.25390625, 92.1171875, 96.98046875, 101.84375, 106.70703125, 111.5703125, 116.43359375, 121.296875, 126.16015625, 131.0234375, 135.88671875, 140.75]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 5.0, 4.0, 11.0, 17.0, 10.0, 24.0, 32.0, 38.0, 54.0, 113.0, 190.0, 181.0, 113.0, 65.0, 36.0, 29.0, 19.0, 15.0, 13.0, 10.0, 6.0, 3.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.020050048828125, -0.01933121681213379, -0.018612384796142578, -0.017893552780151367, -0.017174720764160156, -0.016455888748168945, -0.015737056732177734, -0.015018224716186523, -0.014299392700195312, -0.013580560684204102, -0.01286172866821289, -0.01214289665222168, -0.011424064636230469, -0.010705232620239258, -0.009986400604248047, -0.009267568588256836, -0.008548736572265625, -0.007829904556274414, -0.007111072540283203, -0.006392240524291992, -0.005673408508300781, -0.00495457649230957, -0.004235744476318359, -0.0035169124603271484, -0.0027980804443359375, -0.0020792484283447266, -0.0013604164123535156, -0.0006415843963623047, 7.724761962890625e-05, 0.0007960796356201172, 0.0015149116516113281, 0.002233743667602539, 0.00295257568359375, 0.003671407699584961, 0.004390239715576172, 0.005109071731567383, 0.005827903747558594, 0.006546735763549805, 0.007265567779541016, 0.007984399795532227, 0.008703231811523438, 0.009422063827514648, 0.01014089584350586, 0.01085972785949707, 0.011578559875488281, 0.012297391891479492, 0.013016223907470703, 0.013735055923461914, 0.014453887939453125, 0.015172719955444336, 0.015891551971435547, 0.016610383987426758, 0.01732921600341797, 0.01804804801940918, 0.01876688003540039, 0.0194857120513916, 0.020204544067382812, 0.020923376083374023, 0.021642208099365234, 0.022361040115356445, 0.023079872131347656, 0.023798704147338867, 0.024517536163330078, 0.02523636817932129, 0.0259552001953125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 3.0, 3.0, 4.0, 5.0, 9.0, 12.0, 18.0, 22.0, 39.0, 77.0, 107.0, 197.0, 380.0, 1009.0, 2999.0, 17354.0, 743569.0, 267769.0, 11070.0, 2353.0, 802.0, 354.0, 139.0, 95.0, 62.0, 30.0, 26.0, 15.0, 9.0, 6.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-140.0, -135.744140625, -131.48828125, -127.232421875, -122.9765625, -118.720703125, -114.46484375, -110.208984375, -105.953125, -101.697265625, -97.44140625, -93.185546875, -88.9296875, -84.673828125, -80.41796875, -76.162109375, -71.90625, -67.650390625, -63.39453125, -59.138671875, -54.8828125, -50.626953125, -46.37109375, -42.115234375, -37.859375, -33.603515625, -29.34765625, -25.091796875, -20.8359375, -16.580078125, -12.32421875, -8.068359375, -3.8125, 0.443359375, 4.69921875, 8.955078125, 13.2109375, 17.466796875, 21.72265625, 25.978515625, 30.234375, 34.490234375, 38.74609375, 43.001953125, 47.2578125, 51.513671875, 55.76953125, 60.025390625, 64.28125, 68.537109375, 72.79296875, 77.048828125, 81.3046875, 85.560546875, 89.81640625, 94.072265625, 98.328125, 102.583984375, 106.83984375, 111.095703125, 115.3515625, 119.607421875, 123.86328125, 128.119140625, 132.375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 1.0, 1.0, 4.0, 7.0, 5.0, 13.0, 20.0, 23.0, 38.0, 79.0, 126.0, 178.0, 163.0, 122.0, 74.0, 65.0, 30.0, 15.0, 17.0, 10.0, 7.0, 1.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-118.875, -115.28125, -111.6875, -108.09375, -104.5, -100.90625, -97.3125, -93.71875, -90.125, -86.53125, -82.9375, -79.34375, -75.75, -72.15625, -68.5625, -64.96875, -61.375, -57.78125, -54.1875, -50.59375, -47.0, -43.40625, -39.8125, -36.21875, -32.625, -29.03125, -25.4375, -21.84375, -18.25, -14.65625, -11.0625, -7.46875, -3.875, -0.28125, 3.3125, 6.90625, 10.5, 14.09375, 17.6875, 21.28125, 24.875, 28.46875, 32.0625, 35.65625, 39.25, 42.84375, 46.4375, 50.03125, 53.625, 57.21875, 60.8125, 64.40625, 68.0, 71.59375, 75.1875, 78.78125, 82.375, 85.96875, 89.5625, 93.15625, 96.75, 100.34375, 103.9375, 107.53125, 111.125]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 5.0, 6.0, 6.0, 5.0, 14.0, 35.0, 67.0, 109.0, 135.0, 232.0, 139.0, 104.0, 51.0, 35.0, 22.0, 16.0, 10.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0], "bins": [-2232.2333984375, -2185.23828125, -2138.242919921875, -2091.247802734375, -2044.2525634765625, -1997.25732421875, -1950.26220703125, -1903.2669677734375, -1856.271728515625, -1809.2764892578125, -1762.2813720703125, -1715.2861328125, -1668.2908935546875, -1621.295654296875, -1574.300537109375, -1527.3052978515625, -1480.3101806640625, -1433.31494140625, -1386.31982421875, -1339.3245849609375, -1292.329345703125, -1245.334228515625, -1198.3389892578125, -1151.34375, -1104.3486328125, -1057.3533935546875, -1010.3582153320312, -963.363037109375, -916.3677978515625, -869.3726196289062, -822.37744140625, -775.3822021484375, -728.3870849609375, -681.3919067382812, -634.3966674804688, -587.4014892578125, -540.40625, -493.41107177734375, -446.4158935546875, -399.4206848144531, -352.42547607421875, -305.4302673339844, -258.43505859375, -211.43988037109375, -164.44467163085938, -117.449462890625, -70.45428466796875, -23.459075927734375, 23.5361328125, 70.53133392333984, 117.52653503417969, 164.521728515625, 211.51693725585938, 258.51214599609375, 305.50732421875, 352.5025329589844, 399.49774169921875, 446.4929504394531, 493.4881591796875, 540.4833374023438, 587.478515625, 634.4737548828125, 681.4689331054688, 728.464111328125, 775.4593505859375]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 4.0, 10.0, 19.0, 12.0, 13.0, 16.0, 19.0, 18.0, 21.0, 24.0, 26.0, 29.0, 22.0, 37.0, 41.0, 31.0, 57.0, 51.0, 71.0, 68.0, 57.0, 55.0, 35.0, 33.0, 32.0, 24.0, 26.0, 23.0, 12.0, 19.0, 18.0, 17.0, 9.0, 11.0, 10.0, 8.0, 7.0, 4.0, 5.0, 4.0, 2.0, 5.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-902.8841552734375, -874.5045776367188, -846.125, -817.7454833984375, -789.3659057617188, -760.986328125, -732.6067504882812, -704.2271728515625, -675.8475952148438, -647.468017578125, -619.0884399414062, -590.7088623046875, -562.329345703125, -533.9497680664062, -505.5701904296875, -477.19061279296875, -448.8110656738281, -420.4314880371094, -392.05194091796875, -363.67236328125, -335.29278564453125, -306.9132080078125, -278.5336608886719, -250.15408325195312, -221.77452087402344, -193.39495849609375, -165.015380859375, -136.6358184814453, -108.2562484741211, -79.87667846679688, -51.49711608886719, -23.117538452148438, 5.26202392578125, 33.64159393310547, 62.02116012573242, 90.40072631835938, 118.7802963256836, 147.1598663330078, 175.5394287109375, 203.91900634765625, 232.29856872558594, 260.6781311035156, 289.0577087402344, 317.437255859375, 345.81683349609375, 374.1964111328125, 402.57598876953125, 430.95556640625, 459.3351135253906, 487.7146911621094, 516.09423828125, 544.4738159179688, 572.8533935546875, 601.2329711914062, 629.612548828125, 657.9920654296875, 686.3716430664062, 714.751220703125, 743.1307983398438, 771.5103759765625, 799.889892578125, 828.2694702148438, 856.6490478515625, 885.0286254882812, 913.408203125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 4.0, 4.0, 3.0, 4.0, 7.0, 8.0, 10.0, 24.0, 26.0, 48.0, 77.0, 148.0, 277.0, 617.0, 1521.0, 4215.0, 13548.0, 81330.0, 3107581.0, 933086.0, 37989.0, 8943.0, 2899.0, 1034.0, 423.0, 208.0, 115.0, 65.0, 22.0, 19.0, 13.0, 12.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-213.25, -208.150390625, -203.05078125, -197.951171875, -192.8515625, -187.751953125, -182.65234375, -177.552734375, -172.453125, -167.353515625, -162.25390625, -157.154296875, -152.0546875, -146.955078125, -141.85546875, -136.755859375, -131.65625, -126.556640625, -121.45703125, -116.357421875, -111.2578125, -106.158203125, -101.05859375, -95.958984375, -90.859375, -85.759765625, -80.66015625, -75.560546875, -70.4609375, -65.361328125, -60.26171875, -55.162109375, -50.0625, -44.962890625, -39.86328125, -34.763671875, -29.6640625, -24.564453125, -19.46484375, -14.365234375, -9.265625, -4.166015625, 0.93359375, 6.033203125, 11.1328125, 16.232421875, 21.33203125, 26.431640625, 31.53125, 36.630859375, 41.73046875, 46.830078125, 51.9296875, 57.029296875, 62.12890625, 67.228515625, 72.328125, 77.427734375, 82.52734375, 87.626953125, 92.7265625, 97.826171875, 102.92578125, 108.025390625, 113.125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 3.0, 4.0, 2.0, 4.0, 7.0, 11.0, 8.0, 4.0, 10.0, 7.0, 15.0, 15.0, 19.0, 19.0, 19.0, 25.0, 29.0, 48.0, 40.0, 34.0, 40.0, 41.0, 41.0, 33.0, 43.0, 44.0, 41.0, 41.0, 31.0, 27.0, 31.0, 30.0, 36.0, 31.0, 22.0, 15.0, 24.0, 20.0, 10.0, 13.0, 15.0, 5.0, 12.0, 6.0, 11.0, 6.0, 4.0, 4.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0], "bins": [-49.5, -48.068359375, -46.63671875, -45.205078125, -43.7734375, -42.341796875, -40.91015625, -39.478515625, -38.046875, -36.615234375, -35.18359375, -33.751953125, -32.3203125, -30.888671875, -29.45703125, -28.025390625, -26.59375, -25.162109375, -23.73046875, -22.298828125, -20.8671875, -19.435546875, -18.00390625, -16.572265625, -15.140625, -13.708984375, -12.27734375, -10.845703125, -9.4140625, -7.982421875, -6.55078125, -5.119140625, -3.6875, -2.255859375, -0.82421875, 0.607421875, 2.0390625, 3.470703125, 4.90234375, 6.333984375, 7.765625, 9.197265625, 10.62890625, 12.060546875, 13.4921875, 14.923828125, 16.35546875, 17.787109375, 19.21875, 20.650390625, 22.08203125, 23.513671875, 24.9453125, 26.376953125, 27.80859375, 29.240234375, 30.671875, 32.103515625, 33.53515625, 34.966796875, 36.3984375, 37.830078125, 39.26171875, 40.693359375, 42.125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 6.0, 7.0, 7.0, 4.0, 6.0, 12.0, 22.0, 23.0, 39.0, 93.0, 147.0, 330.0, 953.0, 3157.0, 13065.0, 82359.0, 3528152.0, 522185.0, 33786.0, 6885.0, 1842.0, 609.0, 249.0, 128.0, 75.0, 42.0, 31.0, 25.0, 14.0, 13.0, 8.0, 3.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-227.375, -219.474609375, -211.57421875, -203.673828125, -195.7734375, -187.873046875, -179.97265625, -172.072265625, -164.171875, -156.271484375, -148.37109375, -140.470703125, -132.5703125, -124.669921875, -116.76953125, -108.869140625, -100.96875, -93.068359375, -85.16796875, -77.267578125, -69.3671875, -61.466796875, -53.56640625, -45.666015625, -37.765625, -29.865234375, -21.96484375, -14.064453125, -6.1640625, 1.736328125, 9.63671875, 17.537109375, 25.4375, 33.337890625, 41.23828125, 49.138671875, 57.0390625, 64.939453125, 72.83984375, 80.740234375, 88.640625, 96.541015625, 104.44140625, 112.341796875, 120.2421875, 128.142578125, 136.04296875, 143.943359375, 151.84375, 159.744140625, 167.64453125, 175.544921875, 183.4453125, 191.345703125, 199.24609375, 207.146484375, 215.046875, 222.947265625, 230.84765625, 238.748046875, 246.6484375, 254.548828125, 262.44921875, 270.349609375, 278.25]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 3.0, 1.0, 4.0, 3.0, 2.0, 4.0, 7.0, 14.0, 8.0, 7.0, 12.0, 20.0, 24.0, 23.0, 43.0, 45.0, 81.0, 132.0, 262.0, 512.0, 837.0, 832.0, 492.0, 242.0, 146.0, 84.0, 54.0, 39.0, 36.0, 26.0, 21.0, 9.0, 11.0, 9.0, 4.0, 6.0, 10.0, 7.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-141.25, -136.0234375, -130.796875, -125.5703125, -120.34375, -115.1171875, -109.890625, -104.6640625, -99.4375, -94.2109375, -88.984375, -83.7578125, -78.53125, -73.3046875, -68.078125, -62.8515625, -57.625, -52.3984375, -47.171875, -41.9453125, -36.71875, -31.4921875, -26.265625, -21.0390625, -15.8125, -10.5859375, -5.359375, -0.1328125, 5.09375, 10.3203125, 15.546875, 20.7734375, 26.0, 31.2265625, 36.453125, 41.6796875, 46.90625, 52.1328125, 57.359375, 62.5859375, 67.8125, 73.0390625, 78.265625, 83.4921875, 88.71875, 93.9453125, 99.171875, 104.3984375, 109.625, 114.8515625, 120.078125, 125.3046875, 130.53125, 135.7578125, 140.984375, 146.2109375, 151.4375, 156.6640625, 161.890625, 167.1171875, 172.34375, 177.5703125, 182.796875, 188.0234375, 193.25]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 9.0, 15.0, 50.0, 137.0, 286.0, 267.0, 136.0, 44.0, 30.0, 7.0, 4.0, 2.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1814.13720703125, -1738.433349609375, -1662.7296142578125, -1587.0257568359375, -1511.322021484375, -1435.6181640625, -1359.914306640625, -1284.21044921875, -1208.5067138671875, -1132.8028564453125, -1057.09912109375, -981.395263671875, -905.6914672851562, -829.9876708984375, -754.2838134765625, -678.5800170898438, -602.876220703125, -527.1724243164062, -451.4685974121094, -375.7647705078125, -300.06097412109375, -224.357177734375, -148.65335083007812, -72.94952392578125, 2.7542724609375, 78.45808410644531, 154.16189575195312, 229.86570739746094, 305.56951904296875, 381.2733154296875, 456.9771423339844, 532.6809692382812, 608.385009765625, 684.0888061523438, 759.7926025390625, 835.4964599609375, 911.2002563476562, 986.904052734375, 1062.60791015625, 1138.311767578125, 1214.0155029296875, 1289.7193603515625, 1365.423095703125, 1441.126953125, 1516.830810546875, 1592.5345458984375, 1668.2384033203125, 1743.942138671875, 1819.64599609375, 1895.349853515625, 1971.0535888671875, 2046.7574462890625, 2122.461181640625, 2198.1650390625, 2273.868896484375, 2349.57275390625, 2425.2763671875, 2500.980224609375, 2576.68408203125, 2652.3876953125, 2728.091552734375, 2803.79541015625, 2879.499267578125, 2955.203125, 3030.906982421875]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 5.0, 1.0, 5.0, 1.0, 3.0, 11.0, 12.0, 7.0, 8.0, 5.0, 16.0, 18.0, 27.0, 27.0, 29.0, 35.0, 41.0, 47.0, 36.0, 47.0, 46.0, 50.0, 59.0, 51.0, 46.0, 40.0, 37.0, 44.0, 31.0, 33.0, 35.0, 19.0, 23.0, 27.0, 7.0, 17.0, 19.0, 7.0, 12.0, 6.0, 8.0, 1.0, 8.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-752.062744140625, -728.3822021484375, -704.70166015625, -681.0211791992188, -657.3406372070312, -633.6600952148438, -609.9796142578125, -586.299072265625, -562.6185302734375, -538.93798828125, -515.2574462890625, -491.57696533203125, -467.89642333984375, -444.21588134765625, -420.5353698730469, -396.8548583984375, -373.17431640625, -349.4937744140625, -325.8132629394531, -302.13275146484375, -278.45220947265625, -254.7716827392578, -231.09115600585938, -207.41062927246094, -183.7301025390625, -160.04957580566406, -136.36904907226562, -112.68852233886719, -89.00799560546875, -65.32746887207031, -41.646942138671875, -17.966415405273438, 5.71405029296875, 29.394577026367188, 53.075103759765625, 76.75563049316406, 100.4361572265625, 124.11668395996094, 147.79721069335938, 171.4777374267578, 195.15826416015625, 218.8387908935547, 242.51931762695312, 266.1998291015625, 289.88037109375, 313.5609130859375, 337.2414245605469, 360.92193603515625, 384.60247802734375, 408.28302001953125, 431.9635314941406, 455.64404296875, 479.3245849609375, 503.005126953125, 526.6856689453125, 550.3661499023438, 574.0466918945312, 597.7272338867188, 621.40771484375, 645.0882568359375, 668.768798828125, 692.4493408203125, 716.1298828125, 739.8103637695312, 763.4909057617188]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 6.0, 5.0, 5.0, 11.0, 21.0, 15.0, 28.0, 29.0, 75.0, 89.0, 154.0, 283.0, 483.0, 873.0, 1587.0, 3228.0, 6986.0, 15929.0, 38592.0, 99449.0, 262511.0, 356501.0, 158686.0, 59320.0, 23998.0, 10255.0, 4565.0, 2226.0, 1148.0, 605.0, 353.0, 215.0, 113.0, 69.0, 48.0, 33.0, 27.0, 18.0, 11.0, 4.0, 1.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-97.6875, -94.748046875, -91.80859375, -88.869140625, -85.9296875, -82.990234375, -80.05078125, -77.111328125, -74.171875, -71.232421875, -68.29296875, -65.353515625, -62.4140625, -59.474609375, -56.53515625, -53.595703125, -50.65625, -47.716796875, -44.77734375, -41.837890625, -38.8984375, -35.958984375, -33.01953125, -30.080078125, -27.140625, -24.201171875, -21.26171875, -18.322265625, -15.3828125, -12.443359375, -9.50390625, -6.564453125, -3.625, -0.685546875, 2.25390625, 5.193359375, 8.1328125, 11.072265625, 14.01171875, 16.951171875, 19.890625, 22.830078125, 25.76953125, 28.708984375, 31.6484375, 34.587890625, 37.52734375, 40.466796875, 43.40625, 46.345703125, 49.28515625, 52.224609375, 55.1640625, 58.103515625, 61.04296875, 63.982421875, 66.921875, 69.861328125, 72.80078125, 75.740234375, 78.6796875, 81.619140625, 84.55859375, 87.498046875, 90.4375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 4.0, 1.0, 5.0, 9.0, 11.0, 11.0, 11.0, 11.0, 14.0, 14.0, 28.0, 24.0, 34.0, 25.0, 38.0, 35.0, 31.0, 46.0, 46.0, 44.0, 54.0, 40.0, 46.0, 42.0, 46.0, 48.0, 29.0, 39.0, 34.0, 23.0, 21.0, 18.0, 24.0, 19.0, 13.0, 13.0, 12.0, 16.0, 4.0, 10.0, 1.0, 6.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-63.4375, -61.63427734375, -59.8310546875, -58.02783203125, -56.224609375, -54.42138671875, -52.6181640625, -50.81494140625, -49.01171875, -47.20849609375, -45.4052734375, -43.60205078125, -41.798828125, -39.99560546875, -38.1923828125, -36.38916015625, -34.5859375, -32.78271484375, -30.9794921875, -29.17626953125, -27.373046875, -25.56982421875, -23.7666015625, -21.96337890625, -20.16015625, -18.35693359375, -16.5537109375, -14.75048828125, -12.947265625, -11.14404296875, -9.3408203125, -7.53759765625, -5.734375, -3.93115234375, -2.1279296875, -0.32470703125, 1.478515625, 3.28173828125, 5.0849609375, 6.88818359375, 8.69140625, 10.49462890625, 12.2978515625, 14.10107421875, 15.904296875, 17.70751953125, 19.5107421875, 21.31396484375, 23.1171875, 24.92041015625, 26.7236328125, 28.52685546875, 30.330078125, 32.13330078125, 33.9365234375, 35.73974609375, 37.54296875, 39.34619140625, 41.1494140625, 42.95263671875, 44.755859375, 46.55908203125, 48.3623046875, 50.16552734375, 51.96875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 4.0, 13.0, 21.0, 10.0, 19.0, 33.0, 48.0, 76.0, 170.0, 327.0, 820.0, 2787.0, 13635.0, 141206.0, 816409.0, 61990.0, 7882.0, 1838.0, 640.0, 285.0, 139.0, 73.0, 50.0, 28.0, 9.0, 18.0, 11.0, 3.0, 5.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-381.75, -372.517578125, -363.28515625, -354.052734375, -344.8203125, -335.587890625, -326.35546875, -317.123046875, -307.890625, -298.658203125, -289.42578125, -280.193359375, -270.9609375, -261.728515625, -252.49609375, -243.263671875, -234.03125, -224.798828125, -215.56640625, -206.333984375, -197.1015625, -187.869140625, -178.63671875, -169.404296875, -160.171875, -150.939453125, -141.70703125, -132.474609375, -123.2421875, -114.009765625, -104.77734375, -95.544921875, -86.3125, -77.080078125, -67.84765625, -58.615234375, -49.3828125, -40.150390625, -30.91796875, -21.685546875, -12.453125, -3.220703125, 6.01171875, 15.244140625, 24.4765625, 33.708984375, 42.94140625, 52.173828125, 61.40625, 70.638671875, 79.87109375, 89.103515625, 98.3359375, 107.568359375, 116.80078125, 126.033203125, 135.265625, 144.498046875, 153.73046875, 162.962890625, 172.1953125, 181.427734375, 190.66015625, 199.892578125, 209.125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 4.0, 7.0, 5.0, 7.0, 9.0, 9.0, 12.0, 18.0, 13.0, 16.0, 24.0, 24.0, 25.0, 34.0, 30.0, 31.0, 52.0, 49.0, 64.0, 63.0, 59.0, 47.0, 56.0, 50.0, 38.0, 48.0, 49.0, 25.0, 17.0, 18.0, 13.0, 17.0, 11.0, 9.0, 11.0, 7.0, 9.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-227.125, -219.9453125, -212.765625, -205.5859375, -198.40625, -191.2265625, -184.046875, -176.8671875, -169.6875, -162.5078125, -155.328125, -148.1484375, -140.96875, -133.7890625, -126.609375, -119.4296875, -112.25, -105.0703125, -97.890625, -90.7109375, -83.53125, -76.3515625, -69.171875, -61.9921875, -54.8125, -47.6328125, -40.453125, -33.2734375, -26.09375, -18.9140625, -11.734375, -4.5546875, 2.625, 9.8046875, 16.984375, 24.1640625, 31.34375, 38.5234375, 45.703125, 52.8828125, 60.0625, 67.2421875, 74.421875, 81.6015625, 88.78125, 95.9609375, 103.140625, 110.3203125, 117.5, 124.6796875, 131.859375, 139.0390625, 146.21875, 153.3984375, 160.578125, 167.7578125, 174.9375, 182.1171875, 189.296875, 196.4765625, 203.65625, 210.8359375, 218.015625, 225.1953125, 232.375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 10.0, 6.0, 7.0, 16.0, 19.0, 30.0, 58.0, 83.0, 151.0, 315.0, 675.0, 1702.0, 5611.0, 29606.0, 331265.0, 629488.0, 39292.0, 6786.0, 1887.0, 755.0, 340.0, 191.0, 101.0, 55.0, 36.0, 20.0, 12.0, 10.0, 9.0, 2.0, 6.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-80.0, -77.71875, -75.4375, -73.15625, -70.875, -68.59375, -66.3125, -64.03125, -61.75, -59.46875, -57.1875, -54.90625, -52.625, -50.34375, -48.0625, -45.78125, -43.5, -41.21875, -38.9375, -36.65625, -34.375, -32.09375, -29.8125, -27.53125, -25.25, -22.96875, -20.6875, -18.40625, -16.125, -13.84375, -11.5625, -9.28125, -7.0, -4.71875, -2.4375, -0.15625, 2.125, 4.40625, 6.6875, 8.96875, 11.25, 13.53125, 15.8125, 18.09375, 20.375, 22.65625, 24.9375, 27.21875, 29.5, 31.78125, 34.0625, 36.34375, 38.625, 40.90625, 43.1875, 45.46875, 47.75, 50.03125, 52.3125, 54.59375, 56.875, 59.15625, 61.4375, 63.71875, 66.0]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 6.0, 5.0, 5.0, 6.0, 11.0, 16.0, 23.0, 47.0, 49.0, 110.0, 168.0, 180.0, 121.0, 94.0, 43.0, 28.0, 22.0, 17.0, 14.0, 11.0, 8.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.015106201171875, -0.014590740203857422, -0.014075279235839844, -0.013559818267822266, -0.013044357299804688, -0.01252889633178711, -0.012013435363769531, -0.011497974395751953, -0.010982513427734375, -0.010467052459716797, -0.009951591491699219, -0.00943613052368164, -0.008920669555664062, -0.008405208587646484, -0.007889747619628906, -0.007374286651611328, -0.00685882568359375, -0.006343364715576172, -0.005827903747558594, -0.005312442779541016, -0.0047969818115234375, -0.004281520843505859, -0.0037660598754882812, -0.003250598907470703, -0.002735137939453125, -0.002219676971435547, -0.0017042160034179688, -0.0011887550354003906, -0.0006732940673828125, -0.00015783309936523438, 0.00035762786865234375, 0.0008730888366699219, 0.0013885498046875, 0.0019040107727050781, 0.0024194717407226562, 0.0029349327087402344, 0.0034503936767578125, 0.003965854644775391, 0.004481315612792969, 0.004996776580810547, 0.005512237548828125, 0.006027698516845703, 0.006543159484863281, 0.007058620452880859, 0.0075740814208984375, 0.008089542388916016, 0.008605003356933594, 0.009120464324951172, 0.00963592529296875, 0.010151386260986328, 0.010666847229003906, 0.011182308197021484, 0.011697769165039062, 0.01221323013305664, 0.012728691101074219, 0.013244152069091797, 0.013759613037109375, 0.014275074005126953, 0.014790534973144531, 0.01530599594116211, 0.015821456909179688, 0.016336917877197266, 0.016852378845214844, 0.017367839813232422, 0.01788330078125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 4.0, 5.0, 6.0, 5.0, 11.0, 11.0, 17.0, 26.0, 30.0, 54.0, 59.0, 82.0, 129.0, 203.0, 324.0, 564.0, 1113.0, 2346.0, 5480.0, 16195.0, 66806.0, 536829.0, 335770.0, 57693.0, 14831.0, 5268.0, 2260.0, 994.0, 572.0, 332.0, 163.0, 123.0, 74.0, 41.0, 44.0, 21.0, 21.0, 13.0, 13.0, 10.0, 11.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.03125, -47.39453125, -45.7578125, -44.12109375, -42.484375, -40.84765625, -39.2109375, -37.57421875, -35.9375, -34.30078125, -32.6640625, -31.02734375, -29.390625, -27.75390625, -26.1171875, -24.48046875, -22.84375, -21.20703125, -19.5703125, -17.93359375, -16.296875, -14.66015625, -13.0234375, -11.38671875, -9.75, -8.11328125, -6.4765625, -4.83984375, -3.203125, -1.56640625, 0.0703125, 1.70703125, 3.34375, 4.98046875, 6.6171875, 8.25390625, 9.890625, 11.52734375, 13.1640625, 14.80078125, 16.4375, 18.07421875, 19.7109375, 21.34765625, 22.984375, 24.62109375, 26.2578125, 27.89453125, 29.53125, 31.16796875, 32.8046875, 34.44140625, 36.078125, 37.71484375, 39.3515625, 40.98828125, 42.625, 44.26171875, 45.8984375, 47.53515625, 49.171875, 50.80859375, 52.4453125, 54.08203125, 55.71875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 4.0, 3.0, 4.0, 4.0, 5.0, 9.0, 8.0, 9.0, 16.0, 11.0, 26.0, 34.0, 59.0, 72.0, 86.0, 100.0, 81.0, 115.0, 95.0, 56.0, 70.0, 44.0, 29.0, 19.0, 15.0, 9.0, 6.0, 5.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.15625, -48.19384765625, -46.2314453125, -44.26904296875, -42.306640625, -40.34423828125, -38.3818359375, -36.41943359375, -34.45703125, -32.49462890625, -30.5322265625, -28.56982421875, -26.607421875, -24.64501953125, -22.6826171875, -20.72021484375, -18.7578125, -16.79541015625, -14.8330078125, -12.87060546875, -10.908203125, -8.94580078125, -6.9833984375, -5.02099609375, -3.05859375, -1.09619140625, 0.8662109375, 2.82861328125, 4.791015625, 6.75341796875, 8.7158203125, 10.67822265625, 12.640625, 14.60302734375, 16.5654296875, 18.52783203125, 20.490234375, 22.45263671875, 24.4150390625, 26.37744140625, 28.33984375, 30.30224609375, 32.2646484375, 34.22705078125, 36.189453125, 38.15185546875, 40.1142578125, 42.07666015625, 44.0390625, 46.00146484375, 47.9638671875, 49.92626953125, 51.888671875, 53.85107421875, 55.8134765625, 57.77587890625, 59.73828125, 61.70068359375, 63.6630859375, 65.62548828125, 67.587890625, 69.55029296875, 71.5126953125, 73.47509765625, 75.4375]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 4.0, 17.0, 16.0, 27.0, 80.0, 146.0, 318.0, 213.0, 91.0, 39.0, 22.0, 13.0, 8.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2009.111083984375, -1955.80322265625, -1902.495361328125, -1849.1876220703125, -1795.8797607421875, -1742.5718994140625, -1689.2640380859375, -1635.956298828125, -1582.6484375, -1529.340576171875, -1476.03271484375, -1422.7249755859375, -1369.4171142578125, -1316.1092529296875, -1262.8013916015625, -1209.49365234375, -1156.185791015625, -1102.8779296875, -1049.570068359375, -996.2622680664062, -942.9544677734375, -889.6466064453125, -836.3387451171875, -783.0309448242188, -729.7230224609375, -676.4151611328125, -623.1073608398438, -569.7994995117188, -516.49169921875, -463.183837890625, -409.8760070800781, -356.56817626953125, -303.2603759765625, -249.95254516601562, -196.64471435546875, -143.3368682861328, -90.02903747558594, -36.72119140625, 16.586639404296875, 69.89447021484375, 123.20230102539062, 176.5101318359375, 229.81796264648438, 283.12579345703125, 336.43365478515625, 389.7414855957031, 443.04931640625, 496.3571472167969, 549.6649780273438, 602.9728393554688, 656.2806396484375, 709.5885009765625, 762.8963012695312, 816.2041625976562, 869.511962890625, 922.81982421875, 976.127685546875, 1029.435546875, 1082.743408203125, 1136.0511474609375, 1189.3590087890625, 1242.6668701171875, 1295.9747314453125, 1349.282470703125, 1402.59033203125]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 7.0, 5.0, 3.0, 8.0, 6.0, 12.0, 9.0, 16.0, 14.0, 22.0, 25.0, 26.0, 25.0, 31.0, 34.0, 38.0, 52.0, 52.0, 82.0, 76.0, 84.0, 53.0, 54.0, 36.0, 37.0, 23.0, 18.0, 26.0, 25.0, 20.0, 13.0, 16.0, 16.0, 7.0, 11.0, 8.0, 2.0, 3.0, 4.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-913.4935302734375, -883.3871459960938, -853.28076171875, -823.17431640625, -793.0679321289062, -762.9615478515625, -732.8551635742188, -702.748779296875, -672.642333984375, -642.5359497070312, -612.4295654296875, -582.3231201171875, -552.2167358398438, -522.1103515625, -492.00396728515625, -461.8975830078125, -431.79119873046875, -401.684814453125, -371.5783996582031, -341.4720153808594, -311.3656005859375, -281.25921630859375, -251.15283203125, -221.0464324951172, -190.94003295898438, -160.83363342285156, -130.72723388671875, -100.620849609375, -70.51445007324219, -40.408050537109375, -10.301666259765625, 19.804733276367188, 49.9111328125, 80.01753234863281, 110.1239242553711, 140.23031616210938, 170.3367156982422, 200.443115234375, 230.54949951171875, 260.6558837890625, 290.7622985839844, 320.8686828613281, 350.97509765625, 381.08148193359375, 411.1878662109375, 441.2942810058594, 471.4006652832031, 501.507080078125, 531.6134643554688, 561.7198486328125, 591.8262329101562, 621.9326171875, 652.0390625, 682.1454467773438, 712.2518310546875, 742.3582153320312, 772.464599609375, 802.5709838867188, 832.6773681640625, 862.7838134765625, 892.8901977539062, 922.99658203125, 953.1029663085938, 983.2093505859375, 1013.3157958984375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 5.0, 10.0, 10.0, 14.0, 11.0, 38.0, 54.0, 86.0, 155.0, 232.0, 471.0, 846.0, 1757.0, 3864.0, 10192.0, 45879.0, 395812.0, 2592667.0, 998590.0, 112854.0, 19645.0, 6151.0, 2494.0, 1182.0, 585.0, 296.0, 158.0, 99.0, 52.0, 27.0, 12.0, 11.0, 10.0, 3.0, 1.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-93.5625, -90.9423828125, -88.322265625, -85.7021484375, -83.08203125, -80.4619140625, -77.841796875, -75.2216796875, -72.6015625, -69.9814453125, -67.361328125, -64.7412109375, -62.12109375, -59.5009765625, -56.880859375, -54.2607421875, -51.640625, -49.0205078125, -46.400390625, -43.7802734375, -41.16015625, -38.5400390625, -35.919921875, -33.2998046875, -30.6796875, -28.0595703125, -25.439453125, -22.8193359375, -20.19921875, -17.5791015625, -14.958984375, -12.3388671875, -9.71875, -7.0986328125, -4.478515625, -1.8583984375, 0.76171875, 3.3818359375, 6.001953125, 8.6220703125, 11.2421875, 13.8623046875, 16.482421875, 19.1025390625, 21.72265625, 24.3427734375, 26.962890625, 29.5830078125, 32.203125, 34.8232421875, 37.443359375, 40.0634765625, 42.68359375, 45.3037109375, 47.923828125, 50.5439453125, 53.1640625, 55.7841796875, 58.404296875, 61.0244140625, 63.64453125, 66.2646484375, 68.884765625, 71.5048828125, 74.125]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 3.0, 6.0, 3.0, 6.0, 7.0, 12.0, 15.0, 10.0, 18.0, 15.0, 15.0, 21.0, 17.0, 34.0, 23.0, 33.0, 34.0, 49.0, 36.0, 43.0, 40.0, 51.0, 41.0, 61.0, 36.0, 45.0, 48.0, 32.0, 40.0, 26.0, 25.0, 26.0, 22.0, 14.0, 17.0, 10.0, 11.0, 11.0, 14.0, 5.0, 12.0, 2.0, 6.0, 5.0, 0.0, 3.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-60.28125, -58.5078125, -56.734375, -54.9609375, -53.1875, -51.4140625, -49.640625, -47.8671875, -46.09375, -44.3203125, -42.546875, -40.7734375, -39.0, -37.2265625, -35.453125, -33.6796875, -31.90625, -30.1328125, -28.359375, -26.5859375, -24.8125, -23.0390625, -21.265625, -19.4921875, -17.71875, -15.9453125, -14.171875, -12.3984375, -10.625, -8.8515625, -7.078125, -5.3046875, -3.53125, -1.7578125, 0.015625, 1.7890625, 3.5625, 5.3359375, 7.109375, 8.8828125, 10.65625, 12.4296875, 14.203125, 15.9765625, 17.75, 19.5234375, 21.296875, 23.0703125, 24.84375, 26.6171875, 28.390625, 30.1640625, 31.9375, 33.7109375, 35.484375, 37.2578125, 39.03125, 40.8046875, 42.578125, 44.3515625, 46.125, 47.8984375, 49.671875, 51.4453125, 53.21875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 4.0, 0.0, 4.0, 6.0, 3.0, 7.0, 15.0, 23.0, 16.0, 31.0, 45.0, 89.0, 146.0, 312.0, 953.0, 3178.0, 16067.0, 188442.0, 3815420.0, 150702.0, 14228.0, 2944.0, 867.0, 355.0, 166.0, 88.0, 47.0, 27.0, 23.0, 22.0, 16.0, 5.0, 6.0, 7.0, 3.0, 5.0, 4.0, 0.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-183.25, -176.8125, -170.375, -163.9375, -157.5, -151.0625, -144.625, -138.1875, -131.75, -125.3125, -118.875, -112.4375, -106.0, -99.5625, -93.125, -86.6875, -80.25, -73.8125, -67.375, -60.9375, -54.5, -48.0625, -41.625, -35.1875, -28.75, -22.3125, -15.875, -9.4375, -3.0, 3.4375, 9.875, 16.3125, 22.75, 29.1875, 35.625, 42.0625, 48.5, 54.9375, 61.375, 67.8125, 74.25, 80.6875, 87.125, 93.5625, 100.0, 106.4375, 112.875, 119.3125, 125.75, 132.1875, 138.625, 145.0625, 151.5, 157.9375, 164.375, 170.8125, 177.25, 183.6875, 190.125, 196.5625, 203.0, 209.4375, 215.875, 222.3125, 228.75]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 7.0, 5.0, 12.0, 15.0, 20.0, 24.0, 24.0, 41.0, 69.0, 99.0, 175.0, 288.0, 527.0, 751.0, 751.0, 491.0, 294.0, 148.0, 82.0, 56.0, 52.0, 42.0, 17.0, 21.0, 13.0, 10.0, 10.0, 3.0, 6.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-112.625, -108.26953125, -103.9140625, -99.55859375, -95.203125, -90.84765625, -86.4921875, -82.13671875, -77.78125, -73.42578125, -69.0703125, -64.71484375, -60.359375, -56.00390625, -51.6484375, -47.29296875, -42.9375, -38.58203125, -34.2265625, -29.87109375, -25.515625, -21.16015625, -16.8046875, -12.44921875, -8.09375, -3.73828125, 0.6171875, 4.97265625, 9.328125, 13.68359375, 18.0390625, 22.39453125, 26.75, 31.10546875, 35.4609375, 39.81640625, 44.171875, 48.52734375, 52.8828125, 57.23828125, 61.59375, 65.94921875, 70.3046875, 74.66015625, 79.015625, 83.37109375, 87.7265625, 92.08203125, 96.4375, 100.79296875, 105.1484375, 109.50390625, 113.859375, 118.21484375, 122.5703125, 126.92578125, 131.28125, 135.63671875, 139.9921875, 144.34765625, 148.703125, 153.05859375, 157.4140625, 161.76953125, 166.125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 10.0, 16.0, 30.0, 64.0, 145.0, 192.0, 200.0, 147.0, 87.0, 41.0, 26.0, 12.0, 11.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1111.638671875, -1070.3480224609375, -1029.0574951171875, -987.7669067382812, -946.476318359375, -905.1856689453125, -863.8950805664062, -822.6044921875, -781.3139038085938, -740.0233154296875, -698.7327270507812, -657.442138671875, -616.1514892578125, -574.8609619140625, -533.5703125, -492.27972412109375, -450.9891357421875, -409.69854736328125, -368.407958984375, -327.1173400878906, -285.8267517089844, -244.53616333007812, -203.2455596923828, -161.9549560546875, -120.66436767578125, -79.37377166748047, -38.08317565917969, 3.2074203491210938, 44.498016357421875, 85.78860473632812, 127.07920837402344, 168.36981201171875, 209.660400390625, 250.95098876953125, 292.2415771484375, 333.5321960449219, 374.8227844238281, 416.1133728027344, 457.40399169921875, 498.694580078125, 539.9851684570312, 581.2757568359375, 622.5663452148438, 663.85693359375, 705.1475830078125, 746.4381103515625, 787.728759765625, 829.0193481445312, 870.3099365234375, 911.6005249023438, 952.89111328125, 994.1817016601562, 1035.4722900390625, 1076.762939453125, 1118.053466796875, 1159.3441162109375, 1200.634765625, 1241.9254150390625, 1283.2159423828125, 1324.506591796875, 1365.797119140625, 1407.0877685546875, 1448.3782958984375, 1489.6689453125, 1530.95947265625]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 9.0, 13.0, 4.0, 5.0, 11.0, 8.0, 12.0, 16.0, 19.0, 28.0, 33.0, 36.0, 36.0, 34.0, 39.0, 31.0, 37.0, 35.0, 42.0, 41.0, 38.0, 37.0, 42.0, 37.0, 37.0, 31.0, 26.0, 39.0, 31.0, 23.0, 30.0, 17.0, 19.0, 23.0, 15.0, 15.0, 13.0, 8.0, 6.0, 7.0, 7.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-506.08447265625, -489.6415100097656, -473.19854736328125, -456.7555847167969, -440.3126220703125, -423.86968994140625, -407.4267272949219, -390.9837646484375, -374.5408020019531, -358.09783935546875, -341.6548767089844, -325.2119140625, -308.76898193359375, -292.32598876953125, -275.883056640625, -259.4400939941406, -242.99713134765625, -226.55416870117188, -210.1112060546875, -193.6682586669922, -177.2252960205078, -160.78233337402344, -144.33938598632812, -127.89642333984375, -111.45346069335938, -95.010498046875, -78.56754302978516, -62.12458419799805, -45.68162536621094, -29.238662719726562, -12.795707702636719, 3.647247314453125, 20.0902099609375, 36.53316879272461, 52.97612762451172, 69.41908264160156, 85.86204528808594, 102.30500793457031, 118.74796295166016, 135.19091796875, 151.63388061523438, 168.07684326171875, 184.51980590820312, 200.96275329589844, 217.4057159423828, 233.8486785888672, 250.2916259765625, 266.7345886230469, 283.17755126953125, 299.6205139160156, 316.0634765625, 332.5064392089844, 348.94940185546875, 365.392333984375, 381.8352966308594, 398.27825927734375, 414.7212219238281, 431.1641845703125, 447.6071472167969, 464.05010986328125, 480.4930419921875, 496.93603515625, 513.3789672851562, 529.8218994140625, 546.264892578125]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 7.0, 4.0, 5.0, 9.0, 13.0, 16.0, 29.0, 57.0, 63.0, 130.0, 272.0, 534.0, 1300.0, 3437.0, 12011.0, 51760.0, 288765.0, 540372.0, 116488.0, 23471.0, 6175.0, 2025.0, 812.0, 364.0, 187.0, 96.0, 57.0, 36.0, 25.0, 19.0, 6.0, 6.0, 4.0, 3.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-144.125, -139.51171875, -134.8984375, -130.28515625, -125.671875, -121.05859375, -116.4453125, -111.83203125, -107.21875, -102.60546875, -97.9921875, -93.37890625, -88.765625, -84.15234375, -79.5390625, -74.92578125, -70.3125, -65.69921875, -61.0859375, -56.47265625, -51.859375, -47.24609375, -42.6328125, -38.01953125, -33.40625, -28.79296875, -24.1796875, -19.56640625, -14.953125, -10.33984375, -5.7265625, -1.11328125, 3.5, 8.11328125, 12.7265625, 17.33984375, 21.953125, 26.56640625, 31.1796875, 35.79296875, 40.40625, 45.01953125, 49.6328125, 54.24609375, 58.859375, 63.47265625, 68.0859375, 72.69921875, 77.3125, 81.92578125, 86.5390625, 91.15234375, 95.765625, 100.37890625, 104.9921875, 109.60546875, 114.21875, 118.83203125, 123.4453125, 128.05859375, 132.671875, 137.28515625, 141.8984375, 146.51171875, 151.125]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 4.0, 8.0, 6.0, 7.0, 8.0, 11.0, 10.0, 14.0, 17.0, 17.0, 24.0, 29.0, 20.0, 31.0, 36.0, 33.0, 37.0, 37.0, 50.0, 48.0, 42.0, 38.0, 61.0, 44.0, 32.0, 37.0, 44.0, 37.0, 30.0, 34.0, 20.0, 18.0, 17.0, 17.0, 16.0, 14.0, 16.0, 10.0, 4.0, 5.0, 5.0, 4.0, 3.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.09375, -54.29736328125, -52.5009765625, -50.70458984375, -48.908203125, -47.11181640625, -45.3154296875, -43.51904296875, -41.72265625, -39.92626953125, -38.1298828125, -36.33349609375, -34.537109375, -32.74072265625, -30.9443359375, -29.14794921875, -27.3515625, -25.55517578125, -23.7587890625, -21.96240234375, -20.166015625, -18.36962890625, -16.5732421875, -14.77685546875, -12.98046875, -11.18408203125, -9.3876953125, -7.59130859375, -5.794921875, -3.99853515625, -2.2021484375, -0.40576171875, 1.390625, 3.18701171875, 4.9833984375, 6.77978515625, 8.576171875, 10.37255859375, 12.1689453125, 13.96533203125, 15.76171875, 17.55810546875, 19.3544921875, 21.15087890625, 22.947265625, 24.74365234375, 26.5400390625, 28.33642578125, 30.1328125, 31.92919921875, 33.7255859375, 35.52197265625, 37.318359375, 39.11474609375, 40.9111328125, 42.70751953125, 44.50390625, 46.30029296875, 48.0966796875, 49.89306640625, 51.689453125, 53.48583984375, 55.2822265625, 57.07861328125, 58.875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 7.0, 10.0, 12.0, 21.0, 26.0, 44.0, 67.0, 111.0, 212.0, 360.0, 801.0, 1833.0, 5904.0, 35440.0, 700319.0, 274324.0, 22023.0, 4162.0, 1355.0, 650.0, 322.0, 203.0, 121.0, 81.0, 50.0, 33.0, 21.0, 14.0, 6.0, 9.0, 7.0, 2.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-227.25, -219.3828125, -211.515625, -203.6484375, -195.78125, -187.9140625, -180.046875, -172.1796875, -164.3125, -156.4453125, -148.578125, -140.7109375, -132.84375, -124.9765625, -117.109375, -109.2421875, -101.375, -93.5078125, -85.640625, -77.7734375, -69.90625, -62.0390625, -54.171875, -46.3046875, -38.4375, -30.5703125, -22.703125, -14.8359375, -6.96875, 0.8984375, 8.765625, 16.6328125, 24.5, 32.3671875, 40.234375, 48.1015625, 55.96875, 63.8359375, 71.703125, 79.5703125, 87.4375, 95.3046875, 103.171875, 111.0390625, 118.90625, 126.7734375, 134.640625, 142.5078125, 150.375, 158.2421875, 166.109375, 173.9765625, 181.84375, 189.7109375, 197.578125, 205.4453125, 213.3125, 221.1796875, 229.046875, 236.9140625, 244.78125, 252.6484375, 260.515625, 268.3828125, 276.25]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 7.0, 2.0, 6.0, 7.0, 10.0, 11.0, 14.0, 19.0, 30.0, 23.0, 25.0, 41.0, 40.0, 28.0, 42.0, 38.0, 56.0, 54.0, 52.0, 38.0, 50.0, 52.0, 49.0, 50.0, 39.0, 32.0, 34.0, 16.0, 17.0, 19.0, 18.0, 17.0, 11.0, 11.0, 6.0, 8.0, 6.0, 6.0, 3.0, 6.0, 2.0, 0.0, 5.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-197.625, -190.576171875, -183.52734375, -176.478515625, -169.4296875, -162.380859375, -155.33203125, -148.283203125, -141.234375, -134.185546875, -127.13671875, -120.087890625, -113.0390625, -105.990234375, -98.94140625, -91.892578125, -84.84375, -77.794921875, -70.74609375, -63.697265625, -56.6484375, -49.599609375, -42.55078125, -35.501953125, -28.453125, -21.404296875, -14.35546875, -7.306640625, -0.2578125, 6.791015625, 13.83984375, 20.888671875, 27.9375, 34.986328125, 42.03515625, 49.083984375, 56.1328125, 63.181640625, 70.23046875, 77.279296875, 84.328125, 91.376953125, 98.42578125, 105.474609375, 112.5234375, 119.572265625, 126.62109375, 133.669921875, 140.71875, 147.767578125, 154.81640625, 161.865234375, 168.9140625, 175.962890625, 183.01171875, 190.060546875, 197.109375, 204.158203125, 211.20703125, 218.255859375, 225.3046875, 232.353515625, 239.40234375, 246.451171875, 253.5]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 3.0, 6.0, 8.0, 18.0, 16.0, 26.0, 46.0, 62.0, 108.0, 213.0, 347.0, 668.0, 1275.0, 3267.0, 9882.0, 42181.0, 689741.0, 258432.0, 29337.0, 7676.0, 2698.0, 1168.0, 547.0, 316.0, 192.0, 120.0, 65.0, 36.0, 30.0, 20.0, 14.0, 8.0, 6.0, 8.0, 6.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.90625, -53.1845703125, -51.462890625, -49.7412109375, -48.01953125, -46.2978515625, -44.576171875, -42.8544921875, -41.1328125, -39.4111328125, -37.689453125, -35.9677734375, -34.24609375, -32.5244140625, -30.802734375, -29.0810546875, -27.359375, -25.6376953125, -23.916015625, -22.1943359375, -20.47265625, -18.7509765625, -17.029296875, -15.3076171875, -13.5859375, -11.8642578125, -10.142578125, -8.4208984375, -6.69921875, -4.9775390625, -3.255859375, -1.5341796875, 0.1875, 1.9091796875, 3.630859375, 5.3525390625, 7.07421875, 8.7958984375, 10.517578125, 12.2392578125, 13.9609375, 15.6826171875, 17.404296875, 19.1259765625, 20.84765625, 22.5693359375, 24.291015625, 26.0126953125, 27.734375, 29.4560546875, 31.177734375, 32.8994140625, 34.62109375, 36.3427734375, 38.064453125, 39.7861328125, 41.5078125, 43.2294921875, 44.951171875, 46.6728515625, 48.39453125, 50.1162109375, 51.837890625, 53.5595703125, 55.28125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 1.0, 0.0, 1.0, 3.0, 5.0, 3.0, 3.0, 4.0, 6.0, 9.0, 11.0, 20.0, 18.0, 42.0, 50.0, 121.0, 223.0, 210.0, 104.0, 53.0, 32.0, 19.0, 17.0, 8.0, 13.0, 2.0, 3.0, 8.0, 0.0, 2.0, 3.0, 4.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.01727294921875, -0.01674938201904297, -0.016225814819335938, -0.015702247619628906, -0.015178680419921875, -0.014655113220214844, -0.014131546020507812, -0.013607978820800781, -0.01308441162109375, -0.012560844421386719, -0.012037277221679688, -0.011513710021972656, -0.010990142822265625, -0.010466575622558594, -0.009943008422851562, -0.009419441223144531, -0.0088958740234375, -0.008372306823730469, -0.007848739624023438, -0.007325172424316406, -0.006801605224609375, -0.006278038024902344, -0.0057544708251953125, -0.005230903625488281, -0.00470733642578125, -0.004183769226074219, -0.0036602020263671875, -0.0031366348266601562, -0.002613067626953125, -0.0020895004272460938, -0.0015659332275390625, -0.0010423660278320312, -0.000518798828125, 4.76837158203125e-06, 0.0005283355712890625, 0.0010519027709960938, 0.001575469970703125, 0.0020990371704101562, 0.0026226043701171875, 0.0031461715698242188, 0.00366973876953125, 0.004193305969238281, 0.0047168731689453125, 0.005240440368652344, 0.005764007568359375, 0.006287574768066406, 0.0068111419677734375, 0.007334709167480469, 0.0078582763671875, 0.008381843566894531, 0.008905410766601562, 0.009428977966308594, 0.009952545166015625, 0.010476112365722656, 0.010999679565429688, 0.011523246765136719, 0.01204681396484375, 0.012570381164550781, 0.013093948364257812, 0.013617515563964844, 0.014141082763671875, 0.014664649963378906, 0.015188217163085938, 0.01571178436279297, 0.0162353515625]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 4.0, 7.0, 3.0, 7.0, 16.0, 22.0, 35.0, 44.0, 60.0, 116.0, 202.0, 387.0, 867.0, 1828.0, 5304.0, 20580.0, 138853.0, 786717.0, 73264.0, 13501.0, 3836.0, 1452.0, 649.0, 314.0, 184.0, 108.0, 59.0, 40.0, 34.0, 19.0, 14.0, 10.0, 5.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.3125, -51.6123046875, -49.912109375, -48.2119140625, -46.51171875, -44.8115234375, -43.111328125, -41.4111328125, -39.7109375, -38.0107421875, -36.310546875, -34.6103515625, -32.91015625, -31.2099609375, -29.509765625, -27.8095703125, -26.109375, -24.4091796875, -22.708984375, -21.0087890625, -19.30859375, -17.6083984375, -15.908203125, -14.2080078125, -12.5078125, -10.8076171875, -9.107421875, -7.4072265625, -5.70703125, -4.0068359375, -2.306640625, -0.6064453125, 1.09375, 2.7939453125, 4.494140625, 6.1943359375, 7.89453125, 9.5947265625, 11.294921875, 12.9951171875, 14.6953125, 16.3955078125, 18.095703125, 19.7958984375, 21.49609375, 23.1962890625, 24.896484375, 26.5966796875, 28.296875, 29.9970703125, 31.697265625, 33.3974609375, 35.09765625, 36.7978515625, 38.498046875, 40.1982421875, 41.8984375, 43.5986328125, 45.298828125, 46.9990234375, 48.69921875, 50.3994140625, 52.099609375, 53.7998046875, 55.5]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 5.0, 4.0, 6.0, 5.0, 7.0, 13.0, 6.0, 12.0, 14.0, 19.0, 27.0, 37.0, 34.0, 59.0, 81.0, 116.0, 101.0, 120.0, 75.0, 56.0, 48.0, 27.0, 30.0, 21.0, 15.0, 21.0, 16.0, 9.0, 9.0, 2.0, 5.0, 1.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-54.625, -53.277099609375, -51.92919921875, -50.581298828125, -49.2333984375, -47.885498046875, -46.53759765625, -45.189697265625, -43.841796875, -42.493896484375, -41.14599609375, -39.798095703125, -38.4501953125, -37.102294921875, -35.75439453125, -34.406494140625, -33.05859375, -31.710693359375, -30.36279296875, -29.014892578125, -27.6669921875, -26.319091796875, -24.97119140625, -23.623291015625, -22.275390625, -20.927490234375, -19.57958984375, -18.231689453125, -16.8837890625, -15.535888671875, -14.18798828125, -12.840087890625, -11.4921875, -10.144287109375, -8.79638671875, -7.448486328125, -6.1005859375, -4.752685546875, -3.40478515625, -2.056884765625, -0.708984375, 0.638916015625, 1.98681640625, 3.334716796875, 4.6826171875, 6.030517578125, 7.37841796875, 8.726318359375, 10.07421875, 11.422119140625, 12.77001953125, 14.117919921875, 15.4658203125, 16.813720703125, 18.16162109375, 19.509521484375, 20.857421875, 22.205322265625, 23.55322265625, 24.901123046875, 26.2490234375, 27.596923828125, 28.94482421875, 30.292724609375, 31.640625]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 7.0, 4.0, 3.0, 1.0, 19.0, 35.0, 49.0, 116.0, 332.0, 274.0, 98.0, 38.0, 16.0, 4.0, 3.0, 6.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1098.8272705078125, -1046.491455078125, -994.1556396484375, -941.81982421875, -889.4840087890625, -837.148193359375, -784.8123168945312, -732.4765014648438, -680.1406860351562, -627.8048706054688, -575.4690551757812, -523.1331787109375, -470.7973937988281, -418.4615783691406, -366.125732421875, -313.7899169921875, -261.4541015625, -209.1182861328125, -156.78245544433594, -104.44662475585938, -52.110809326171875, 0.225006103515625, 52.56085205078125, 104.89666748046875, 157.23248291015625, 209.56829833984375, 261.90411376953125, 314.2399597167969, 366.5757751464844, 418.9115905761719, 471.2474365234375, 523.583251953125, 575.9189453125, 628.2547607421875, 680.590576171875, 732.9263916015625, 785.26220703125, 837.5980224609375, 889.9338989257812, 942.2697143554688, 994.6055297851562, 1046.94140625, 1099.2772216796875, 1151.613037109375, 1203.9488525390625, 1256.28466796875, 1308.6204833984375, 1360.956298828125, 1413.2921142578125, 1465.6279296875, 1517.9637451171875, 1570.299560546875, 1622.6353759765625, 1674.97119140625, 1727.30712890625, 1779.642822265625, 1831.978759765625, 1884.3145751953125, 1936.650390625, 1988.9862060546875, 2041.322021484375, 2093.657958984375, 2145.99365234375, 2198.32958984375, 2250.665283203125]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 2.0, 7.0, 5.0, 8.0, 6.0, 7.0, 11.0, 16.0, 10.0, 18.0, 23.0, 16.0, 24.0, 27.0, 27.0, 39.0, 49.0, 52.0, 84.0, 112.0, 92.0, 56.0, 39.0, 41.0, 39.0, 26.0, 19.0, 21.0, 16.0, 16.0, 15.0, 8.0, 11.0, 13.0, 12.0, 6.0, 7.0, 6.0, 6.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-881.1434326171875, -854.0552368164062, -826.967041015625, -799.8787841796875, -772.7905883789062, -745.702392578125, -718.6141967773438, -691.5260009765625, -664.437744140625, -637.3495483398438, -610.2613525390625, -583.173095703125, -556.0848999023438, -528.9967041015625, -501.90850830078125, -474.8203125, -447.73211669921875, -420.6439208984375, -393.5556945800781, -366.4674987792969, -339.3792724609375, -312.29107666015625, -285.202880859375, -258.11468505859375, -231.02645874023438, -203.93824768066406, -176.85003662109375, -149.7618408203125, -122.67362976074219, -95.58541870117188, -68.49722290039062, -41.40901184082031, -14.32086181640625, 12.767345428466797, 39.855552673339844, 66.94375610351562, 94.03196716308594, 121.12017822265625, 148.2083740234375, 175.2965850830078, 202.38479614257812, 229.47300720214844, 256.56121826171875, 283.6494140625, 310.73760986328125, 337.8258361816406, 364.9140319824219, 392.00225830078125, 419.0904541015625, 446.17864990234375, 473.2668762207031, 500.3550720214844, 527.4432983398438, 554.531494140625, 581.6196899414062, 608.7078857421875, 635.796142578125, 662.8843383789062, 689.9725341796875, 717.060791015625, 744.1489868164062, 771.2371826171875, 798.3253784179688, 825.41357421875, 852.5017700195312]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 4.0, 3.0, 2.0, 7.0, 3.0, 7.0, 13.0, 15.0, 25.0, 42.0, 63.0, 112.0, 194.0, 373.0, 723.0, 1425.0, 3160.0, 8266.0, 32429.0, 364401.0, 2910989.0, 786680.0, 64928.0, 12673.0, 4154.0, 1831.0, 851.0, 436.0, 227.0, 107.0, 52.0, 35.0, 20.0, 10.0, 9.0, 5.0, 5.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-131.25, -127.853515625, -124.45703125, -121.060546875, -117.6640625, -114.267578125, -110.87109375, -107.474609375, -104.078125, -100.681640625, -97.28515625, -93.888671875, -90.4921875, -87.095703125, -83.69921875, -80.302734375, -76.90625, -73.509765625, -70.11328125, -66.716796875, -63.3203125, -59.923828125, -56.52734375, -53.130859375, -49.734375, -46.337890625, -42.94140625, -39.544921875, -36.1484375, -32.751953125, -29.35546875, -25.958984375, -22.5625, -19.166015625, -15.76953125, -12.373046875, -8.9765625, -5.580078125, -2.18359375, 1.212890625, 4.609375, 8.005859375, 11.40234375, 14.798828125, 18.1953125, 21.591796875, 24.98828125, 28.384765625, 31.78125, 35.177734375, 38.57421875, 41.970703125, 45.3671875, 48.763671875, 52.16015625, 55.556640625, 58.953125, 62.349609375, 65.74609375, 69.142578125, 72.5390625, 75.935546875, 79.33203125, 82.728515625, 86.125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 5.0, 5.0, 10.0, 14.0, 13.0, 13.0, 21.0, 24.0, 34.0, 26.0, 45.0, 48.0, 38.0, 56.0, 59.0, 49.0, 53.0, 60.0, 62.0, 59.0, 61.0, 47.0, 42.0, 31.0, 27.0, 23.0, 20.0, 11.0, 18.0, 5.0, 9.0, 4.0, 6.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-87.4375, -85.15625, -82.875, -80.59375, -78.3125, -76.03125, -73.75, -71.46875, -69.1875, -66.90625, -64.625, -62.34375, -60.0625, -57.78125, -55.5, -53.21875, -50.9375, -48.65625, -46.375, -44.09375, -41.8125, -39.53125, -37.25, -34.96875, -32.6875, -30.40625, -28.125, -25.84375, -23.5625, -21.28125, -19.0, -16.71875, -14.4375, -12.15625, -9.875, -7.59375, -5.3125, -3.03125, -0.75, 1.53125, 3.8125, 6.09375, 8.375, 10.65625, 12.9375, 15.21875, 17.5, 19.78125, 22.0625, 24.34375, 26.625, 28.90625, 31.1875, 33.46875, 35.75, 38.03125, 40.3125, 42.59375, 44.875, 47.15625, 49.4375, 51.71875, 54.0, 56.28125, 58.5625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 5.0, 1.0, 4.0, 5.0, 3.0, 4.0, 5.0, 5.0, 7.0, 8.0, 17.0, 9.0, 17.0, 35.0, 55.0, 83.0, 144.0, 337.0, 753.0, 2589.0, 11171.0, 96941.0, 3738537.0, 318050.0, 19620.0, 3857.0, 1136.0, 424.0, 175.0, 95.0, 46.0, 41.0, 21.0, 25.0, 10.0, 9.0, 12.0, 9.0, 5.0, 6.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-200.125, -193.8046875, -187.484375, -181.1640625, -174.84375, -168.5234375, -162.203125, -155.8828125, -149.5625, -143.2421875, -136.921875, -130.6015625, -124.28125, -117.9609375, -111.640625, -105.3203125, -99.0, -92.6796875, -86.359375, -80.0390625, -73.71875, -67.3984375, -61.078125, -54.7578125, -48.4375, -42.1171875, -35.796875, -29.4765625, -23.15625, -16.8359375, -10.515625, -4.1953125, 2.125, 8.4453125, 14.765625, 21.0859375, 27.40625, 33.7265625, 40.046875, 46.3671875, 52.6875, 59.0078125, 65.328125, 71.6484375, 77.96875, 84.2890625, 90.609375, 96.9296875, 103.25, 109.5703125, 115.890625, 122.2109375, 128.53125, 134.8515625, 141.171875, 147.4921875, 153.8125, 160.1328125, 166.453125, 172.7734375, 179.09375, 185.4140625, 191.734375, 198.0546875, 204.375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 6.0, 3.0, 9.0, 10.0, 9.0, 11.0, 20.0, 32.0, 33.0, 64.0, 74.0, 122.0, 195.0, 392.0, 597.0, 793.0, 691.0, 429.0, 212.0, 133.0, 71.0, 56.0, 31.0, 24.0, 11.0, 13.0, 10.0, 2.0, 5.0, 6.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-156.25, -151.439453125, -146.62890625, -141.818359375, -137.0078125, -132.197265625, -127.38671875, -122.576171875, -117.765625, -112.955078125, -108.14453125, -103.333984375, -98.5234375, -93.712890625, -88.90234375, -84.091796875, -79.28125, -74.470703125, -69.66015625, -64.849609375, -60.0390625, -55.228515625, -50.41796875, -45.607421875, -40.796875, -35.986328125, -31.17578125, -26.365234375, -21.5546875, -16.744140625, -11.93359375, -7.123046875, -2.3125, 2.498046875, 7.30859375, 12.119140625, 16.9296875, 21.740234375, 26.55078125, 31.361328125, 36.171875, 40.982421875, 45.79296875, 50.603515625, 55.4140625, 60.224609375, 65.03515625, 69.845703125, 74.65625, 79.466796875, 84.27734375, 89.087890625, 93.8984375, 98.708984375, 103.51953125, 108.330078125, 113.140625, 117.951171875, 122.76171875, 127.572265625, 132.3828125, 137.193359375, 142.00390625, 146.814453125, 151.625]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 1.0, 6.0, 23.0, 77.0, 362.0, 376.0, 111.0, 32.0, 14.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4510.78369140625, -4420.6982421875, -4330.61279296875, -4240.52734375, -4150.4423828125, -4060.35693359375, -3970.271484375, -3880.18603515625, -3790.1005859375, -3700.01513671875, -3609.929931640625, -3519.844482421875, -3429.759033203125, -3339.673828125, -3249.58837890625, -3159.5029296875, -3069.417724609375, -2979.332275390625, -2889.2470703125, -2799.16162109375, -2709.076171875, -2618.99072265625, -2528.905517578125, -2438.820068359375, -2348.73486328125, -2258.6494140625, -2168.564208984375, -2078.478759765625, -1988.393310546875, -1898.3079833984375, -1808.22265625, -1718.13720703125, -1628.051513671875, -1537.9661865234375, -1447.8807373046875, -1357.79541015625, -1267.7099609375, -1177.6246337890625, -1087.539306640625, -997.4539184570312, -907.3685302734375, -817.2831420898438, -727.19775390625, -637.1124267578125, -547.0270385742188, -456.941650390625, -366.8563232421875, -276.77093505859375, -186.685546875, -96.60017395019531, -6.514801025390625, 83.570556640625, 173.65594482421875, 263.7413330078125, 353.82666015625, 443.91204833984375, 533.9974365234375, 624.0828247070312, 714.168212890625, 804.2535400390625, 894.3389282226562, 984.42431640625, 1074.5096435546875, 1164.594970703125, 1254.680419921875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 3.0, 7.0, 7.0, 8.0, 13.0, 20.0, 13.0, 24.0, 28.0, 31.0, 37.0, 35.0, 38.0, 49.0, 41.0, 53.0, 50.0, 64.0, 57.0, 49.0, 57.0, 54.0, 29.0, 33.0, 33.0, 24.0, 31.0, 24.0, 15.0, 19.0, 11.0, 16.0, 6.0, 3.0, 5.0, 2.0, 0.0, 6.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-564.8651123046875, -544.4038696289062, -523.942626953125, -503.4814147949219, -483.0201721191406, -462.5589294433594, -442.09771728515625, -421.636474609375, -401.17523193359375, -380.7139892578125, -360.25274658203125, -339.7915344238281, -319.3302917480469, -298.8690490722656, -278.4078369140625, -257.94659423828125, -237.4853515625, -217.02410888671875, -196.56288146972656, -176.10165405273438, -155.64041137695312, -135.17916870117188, -114.71794128417969, -94.2567138671875, -73.79547119140625, -53.33423614501953, -32.87300109863281, -12.411766052246094, 8.049468994140625, 28.510704040527344, 48.97193908691406, 69.43316650390625, 89.8944091796875, 110.35564422607422, 130.81687927246094, 151.27810668945312, 171.73934936523438, 192.20059204101562, 212.6618194580078, 233.123046875, 253.58428955078125, 274.0455322265625, 294.50677490234375, 314.9679870605469, 335.4292297363281, 355.8904724121094, 376.3516845703125, 396.81292724609375, 417.274169921875, 437.73541259765625, 458.1966552734375, 478.6578674316406, 499.1191101074219, 519.580322265625, 540.0415649414062, 560.5028076171875, 580.9640502929688, 601.42529296875, 621.8865356445312, 642.3477783203125, 662.8089599609375, 683.2702026367188, 703.7314453125, 724.1926879882812, 744.6539306640625]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 4.0, 6.0, 5.0, 9.0, 10.0, 15.0, 28.0, 46.0, 61.0, 106.0, 219.0, 393.0, 796.0, 1699.0, 4117.0, 11294.0, 36617.0, 145186.0, 534059.0, 234216.0, 53998.0, 15869.0, 5525.0, 2217.0, 987.0, 465.0, 254.0, 118.0, 89.0, 48.0, 33.0, 23.0, 17.0, 9.0, 7.0, 11.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-159.625, -155.4951171875, -151.365234375, -147.2353515625, -143.10546875, -138.9755859375, -134.845703125, -130.7158203125, -126.5859375, -122.4560546875, -118.326171875, -114.1962890625, -110.06640625, -105.9365234375, -101.806640625, -97.6767578125, -93.546875, -89.4169921875, -85.287109375, -81.1572265625, -77.02734375, -72.8974609375, -68.767578125, -64.6376953125, -60.5078125, -56.3779296875, -52.248046875, -48.1181640625, -43.98828125, -39.8583984375, -35.728515625, -31.5986328125, -27.46875, -23.3388671875, -19.208984375, -15.0791015625, -10.94921875, -6.8193359375, -2.689453125, 1.4404296875, 5.5703125, 9.7001953125, 13.830078125, 17.9599609375, 22.08984375, 26.2197265625, 30.349609375, 34.4794921875, 38.609375, 42.7392578125, 46.869140625, 50.9990234375, 55.12890625, 59.2587890625, 63.388671875, 67.5185546875, 71.6484375, 75.7783203125, 79.908203125, 84.0380859375, 88.16796875, 92.2978515625, 96.427734375, 100.5576171875, 104.6875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 7.0, 5.0, 8.0, 16.0, 11.0, 8.0, 13.0, 14.0, 12.0, 16.0, 21.0, 34.0, 32.0, 30.0, 33.0, 38.0, 44.0, 38.0, 59.0, 50.0, 37.0, 48.0, 41.0, 49.0, 40.0, 43.0, 32.0, 36.0, 28.0, 25.0, 17.0, 20.0, 24.0, 20.0, 12.0, 11.0, 7.0, 7.0, 5.0, 8.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0], "bins": [-65.6875, -63.87890625, -62.0703125, -60.26171875, -58.453125, -56.64453125, -54.8359375, -53.02734375, -51.21875, -49.41015625, -47.6015625, -45.79296875, -43.984375, -42.17578125, -40.3671875, -38.55859375, -36.75, -34.94140625, -33.1328125, -31.32421875, -29.515625, -27.70703125, -25.8984375, -24.08984375, -22.28125, -20.47265625, -18.6640625, -16.85546875, -15.046875, -13.23828125, -11.4296875, -9.62109375, -7.8125, -6.00390625, -4.1953125, -2.38671875, -0.578125, 1.23046875, 3.0390625, 4.84765625, 6.65625, 8.46484375, 10.2734375, 12.08203125, 13.890625, 15.69921875, 17.5078125, 19.31640625, 21.125, 22.93359375, 24.7421875, 26.55078125, 28.359375, 30.16796875, 31.9765625, 33.78515625, 35.59375, 37.40234375, 39.2109375, 41.01953125, 42.828125, 44.63671875, 46.4453125, 48.25390625, 50.0625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 8.0, 9.0, 12.0, 22.0, 41.0, 74.0, 108.0, 183.0, 321.0, 654.0, 1420.0, 3729.0, 18319.0, 677642.0, 324166.0, 15937.0, 3351.0, 1308.0, 579.0, 292.0, 155.0, 92.0, 54.0, 26.0, 20.0, 11.0, 7.0, 5.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-260.0, -251.0234375, -242.046875, -233.0703125, -224.09375, -215.1171875, -206.140625, -197.1640625, -188.1875, -179.2109375, -170.234375, -161.2578125, -152.28125, -143.3046875, -134.328125, -125.3515625, -116.375, -107.3984375, -98.421875, -89.4453125, -80.46875, -71.4921875, -62.515625, -53.5390625, -44.5625, -35.5859375, -26.609375, -17.6328125, -8.65625, 0.3203125, 9.296875, 18.2734375, 27.25, 36.2265625, 45.203125, 54.1796875, 63.15625, 72.1328125, 81.109375, 90.0859375, 99.0625, 108.0390625, 117.015625, 125.9921875, 134.96875, 143.9453125, 152.921875, 161.8984375, 170.875, 179.8515625, 188.828125, 197.8046875, 206.78125, 215.7578125, 224.734375, 233.7109375, 242.6875, 251.6640625, 260.640625, 269.6171875, 278.59375, 287.5703125, 296.546875, 305.5234375, 314.5]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 2.0, 3.0, 8.0, 8.0, 14.0, 17.0, 20.0, 32.0, 36.0, 27.0, 41.0, 55.0, 67.0, 71.0, 81.0, 82.0, 76.0, 65.0, 53.0, 52.0, 46.0, 42.0, 23.0, 23.0, 21.0, 9.0, 9.0, 3.0, 2.0, 8.0, 4.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-265.25, -256.1875, -247.125, -238.0625, -229.0, -219.9375, -210.875, -201.8125, -192.75, -183.6875, -174.625, -165.5625, -156.5, -147.4375, -138.375, -129.3125, -120.25, -111.1875, -102.125, -93.0625, -84.0, -74.9375, -65.875, -56.8125, -47.75, -38.6875, -29.625, -20.5625, -11.5, -2.4375, 6.625, 15.6875, 24.75, 33.8125, 42.875, 51.9375, 61.0, 70.0625, 79.125, 88.1875, 97.25, 106.3125, 115.375, 124.4375, 133.5, 142.5625, 151.625, 160.6875, 169.75, 178.8125, 187.875, 196.9375, 206.0, 215.0625, 224.125, 233.1875, 242.25, 251.3125, 260.375, 269.4375, 278.5, 287.5625, 296.625, 305.6875, 314.75]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 6.0, 8.0, 6.0, 9.0, 8.0, 18.0, 18.0, 32.0, 26.0, 34.0, 71.0, 97.0, 132.0, 270.0, 434.0, 962.0, 2270.0, 6760.0, 27917.0, 663928.0, 310569.0, 24708.0, 6114.0, 2102.0, 925.0, 446.0, 218.0, 146.0, 89.0, 58.0, 53.0, 28.0, 18.0, 19.0, 17.0, 11.0, 8.0, 4.0, 4.0, 5.0, 2.0, 2.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-42.15625, -40.70068359375, -39.2451171875, -37.78955078125, -36.333984375, -34.87841796875, -33.4228515625, -31.96728515625, -30.51171875, -29.05615234375, -27.6005859375, -26.14501953125, -24.689453125, -23.23388671875, -21.7783203125, -20.32275390625, -18.8671875, -17.41162109375, -15.9560546875, -14.50048828125, -13.044921875, -11.58935546875, -10.1337890625, -8.67822265625, -7.22265625, -5.76708984375, -4.3115234375, -2.85595703125, -1.400390625, 0.05517578125, 1.5107421875, 2.96630859375, 4.421875, 5.87744140625, 7.3330078125, 8.78857421875, 10.244140625, 11.69970703125, 13.1552734375, 14.61083984375, 16.06640625, 17.52197265625, 18.9775390625, 20.43310546875, 21.888671875, 23.34423828125, 24.7998046875, 26.25537109375, 27.7109375, 29.16650390625, 30.6220703125, 32.07763671875, 33.533203125, 34.98876953125, 36.4443359375, 37.89990234375, 39.35546875, 40.81103515625, 42.2666015625, 43.72216796875, 45.177734375, 46.63330078125, 48.0888671875, 49.54443359375, 51.0]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 6.0, 7.0, 3.0, 6.0, 11.0, 8.0, 15.0, 16.0, 32.0, 46.0, 94.0, 187.0, 253.0, 122.0, 67.0, 36.0, 30.0, 12.0, 10.0, 8.0, 7.0, 7.0, 2.0, 5.0, 6.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.012237548828125, -0.011818766593933105, -0.011399984359741211, -0.010981202125549316, -0.010562419891357422, -0.010143637657165527, -0.009724855422973633, -0.009306073188781738, -0.008887290954589844, -0.00846850872039795, -0.008049726486206055, -0.00763094425201416, -0.007212162017822266, -0.006793379783630371, -0.0063745975494384766, -0.005955815315246582, -0.0055370330810546875, -0.005118250846862793, -0.0046994686126708984, -0.004280686378479004, -0.0038619041442871094, -0.003443121910095215, -0.0030243396759033203, -0.0026055574417114258, -0.0021867752075195312, -0.0017679929733276367, -0.0013492107391357422, -0.0009304285049438477, -0.0005116462707519531, -9.28640365600586e-05, 0.00032591819763183594, 0.0007447004318237305, 0.001163482666015625, 0.0015822649002075195, 0.002001047134399414, 0.0024198293685913086, 0.002838611602783203, 0.0032573938369750977, 0.003676176071166992, 0.004094958305358887, 0.004513740539550781, 0.004932522773742676, 0.00535130500793457, 0.005770087242126465, 0.006188869476318359, 0.006607651710510254, 0.0070264339447021484, 0.007445216178894043, 0.007863998413085938, 0.008282780647277832, 0.008701562881469727, 0.009120345115661621, 0.009539127349853516, 0.00995790958404541, 0.010376691818237305, 0.0107954740524292, 0.011214256286621094, 0.011633038520812988, 0.012051820755004883, 0.012470602989196777, 0.012889385223388672, 0.013308167457580566, 0.013726949691772461, 0.014145731925964355, 0.01456451416015625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 7.0, 9.0, 6.0, 5.0, 8.0, 22.0, 29.0, 38.0, 39.0, 88.0, 114.0, 172.0, 244.0, 357.0, 664.0, 1278.0, 2846.0, 7472.0, 25735.0, 163840.0, 756591.0, 65199.0, 14520.0, 4799.0, 2007.0, 968.0, 552.0, 281.0, 214.0, 146.0, 105.0, 62.0, 46.0, 27.0, 17.0, 17.0, 13.0, 9.0, 9.0, 3.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.53125, -36.4365234375, -35.341796875, -34.2470703125, -33.15234375, -32.0576171875, -30.962890625, -29.8681640625, -28.7734375, -27.6787109375, -26.583984375, -25.4892578125, -24.39453125, -23.2998046875, -22.205078125, -21.1103515625, -20.015625, -18.9208984375, -17.826171875, -16.7314453125, -15.63671875, -14.5419921875, -13.447265625, -12.3525390625, -11.2578125, -10.1630859375, -9.068359375, -7.9736328125, -6.87890625, -5.7841796875, -4.689453125, -3.5947265625, -2.5, -1.4052734375, -0.310546875, 0.7841796875, 1.87890625, 2.9736328125, 4.068359375, 5.1630859375, 6.2578125, 7.3525390625, 8.447265625, 9.5419921875, 10.63671875, 11.7314453125, 12.826171875, 13.9208984375, 15.015625, 16.1103515625, 17.205078125, 18.2998046875, 19.39453125, 20.4892578125, 21.583984375, 22.6787109375, 23.7734375, 24.8681640625, 25.962890625, 27.0576171875, 28.15234375, 29.2470703125, 30.341796875, 31.4365234375, 32.53125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 8.0, 8.0, 3.0, 14.0, 11.0, 15.0, 21.0, 31.0, 25.0, 52.0, 66.0, 82.0, 115.0, 122.0, 110.0, 70.0, 65.0, 34.0, 35.0, 35.0, 21.0, 9.0, 3.0, 8.0, 12.0, 7.0, 4.0, 2.0, 5.0, 0.0, 4.0, 2.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-39.8125, -38.6796875, -37.546875, -36.4140625, -35.28125, -34.1484375, -33.015625, -31.8828125, -30.75, -29.6171875, -28.484375, -27.3515625, -26.21875, -25.0859375, -23.953125, -22.8203125, -21.6875, -20.5546875, -19.421875, -18.2890625, -17.15625, -16.0234375, -14.890625, -13.7578125, -12.625, -11.4921875, -10.359375, -9.2265625, -8.09375, -6.9609375, -5.828125, -4.6953125, -3.5625, -2.4296875, -1.296875, -0.1640625, 0.96875, 2.1015625, 3.234375, 4.3671875, 5.5, 6.6328125, 7.765625, 8.8984375, 10.03125, 11.1640625, 12.296875, 13.4296875, 14.5625, 15.6953125, 16.828125, 17.9609375, 19.09375, 20.2265625, 21.359375, 22.4921875, 23.625, 24.7578125, 25.890625, 27.0234375, 28.15625, 29.2890625, 30.421875, 31.5546875, 32.6875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 12.0, 24.0, 38.0, 104.0, 197.0, 422.0, 121.0, 42.0, 14.0, 9.0, 6.0, 3.0, 1.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1416.813232421875, -1366.7763671875, -1316.7393798828125, -1266.7025146484375, -1216.66552734375, -1166.628662109375, -1116.591796875, -1066.5548095703125, -1016.5179443359375, -966.4810180664062, -916.444091796875, -866.4072265625, -816.3703002929688, -766.3333740234375, -716.2964477539062, -666.259521484375, -616.2225952148438, -566.1856689453125, -516.1487426757812, -466.1118469238281, -416.074951171875, -366.03802490234375, -316.0010986328125, -265.9642028808594, -215.92727661132812, -165.89036560058594, -115.85344696044922, -65.8165283203125, -15.779617309570312, 34.257293701171875, 84.29421997070312, 134.33111572265625, 184.3680419921875, 234.4049530029297, 284.4418640136719, 334.4787902832031, 384.51568603515625, 434.5526123046875, 484.58953857421875, 534.62646484375, 584.663330078125, 634.7002563476562, 684.7371826171875, 734.7740478515625, 784.8109741210938, 834.847900390625, 884.8848266601562, 934.9217529296875, 984.9586791992188, 1034.99560546875, 1085.032470703125, 1135.0694580078125, 1185.1063232421875, 1235.143310546875, 1285.18017578125, 1335.217041015625, 1385.2540283203125, 1435.2908935546875, 1485.327880859375, 1535.36474609375, 1585.4017333984375, 1635.4385986328125, 1685.4755859375, 1735.512451171875, 1785.54931640625]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 7.0, 3.0, 6.0, 6.0, 8.0, 5.0, 7.0, 17.0, 11.0, 17.0, 33.0, 20.0, 41.0, 33.0, 36.0, 38.0, 58.0, 163.0, 134.0, 61.0, 40.0, 34.0, 33.0, 33.0, 24.0, 34.0, 14.0, 19.0, 9.0, 12.0, 6.0, 11.0, 10.0, 7.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-816.8866577148438, -788.5109252929688, -760.13525390625, -731.759521484375, -703.3838500976562, -675.0081176757812, -646.6324462890625, -618.2567138671875, -589.8809814453125, -561.5052490234375, -533.1295776367188, -504.75384521484375, -476.378173828125, -448.00244140625, -419.6267395019531, -391.25103759765625, -362.8753662109375, -334.4996643066406, -306.12396240234375, -277.74822998046875, -249.37254333496094, -220.99684143066406, -192.62112426757812, -164.24542236328125, -135.86972045898438, -107.4940185546875, -79.1183090209961, -50.74259948730469, -22.366897583007812, 6.0088043212890625, 34.384521484375, 62.760223388671875, 91.13592529296875, 119.51162719726562, 147.8873291015625, 176.26304626464844, 204.6387481689453, 233.0144500732422, 261.3901672363281, 289.765869140625, 318.1415710449219, 346.51727294921875, 374.8929748535156, 403.2686767578125, 431.6444091796875, 460.02008056640625, 488.39581298828125, 516.771484375, 545.147216796875, 573.52294921875, 601.8986206054688, 630.2743530273438, 658.6500244140625, 687.0257568359375, 715.4014892578125, 743.7771606445312, 772.15283203125, 800.528564453125, 828.9042358398438, 857.2799682617188, 885.6556396484375, 914.0313720703125, 942.4071044921875, 970.7827758789062, 999.1585083007812]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 8.0, 6.0, 14.0, 20.0, 36.0, 51.0, 94.0, 165.0, 233.0, 470.0, 838.0, 1935.0, 5546.0, 23421.0, 336223.0, 3221534.0, 561725.0, 31198.0, 6477.0, 2237.0, 969.0, 464.0, 254.0, 128.0, 87.0, 53.0, 42.0, 29.0, 13.0, 3.0, 9.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-215.375, -210.1943359375, -205.013671875, -199.8330078125, -194.65234375, -189.4716796875, -184.291015625, -179.1103515625, -173.9296875, -168.7490234375, -163.568359375, -158.3876953125, -153.20703125, -148.0263671875, -142.845703125, -137.6650390625, -132.484375, -127.3037109375, -122.123046875, -116.9423828125, -111.76171875, -106.5810546875, -101.400390625, -96.2197265625, -91.0390625, -85.8583984375, -80.677734375, -75.4970703125, -70.31640625, -65.1357421875, -59.955078125, -54.7744140625, -49.59375, -44.4130859375, -39.232421875, -34.0517578125, -28.87109375, -23.6904296875, -18.509765625, -13.3291015625, -8.1484375, -2.9677734375, 2.212890625, 7.3935546875, 12.57421875, 17.7548828125, 22.935546875, 28.1162109375, 33.296875, 38.4775390625, 43.658203125, 48.8388671875, 54.01953125, 59.2001953125, 64.380859375, 69.5615234375, 74.7421875, 79.9228515625, 85.103515625, 90.2841796875, 95.46484375, 100.6455078125, 105.826171875, 111.0068359375, 116.1875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 2.0, 8.0, 4.0, 5.0, 5.0, 12.0, 12.0, 13.0, 20.0, 23.0, 20.0, 30.0, 23.0, 34.0, 36.0, 39.0, 36.0, 40.0, 45.0, 44.0, 41.0, 51.0, 45.0, 43.0, 45.0, 48.0, 33.0, 45.0, 38.0, 21.0, 21.0, 31.0, 18.0, 12.0, 15.0, 7.0, 7.0, 8.0, 7.0, 5.0, 2.0, 2.0, 6.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.78125, -47.0927734375, -45.404296875, -43.7158203125, -42.02734375, -40.3388671875, -38.650390625, -36.9619140625, -35.2734375, -33.5849609375, -31.896484375, -30.2080078125, -28.51953125, -26.8310546875, -25.142578125, -23.4541015625, -21.765625, -20.0771484375, -18.388671875, -16.7001953125, -15.01171875, -13.3232421875, -11.634765625, -9.9462890625, -8.2578125, -6.5693359375, -4.880859375, -3.1923828125, -1.50390625, 0.1845703125, 1.873046875, 3.5615234375, 5.25, 6.9384765625, 8.626953125, 10.3154296875, 12.00390625, 13.6923828125, 15.380859375, 17.0693359375, 18.7578125, 20.4462890625, 22.134765625, 23.8232421875, 25.51171875, 27.2001953125, 28.888671875, 30.5771484375, 32.265625, 33.9541015625, 35.642578125, 37.3310546875, 39.01953125, 40.7080078125, 42.396484375, 44.0849609375, 45.7734375, 47.4619140625, 49.150390625, 50.8388671875, 52.52734375, 54.2158203125, 55.904296875, 57.5927734375, 59.28125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 4.0, 1.0, 6.0, 3.0, 8.0, 5.0, 8.0, 16.0, 22.0, 32.0, 32.0, 61.0, 86.0, 120.0, 177.0, 272.0, 528.0, 1162.0, 3051.0, 12601.0, 144994.0, 3898910.0, 115275.0, 11472.0, 2938.0, 1156.0, 493.0, 273.0, 198.0, 121.0, 70.0, 56.0, 46.0, 26.0, 14.0, 11.0, 7.0, 9.0, 8.0, 3.0, 6.0, 2.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-262.25, -254.171875, -246.09375, -238.015625, -229.9375, -221.859375, -213.78125, -205.703125, -197.625, -189.546875, -181.46875, -173.390625, -165.3125, -157.234375, -149.15625, -141.078125, -133.0, -124.921875, -116.84375, -108.765625, -100.6875, -92.609375, -84.53125, -76.453125, -68.375, -60.296875, -52.21875, -44.140625, -36.0625, -27.984375, -19.90625, -11.828125, -3.75, 4.328125, 12.40625, 20.484375, 28.5625, 36.640625, 44.71875, 52.796875, 60.875, 68.953125, 77.03125, 85.109375, 93.1875, 101.265625, 109.34375, 117.421875, 125.5, 133.578125, 141.65625, 149.734375, 157.8125, 165.890625, 173.96875, 182.046875, 190.125, 198.203125, 206.28125, 214.359375, 222.4375, 230.515625, 238.59375, 246.671875, 254.75]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 4.0, 8.0, 10.0, 18.0, 12.0, 19.0, 28.0, 34.0, 63.0, 94.0, 117.0, 213.0, 312.0, 531.0, 712.0, 664.0, 407.0, 277.0, 169.0, 105.0, 70.0, 48.0, 41.0, 34.0, 13.0, 11.0, 17.0, 13.0, 6.0, 6.0, 6.0, 4.0, 0.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-163.125, -157.439453125, -151.75390625, -146.068359375, -140.3828125, -134.697265625, -129.01171875, -123.326171875, -117.640625, -111.955078125, -106.26953125, -100.583984375, -94.8984375, -89.212890625, -83.52734375, -77.841796875, -72.15625, -66.470703125, -60.78515625, -55.099609375, -49.4140625, -43.728515625, -38.04296875, -32.357421875, -26.671875, -20.986328125, -15.30078125, -9.615234375, -3.9296875, 1.755859375, 7.44140625, 13.126953125, 18.8125, 24.498046875, 30.18359375, 35.869140625, 41.5546875, 47.240234375, 52.92578125, 58.611328125, 64.296875, 69.982421875, 75.66796875, 81.353515625, 87.0390625, 92.724609375, 98.41015625, 104.095703125, 109.78125, 115.466796875, 121.15234375, 126.837890625, 132.5234375, 138.208984375, 143.89453125, 149.580078125, 155.265625, 160.951171875, 166.63671875, 172.322265625, 178.0078125, 183.693359375, 189.37890625, 195.064453125, 200.75]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 3.0, 2.0, 7.0, 12.0, 20.0, 30.0, 65.0, 105.0, 174.0, 213.0, 151.0, 84.0, 53.0, 34.0, 11.0, 6.0, 9.0, 5.0, 5.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1414.443603515625, -1351.1727294921875, -1287.90185546875, -1224.631103515625, -1161.3602294921875, -1098.08935546875, -1034.818603515625, -971.5477294921875, -908.27685546875, -845.0059814453125, -781.7351684570312, -718.46435546875, -655.1934814453125, -591.922607421875, -528.6517944335938, -465.3809509277344, -402.110107421875, -338.8392639160156, -275.56842041015625, -212.29757690429688, -149.0267333984375, -85.75588989257812, -22.48504638671875, 40.785797119140625, 104.056640625, 167.32748413085938, 230.59832763671875, 293.8691711425781, 357.1400146484375, 420.4108581542969, 483.68170166015625, 546.9525146484375, 610.223388671875, 673.4942626953125, 736.7650756835938, 800.035888671875, 863.3067626953125, 926.57763671875, 989.8484497070312, 1053.1192626953125, 1116.39013671875, 1179.6610107421875, 1242.931884765625, 1306.20263671875, 1369.4735107421875, 1432.744384765625, 1496.01513671875, 1559.2860107421875, 1622.556884765625, 1685.8277587890625, 1749.0986328125, 1812.369384765625, 1875.6402587890625, 1938.9111328125, 2002.181884765625, 2065.452880859375, 2128.7236328125, 2191.994384765625, 2255.265380859375, 2318.5361328125, 2381.80712890625, 2445.077880859375, 2508.3486328125, 2571.61962890625, 2634.890380859375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 3.0, 4.0, 3.0, 3.0, 7.0, 5.0, 6.0, 13.0, 5.0, 23.0, 15.0, 15.0, 26.0, 27.0, 22.0, 29.0, 31.0, 28.0, 29.0, 44.0, 55.0, 48.0, 64.0, 50.0, 50.0, 45.0, 45.0, 43.0, 38.0, 41.0, 24.0, 26.0, 28.0, 17.0, 13.0, 15.0, 10.0, 14.0, 8.0, 3.0, 8.0, 7.0, 6.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-910.77001953125, -883.1921997070312, -855.6143798828125, -828.03662109375, -800.4588012695312, -772.8809814453125, -745.30322265625, -717.7254028320312, -690.1475830078125, -662.5697631835938, -634.991943359375, -607.4141845703125, -579.8363647460938, -552.258544921875, -524.6807861328125, -497.10296630859375, -469.525146484375, -441.94732666015625, -414.3695373535156, -386.791748046875, -359.21392822265625, -331.6361083984375, -304.0583190917969, -276.48052978515625, -248.9027099609375, -221.3249053955078, -193.74710083007812, -166.16929626464844, -138.59149169921875, -111.01368713378906, -83.43588256835938, -55.85807800292969, -28.28021240234375, -0.7024078369140625, 26.875396728515625, 54.45320129394531, 82.031005859375, 109.60881042480469, 137.18661499023438, 164.76441955566406, 192.34222412109375, 219.92002868652344, 247.49783325195312, 275.07562255859375, 302.6534423828125, 330.23126220703125, 357.8090515136719, 385.3868408203125, 412.96466064453125, 440.54248046875, 468.1202697753906, 495.69805908203125, 523.27587890625, 550.8536987304688, 578.4315185546875, 606.00927734375, 633.5870971679688, 661.1649169921875, 688.74267578125, 716.3204956054688, 743.8983154296875, 771.4761352539062, 799.053955078125, 826.6317138671875, 854.2095336914062]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 5.0, 3.0, 8.0, 7.0, 4.0, 20.0, 17.0, 23.0, 34.0, 59.0, 74.0, 114.0, 184.0, 267.0, 441.0, 747.0, 1245.0, 2146.0, 4498.0, 10191.0, 27704.0, 95803.0, 446990.0, 341240.0, 76081.0, 22955.0, 8764.0, 3914.0, 1984.0, 1177.0, 692.0, 413.0, 256.0, 194.0, 91.0, 68.0, 45.0, 30.0, 14.0, 12.0, 7.0, 6.0, 7.0, 7.0, 5.0, 6.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-94.125, -91.17578125, -88.2265625, -85.27734375, -82.328125, -79.37890625, -76.4296875, -73.48046875, -70.53125, -67.58203125, -64.6328125, -61.68359375, -58.734375, -55.78515625, -52.8359375, -49.88671875, -46.9375, -43.98828125, -41.0390625, -38.08984375, -35.140625, -32.19140625, -29.2421875, -26.29296875, -23.34375, -20.39453125, -17.4453125, -14.49609375, -11.546875, -8.59765625, -5.6484375, -2.69921875, 0.25, 3.19921875, 6.1484375, 9.09765625, 12.046875, 14.99609375, 17.9453125, 20.89453125, 23.84375, 26.79296875, 29.7421875, 32.69140625, 35.640625, 38.58984375, 41.5390625, 44.48828125, 47.4375, 50.38671875, 53.3359375, 56.28515625, 59.234375, 62.18359375, 65.1328125, 68.08203125, 71.03125, 73.98046875, 76.9296875, 79.87890625, 82.828125, 85.77734375, 88.7265625, 91.67578125, 94.625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 5.0, 2.0, 7.0, 6.0, 12.0, 16.0, 13.0, 21.0, 20.0, 30.0, 30.0, 42.0, 42.0, 46.0, 59.0, 58.0, 65.0, 59.0, 53.0, 63.0, 54.0, 53.0, 47.0, 44.0, 30.0, 38.0, 19.0, 21.0, 15.0, 14.0, 8.0, 4.0, 4.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-86.4375, -84.060546875, -81.68359375, -79.306640625, -76.9296875, -74.552734375, -72.17578125, -69.798828125, -67.421875, -65.044921875, -62.66796875, -60.291015625, -57.9140625, -55.537109375, -53.16015625, -50.783203125, -48.40625, -46.029296875, -43.65234375, -41.275390625, -38.8984375, -36.521484375, -34.14453125, -31.767578125, -29.390625, -27.013671875, -24.63671875, -22.259765625, -19.8828125, -17.505859375, -15.12890625, -12.751953125, -10.375, -7.998046875, -5.62109375, -3.244140625, -0.8671875, 1.509765625, 3.88671875, 6.263671875, 8.640625, 11.017578125, 13.39453125, 15.771484375, 18.1484375, 20.525390625, 22.90234375, 25.279296875, 27.65625, 30.033203125, 32.41015625, 34.787109375, 37.1640625, 39.541015625, 41.91796875, 44.294921875, 46.671875, 49.048828125, 51.42578125, 53.802734375, 56.1796875, 58.556640625, 60.93359375, 63.310546875, 65.6875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 3.0, 3.0, 12.0, 9.0, 16.0, 15.0, 22.0, 43.0, 54.0, 69.0, 120.0, 216.0, 356.0, 672.0, 1789.0, 6776.0, 54091.0, 892412.0, 79584.0, 8442.0, 2113.0, 760.0, 373.0, 171.0, 137.0, 82.0, 68.0, 47.0, 32.0, 17.0, 16.0, 9.0, 5.0, 8.0, 5.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-150.625, -145.697265625, -140.76953125, -135.841796875, -130.9140625, -125.986328125, -121.05859375, -116.130859375, -111.203125, -106.275390625, -101.34765625, -96.419921875, -91.4921875, -86.564453125, -81.63671875, -76.708984375, -71.78125, -66.853515625, -61.92578125, -56.998046875, -52.0703125, -47.142578125, -42.21484375, -37.287109375, -32.359375, -27.431640625, -22.50390625, -17.576171875, -12.6484375, -7.720703125, -2.79296875, 2.134765625, 7.0625, 11.990234375, 16.91796875, 21.845703125, 26.7734375, 31.701171875, 36.62890625, 41.556640625, 46.484375, 51.412109375, 56.33984375, 61.267578125, 66.1953125, 71.123046875, 76.05078125, 80.978515625, 85.90625, 90.833984375, 95.76171875, 100.689453125, 105.6171875, 110.544921875, 115.47265625, 120.400390625, 125.328125, 130.255859375, 135.18359375, 140.111328125, 145.0390625, 149.966796875, 154.89453125, 159.822265625, 164.75]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 5.0, 4.0, 6.0, 5.0, 9.0, 11.0, 14.0, 16.0, 17.0, 23.0, 27.0, 34.0, 15.0, 35.0, 48.0, 33.0, 69.0, 92.0, 72.0, 69.0, 66.0, 60.0, 41.0, 31.0, 38.0, 23.0, 31.0, 20.0, 14.0, 13.0, 11.0, 5.0, 9.0, 4.0, 6.0, 7.0, 6.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-266.5, -258.78125, -251.0625, -243.34375, -235.625, -227.90625, -220.1875, -212.46875, -204.75, -197.03125, -189.3125, -181.59375, -173.875, -166.15625, -158.4375, -150.71875, -143.0, -135.28125, -127.5625, -119.84375, -112.125, -104.40625, -96.6875, -88.96875, -81.25, -73.53125, -65.8125, -58.09375, -50.375, -42.65625, -34.9375, -27.21875, -19.5, -11.78125, -4.0625, 3.65625, 11.375, 19.09375, 26.8125, 34.53125, 42.25, 49.96875, 57.6875, 65.40625, 73.125, 80.84375, 88.5625, 96.28125, 104.0, 111.71875, 119.4375, 127.15625, 134.875, 142.59375, 150.3125, 158.03125, 165.75, 173.46875, 181.1875, 188.90625, 196.625, 204.34375, 212.0625, 219.78125, 227.5]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 3.0, 2.0, 3.0, 2.0, 4.0, 3.0, 7.0, 8.0, 15.0, 4.0, 14.0, 14.0, 6.0, 18.0, 27.0, 37.0, 63.0, 83.0, 131.0, 268.0, 534.0, 1011.0, 2689.0, 8549.0, 42193.0, 860164.0, 109596.0, 15761.0, 4247.0, 1588.0, 669.0, 293.0, 180.0, 131.0, 63.0, 39.0, 27.0, 29.0, 11.0, 17.0, 11.0, 8.0, 8.0, 3.0, 7.0, 5.0, 5.0, 3.0, 3.0, 1.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-22.03125, -21.377685546875, -20.72412109375, -20.070556640625, -19.4169921875, -18.763427734375, -18.10986328125, -17.456298828125, -16.802734375, -16.149169921875, -15.49560546875, -14.842041015625, -14.1884765625, -13.534912109375, -12.88134765625, -12.227783203125, -11.57421875, -10.920654296875, -10.26708984375, -9.613525390625, -8.9599609375, -8.306396484375, -7.65283203125, -6.999267578125, -6.345703125, -5.692138671875, -5.03857421875, -4.385009765625, -3.7314453125, -3.077880859375, -2.42431640625, -1.770751953125, -1.1171875, -0.463623046875, 0.18994140625, 0.843505859375, 1.4970703125, 2.150634765625, 2.80419921875, 3.457763671875, 4.111328125, 4.764892578125, 5.41845703125, 6.072021484375, 6.7255859375, 7.379150390625, 8.03271484375, 8.686279296875, 9.33984375, 9.993408203125, 10.64697265625, 11.300537109375, 11.9541015625, 12.607666015625, 13.26123046875, 13.914794921875, 14.568359375, 15.221923828125, 15.87548828125, 16.529052734375, 17.1826171875, 17.836181640625, 18.48974609375, 19.143310546875, 19.796875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 2.0, 9.0, 15.0, 20.0, 27.0, 37.0, 62.0, 148.0, 258.0, 161.0, 106.0, 44.0, 35.0, 18.0, 20.0, 19.0, 3.0, 7.0, 4.0, 1.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01209259033203125, -0.011815667152404785, -0.01153874397277832, -0.011261820793151855, -0.01098489761352539, -0.010707974433898926, -0.010431051254272461, -0.010154128074645996, -0.009877204895019531, -0.009600281715393066, -0.009323358535766602, -0.009046435356140137, -0.008769512176513672, -0.008492588996887207, -0.008215665817260742, -0.007938742637634277, -0.0076618194580078125, -0.007384896278381348, -0.007107973098754883, -0.006831049919128418, -0.006554126739501953, -0.006277203559875488, -0.0060002803802490234, -0.005723357200622559, -0.005446434020996094, -0.005169510841369629, -0.004892587661743164, -0.004615664482116699, -0.004338741302490234, -0.0040618181228637695, -0.0037848949432373047, -0.00350797176361084, -0.003231048583984375, -0.00295412540435791, -0.0026772022247314453, -0.0024002790451049805, -0.0021233558654785156, -0.0018464326858520508, -0.001569509506225586, -0.001292586326599121, -0.0010156631469726562, -0.0007387399673461914, -0.00046181678771972656, -0.00018489360809326172, 9.202957153320312e-05, 0.00036895275115966797, 0.0006458759307861328, 0.0009227991104125977, 0.0011997222900390625, 0.0014766454696655273, 0.0017535686492919922, 0.002030491828918457, 0.002307415008544922, 0.0025843381881713867, 0.0028612613677978516, 0.0031381845474243164, 0.0034151077270507812, 0.003692030906677246, 0.003968954086303711, 0.004245877265930176, 0.004522800445556641, 0.0047997236251831055, 0.00507664680480957, 0.005353569984436035, 0.0056304931640625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 2.0, 11.0, 13.0, 14.0, 20.0, 31.0, 55.0, 76.0, 112.0, 156.0, 288.0, 556.0, 1010.0, 2232.0, 5322.0, 14497.0, 52147.0, 735669.0, 189272.0, 30113.0, 9791.0, 3728.0, 1623.0, 770.0, 434.0, 254.0, 130.0, 75.0, 43.0, 33.0, 31.0, 16.0, 14.0, 6.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.15625, -13.664794921875, -13.17333984375, -12.681884765625, -12.1904296875, -11.698974609375, -11.20751953125, -10.716064453125, -10.224609375, -9.733154296875, -9.24169921875, -8.750244140625, -8.2587890625, -7.767333984375, -7.27587890625, -6.784423828125, -6.29296875, -5.801513671875, -5.31005859375, -4.818603515625, -4.3271484375, -3.835693359375, -3.34423828125, -2.852783203125, -2.361328125, -1.869873046875, -1.37841796875, -0.886962890625, -0.3955078125, 0.095947265625, 0.58740234375, 1.078857421875, 1.5703125, 2.061767578125, 2.55322265625, 3.044677734375, 3.5361328125, 4.027587890625, 4.51904296875, 5.010498046875, 5.501953125, 5.993408203125, 6.48486328125, 6.976318359375, 7.4677734375, 7.959228515625, 8.45068359375, 8.942138671875, 9.43359375, 9.925048828125, 10.41650390625, 10.907958984375, 11.3994140625, 11.890869140625, 12.38232421875, 12.873779296875, 13.365234375, 13.856689453125, 14.34814453125, 14.839599609375, 15.3310546875, 15.822509765625, 16.31396484375, 16.805419921875, 17.296875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 3.0, 3.0, 4.0, 3.0, 8.0, 8.0, 9.0, 10.0, 4.0, 13.0, 15.0, 11.0, 25.0, 28.0, 29.0, 39.0, 54.0, 78.0, 79.0, 122.0, 133.0, 78.0, 55.0, 41.0, 38.0, 27.0, 21.0, 10.0, 11.0, 12.0, 7.0, 13.0, 2.0, 3.0, 5.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.609375, -19.0048828125, -18.400390625, -17.7958984375, -17.19140625, -16.5869140625, -15.982421875, -15.3779296875, -14.7734375, -14.1689453125, -13.564453125, -12.9599609375, -12.35546875, -11.7509765625, -11.146484375, -10.5419921875, -9.9375, -9.3330078125, -8.728515625, -8.1240234375, -7.51953125, -6.9150390625, -6.310546875, -5.7060546875, -5.1015625, -4.4970703125, -3.892578125, -3.2880859375, -2.68359375, -2.0791015625, -1.474609375, -0.8701171875, -0.265625, 0.3388671875, 0.943359375, 1.5478515625, 2.15234375, 2.7568359375, 3.361328125, 3.9658203125, 4.5703125, 5.1748046875, 5.779296875, 6.3837890625, 6.98828125, 7.5927734375, 8.197265625, 8.8017578125, 9.40625, 10.0107421875, 10.615234375, 11.2197265625, 11.82421875, 12.4287109375, 13.033203125, 13.6376953125, 14.2421875, 14.8466796875, 15.451171875, 16.0556640625, 16.66015625, 17.2646484375, 17.869140625, 18.4736328125, 19.078125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 10.0, 15.0, 28.0, 77.0, 452.0, 294.0, 64.0, 33.0, 15.0, 8.0, 6.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1379.2645263671875, -1334.676513671875, -1290.08837890625, -1245.5003662109375, -1200.912353515625, -1156.32421875, -1111.7362060546875, -1067.148193359375, -1022.5601196289062, -977.9720458984375, -933.384033203125, -888.7959594726562, -844.2078857421875, -799.619873046875, -755.0317993164062, -710.4437255859375, -665.855712890625, -621.2676391601562, -576.6796264648438, -532.091552734375, -487.5035095214844, -442.91546630859375, -398.327392578125, -353.7393493652344, -309.15130615234375, -264.5632629394531, -219.97520446777344, -175.38714599609375, -130.79910278320312, -86.2110595703125, -41.62298583984375, 2.965057373046875, 47.55322265625, 92.14127349853516, 136.7293243408203, 181.3173828125, 225.90542602539062, 270.49346923828125, 315.08154296875, 359.6695861816406, 404.25762939453125, 448.8456726074219, 493.4337158203125, 538.0217895507812, 582.60986328125, 627.1978759765625, 671.7859497070312, 716.3740234375, 760.9620361328125, 805.5501098632812, 850.1381225585938, 894.7261962890625, 939.314208984375, 983.9022827148438, 1028.4903564453125, 1073.078369140625, 1117.66650390625, 1162.2545166015625, 1206.8426513671875, 1251.4306640625, 1296.0186767578125, 1340.606689453125, 1385.19482421875, 1429.7828369140625, 1474.370849609375]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 4.0, 0.0, 4.0, 9.0, 8.0, 8.0, 15.0, 19.0, 13.0, 25.0, 19.0, 17.0, 14.0, 31.0, 31.0, 65.0, 232.0, 199.0, 56.0, 26.0, 28.0, 34.0, 20.0, 27.0, 12.0, 20.0, 12.0, 9.0, 8.0, 6.0, 10.0, 8.0, 7.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-628.5965576171875, -606.85693359375, -585.1173706054688, -563.3777465820312, -541.63818359375, -519.8985595703125, -498.158935546875, -476.4193420410156, -454.67974853515625, -432.9401550292969, -411.2005615234375, -389.4609375, -367.7213439941406, -345.98175048828125, -324.24212646484375, -302.5025329589844, -280.762939453125, -259.0233459472656, -237.2837371826172, -215.54412841796875, -193.80453491210938, -172.06494140625, -150.32533264160156, -128.58572387695312, -106.84613037109375, -85.10652923583984, -63.36692810058594, -41.62732696533203, -19.887725830078125, 1.8518753051757812, 23.591476440429688, 45.331085205078125, 67.07061767578125, 88.81021881103516, 110.54981994628906, 132.2894287109375, 154.02902221679688, 175.76861572265625, 197.5082244873047, 219.24783325195312, 240.9874267578125, 262.7270202636719, 284.46661376953125, 306.20623779296875, 327.9458312988281, 349.6854248046875, 371.425048828125, 393.1646423339844, 414.90423583984375, 436.6438293457031, 458.3834228515625, 480.123046875, 501.8626403808594, 523.6022338867188, 545.3418579101562, 567.0814208984375, 588.821044921875, 610.5606689453125, 632.3002319335938, 654.0398559570312, 675.7794189453125, 697.51904296875, 719.2586669921875, 740.998291015625, 762.7378540039062]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 5.0, 2.0, 2.0, 2.0, 3.0, 6.0, 3.0, 4.0, 4.0, 4.0, 8.0, 9.0, 5.0, 22.0, 22.0, 24.0, 29.0, 28.0, 38.0, 42.0, 40.0, 100.0, 275.0, 70.0, 41.0, 31.0, 38.0, 24.0, 14.0, 15.0, 19.0, 11.0, 14.0, 11.0, 15.0, 9.0, 8.0, 4.0, 3.0, 5.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.3125, -48.3349609375, -46.357421875, -44.3798828125, -42.40234375, -40.4248046875, -38.447265625, -36.4697265625, -34.4921875, -32.5146484375, -30.537109375, -28.5595703125, -26.58203125, -24.6044921875, -22.626953125, -20.6494140625, -18.671875, -16.6943359375, -14.716796875, -12.7392578125, -10.76171875, -8.7841796875, -6.806640625, -4.8291015625, -2.8515625, -0.8740234375, 1.103515625, 3.0810546875, 5.05859375, 7.0361328125, 9.013671875, 10.9912109375, 12.96875, 14.9462890625, 16.923828125, 18.9013671875, 20.87890625, 22.8564453125, 24.833984375, 26.8115234375, 28.7890625, 30.7666015625, 32.744140625, 34.7216796875, 36.69921875, 38.6767578125, 40.654296875, 42.6318359375, 44.609375, 46.5869140625, 48.564453125, 50.5419921875, 52.51953125, 54.4970703125, 56.474609375, 58.4521484375, 60.4296875, 62.4072265625, 64.384765625, 66.3623046875, 68.33984375, 70.3173828125, 72.294921875, 74.2724609375, 76.25]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 1.0, 1.0, 5.0, 1.0, 4.0, 6.0, 5.0, 13.0, 19.0, 21.0, 45.0, 88.0, 99.0, 264.0, 667.0, 1989.0, 8989.0, 8337562.0, 33331.0, 3721.0, 963.0, 361.0, 182.0, 111.0, 51.0, 31.0, 22.0, 19.0, 7.0, 4.0, 3.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-737.411376953125, -713.4223022460938, -689.4332275390625, -665.4441528320312, -641.455078125, -617.4660034179688, -593.4769287109375, -569.48779296875, -545.498779296875, -521.5097045898438, -497.5206298828125, -473.53155517578125, -449.54248046875, -425.55340576171875, -401.5643005371094, -377.5752258300781, -353.58612060546875, -329.5970458984375, -305.60797119140625, -281.618896484375, -257.62982177734375, -233.64073181152344, -209.65164184570312, -185.66256713867188, -161.67349243164062, -137.68441772460938, -113.6953353881836, -89.70625305175781, -65.71717834472656, -41.72810363769531, -17.739013671875, 6.25006103515625, 30.23919677734375, 54.228275299072266, 78.21735382080078, 102.20643615722656, 126.19551086425781, 150.18458557128906, 174.17367553710938, 198.16275024414062, 222.15182495117188, 246.14089965820312, 270.1299743652344, 294.11907958984375, 318.108154296875, 342.09722900390625, 366.0863037109375, 390.07537841796875, 414.064453125, 438.05352783203125, 462.0426025390625, 486.03167724609375, 510.020751953125, 534.0098266601562, 557.9989013671875, 581.988037109375, 605.97705078125, 629.9661254882812, 653.9552001953125, 677.9442749023438, 701.933349609375, 725.9224243164062, 749.9114990234375, 773.900634765625, 797.8897094726562]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 5.0, 1.0, 5.0, 1.0, 8.0, 5.0, 3.0, 3.0, 9.0, 5.0, 5.0, 7.0, 5.0, 3.0, 7.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-769.1875610351562, -745.0888061523438, -720.9901123046875, -696.891357421875, -672.7926025390625, -648.69384765625, -624.5951538085938, -600.4963989257812, -576.397705078125, -552.2989501953125, -528.2002563476562, -504.10150146484375, -480.00274658203125, -455.9040222167969, -431.8052978515625, -407.70654296875, -383.6077880859375, -359.5090637207031, -335.4103088378906, -311.31158447265625, -287.21282958984375, -263.1141052246094, -239.015380859375, -214.91664123535156, -190.81790161132812, -166.7191619873047, -142.62042236328125, -118.52169799804688, -94.42295837402344, -70.32421875, -46.225494384765625, -22.126754760742188, 1.971923828125, 26.070659637451172, 50.169395446777344, 74.26812744140625, 98.36686706542969, 122.46560668945312, 146.5643310546875, 170.66307067871094, 194.76181030273438, 218.8605499267578, 242.95928955078125, 267.0580139160156, 291.15673828125, 315.2554931640625, 339.3542175292969, 363.45294189453125, 387.55169677734375, 411.6504211425781, 435.7491760253906, 459.847900390625, 483.9466552734375, 508.0453796386719, 532.1441040039062, 556.2428588867188, 580.341552734375, 604.4403076171875, 628.5390014648438, 652.6377563476562, 676.7365112304688, 700.835205078125, 724.9339599609375, 749.03271484375, 773.1314697265625]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 1.0, 1.0, 4.0, 11.0, 6.0, 11.0, 17.0, 25.0, 34.0, 60.0, 60.0, 103.0, 155.0, 276.0, 563.0, 1108.0, 2752.0, 7283.0, 21565.0, 73478.0, 216893.0, 139788.0, 39585.0, 12668.0, 4411.0, 1709.0, 793.0, 365.0, 208.0, 102.0, 68.0, 36.0, 33.0, 21.0, 17.0, 13.0, 12.0, 6.0, 11.0, 7.0, 6.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-607.5, -588.953125, -570.40625, -551.859375, -533.3125, -514.765625, -496.21875, -477.671875, -459.125, -440.578125, -422.03125, -403.484375, -384.9375, -366.390625, -347.84375, -329.296875, -310.75, -292.203125, -273.65625, -255.109375, -236.5625, -218.015625, -199.46875, -180.921875, -162.375, -143.828125, -125.28125, -106.734375, -88.1875, -69.640625, -51.09375, -32.546875, -14.0, 4.546875, 23.09375, 41.640625, 60.1875, 78.734375, 97.28125, 115.828125, 134.375, 152.921875, 171.46875, 190.015625, 208.5625, 227.109375, 245.65625, 264.203125, 282.75, 301.296875, 319.84375, 338.390625, 356.9375, 375.484375, 394.03125, 412.578125, 431.125, 449.671875, 468.21875, 486.765625, 505.3125, 523.859375, 542.40625, 560.953125, 579.5]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 2.0, 3.0, 7.0, 14.0, 15.0, 15.0, 28.0, 23.0, 25.0, 49.0, 38.0, 73.0, 68.0, 73.0, 96.0, 98.0, 83.0, 63.0, 55.0, 46.0, 25.0, 37.0, 22.0, 16.0, 13.0, 6.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-122.875, -119.90234375, -116.9296875, -113.95703125, -110.984375, -108.01171875, -105.0390625, -102.06640625, -99.09375, -96.12109375, -93.1484375, -90.17578125, -87.203125, -84.23046875, -81.2578125, -78.28515625, -75.3125, -72.33984375, -69.3671875, -66.39453125, -63.421875, -60.44921875, -57.4765625, -54.50390625, -51.53125, -48.55859375, -45.5859375, -42.61328125, -39.640625, -36.66796875, -33.6953125, -30.72265625, -27.75, -24.77734375, -21.8046875, -18.83203125, -15.859375, -12.88671875, -9.9140625, -6.94140625, -3.96875, -0.99609375, 1.9765625, 4.94921875, 7.921875, 10.89453125, 13.8671875, 16.83984375, 19.8125, 22.78515625, 25.7578125, 28.73046875, 31.703125, 34.67578125, 37.6484375, 40.62109375, 43.59375, 46.56640625, 49.5390625, 52.51171875, 55.484375, 58.45703125, 61.4296875, 64.40234375, 67.375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 3.0, 1.0, 2.0, 10.0, 4.0, 5.0, 16.0, 18.0, 36.0, 56.0, 98.0, 106.0, 54.0, 33.0, 18.0, 8.0, 9.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-698.52978515625, -676.5953369140625, -654.6609497070312, -632.7265014648438, -610.7920532226562, -588.857666015625, -566.9232177734375, -544.98876953125, -523.0543212890625, -501.1199035644531, -479.1854553222656, -457.25103759765625, -435.31658935546875, -413.3821716308594, -391.44775390625, -369.5133056640625, -347.57891845703125, -325.6445007324219, -303.7100524902344, -281.775634765625, -259.8411865234375, -237.90676879882812, -215.97235107421875, -194.0379180908203, -172.10348510742188, -150.16905212402344, -128.234619140625, -106.30020141601562, -84.36576843261719, -62.43133544921875, -40.496917724609375, -18.562484741210938, 3.3719482421875, 25.306377410888672, 47.240806579589844, 69.17523193359375, 91.10966491699219, 113.04409790039062, 134.978515625, 156.91294860839844, 178.84738159179688, 200.7818145751953, 222.71624755859375, 244.65066528320312, 266.5850830078125, 288.51953125, 310.4539489746094, 332.38836669921875, 354.32281494140625, 376.2572326660156, 398.1916809082031, 420.1260986328125, 442.060546875, 463.9949645996094, 485.92938232421875, 507.86383056640625, 529.7982177734375, 551.732666015625, 573.6670532226562, 595.6015014648438, 617.5359497070312, 639.4703369140625, 661.40478515625, 683.3392333984375, 705.273681640625]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 8.0, 4.0, 4.0, 4.0, 13.0, 9.0, 20.0, 41.0, 49.0, 76.0, 79.0, 63.0, 39.0, 19.0, 11.0, 11.0, 8.0, 6.0, 7.0, 3.0, 3.0, 1.0, 4.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-358.06939697265625, -346.4508056640625, -334.8322448730469, -323.2136535644531, -311.5950622558594, -299.9764709472656, -288.35791015625, -276.73931884765625, -265.1207275390625, -253.5021514892578, -241.88356018066406, -230.26498413085938, -218.64639282226562, -207.02781677246094, -195.40924072265625, -183.7906494140625, -172.1720733642578, -160.55349731445312, -148.93490600585938, -137.3163299560547, -125.69773864746094, -114.07916259765625, -102.46057891845703, -90.84199523925781, -79.2234115600586, -67.60482788085938, -55.986244201660156, -44.3676643371582, -32.749080657958984, -21.130496978759766, -9.511917114257812, 2.1066665649414062, 13.725250244140625, 25.343833923339844, 36.96241760253906, 48.580997467041016, 60.199581146240234, 71.81816101074219, 83.4367446899414, 95.05532836914062, 106.67391204833984, 118.29249572753906, 129.91107177734375, 141.5296630859375, 153.1482391357422, 164.76683044433594, 176.38540649414062, 188.00399780273438, 199.62257385253906, 211.24114990234375, 222.8597412109375, 234.4783172607422, 246.09690856933594, 257.7154846191406, 269.3340759277344, 280.95263671875, 292.57122802734375, 304.1898193359375, 315.8083801269531, 327.4269714355469, 339.0455627441406, 350.6641540527344, 362.28271484375, 373.90130615234375, 385.5198974609375]}, "eval/loss": 1.884699821472168, "eval/wer": 0.2931722126317043, "eval/runtime": 880.9122, "eval/samples_per_second": 2.999, "eval/steps_per_second": 0.376} \ No newline at end of file