diff --git "a/wandb/run-20220307_135359-2ct09q1k/files/wandb-summary.json" "b/wandb/run-20220307_135359-2ct09q1k/files/wandb-summary.json" new file mode 100644--- /dev/null +++ "b/wandb/run-20220307_135359-2ct09q1k/files/wandb-summary.json" @@ -0,0 +1 @@ +{"train/loss": 6.1431, "train/learning_rate": 2.9109263657957245e-05, "train/epoch": 1.68, "train/global_step": 1500, "_runtime": 9625, "_timestamp": 1646670864, "_step": 1500, "gradients/decoder.cls.predictions.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 10.0, 4.0, 9.0, 2.0, 2.0, 24.0, 91.0, 20.0, 7.0, 10.0, 3.0, 30133.0, 129.0, 35.0, 11.0, 5.0, 3.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-213.5, -205.0703125, -196.640625, -188.2109375, -179.78125, -171.3515625, -162.921875, -154.4921875, -146.0625, -137.6328125, -129.203125, -120.7734375, -112.34375, -103.9140625, -95.484375, -87.0546875, -78.625, -70.1953125, -61.765625, -53.3359375, -44.90625, -36.4765625, -28.046875, -19.6171875, -11.1875, -2.7578125, 5.671875, 14.1015625, 22.53125, 30.9609375, 39.390625, 47.8203125, 56.25, 64.6796875, 73.109375, 81.5390625, 89.96875, 98.3984375, 106.828125, 115.2578125, 123.6875, 132.1171875, 140.546875, 148.9765625, 157.40625, 165.8359375, 174.265625, 182.6953125, 191.125, 199.5546875, 207.984375, 216.4140625, 224.84375, 233.2734375, 241.703125, 250.1328125, 258.5625, 266.9921875, 275.421875, 283.8515625, 292.28125, 300.7109375, 309.140625, 317.5703125, 326.0]}, "gradients/decoder.cls.predictions.transform.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 2.0, 3.0, 7.0, 1.0, 8.0, 4.0, 9.0, 7.0, 19.0, 21.0, 18.0, 23.0, 30.0, 38.0, 41.0, 39.0, 48.0, 42.0, 63.0, 49.0, 57.0, 64.0, 51.0, 49.0, 52.0, 37.0, 40.0, 27.0, 25.0, 28.0, 22.0, 22.0, 11.0, 8.0, 7.0, 5.0, 9.0, 3.0, 6.0, 4.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-80.18177032470703, -77.88196563720703, -75.5821533203125, -73.2823486328125, -70.98253631591797, -68.68273162841797, -66.38291931152344, -64.08311462402344, -61.78330612182617, -59.483497619628906, -57.18368911743164, -54.883880615234375, -52.584075927734375, -50.284263610839844, -47.984458923339844, -45.68465042114258, -43.38484191894531, -41.08503341674805, -38.78522491455078, -36.485416412353516, -34.18560791015625, -31.885801315307617, -29.585994720458984, -27.28618621826172, -24.986377716064453, -22.686569213867188, -20.386760711669922, -18.08695411682129, -15.787145614624023, -13.487337112426758, -11.187529563903809, -8.88772201538086, -6.5879058837890625, -4.288097858428955, -1.9882898330688477, 0.31151819229125977, 2.611326217651367, 4.911134719848633, 7.210942268371582, 9.510749816894531, 11.810558319091797, 14.110366821289062, 16.410175323486328, 18.70998191833496, 21.009790420532227, 23.309598922729492, 25.609405517578125, 27.90921401977539, 30.209022521972656, 32.50883102416992, 34.80863952636719, 37.10844802856445, 39.40825653076172, 41.70806121826172, 44.007869720458984, 46.30767822265625, 48.607486724853516, 50.90729522705078, 53.20710372924805, 55.50691223144531, 57.80671691894531, 60.106529235839844, 62.406333923339844, 64.70614624023438, 67.00595092773438]}, "gradients/decoder.cls.predictions.transform.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 1.0, 4.0, 5.0, 6.0, 11.0, 12.0, 12.0, 17.0, 21.0, 15.0, 21.0, 23.0, 34.0, 42.0, 24.0, 32.0, 33.0, 33.0, 34.0, 38.0, 34.0, 47.0, 50.0, 44.0, 37.0, 45.0, 36.0, 43.0, 37.0, 26.0, 21.0, 16.0, 26.0, 25.0, 20.0, 18.0, 13.0, 13.0, 8.0, 3.0, 2.0, 6.0, 6.0, 4.0, 6.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-62.045013427734375, -60.00284957885742, -57.960689544677734, -55.91852569580078, -53.876365661621094, -51.83420181274414, -49.79203796386719, -47.7498779296875, -45.70771408081055, -43.665550231933594, -41.623390197753906, -39.58122634887695, -37.5390625, -35.49690246582031, -33.45473861694336, -31.41257667541504, -29.37041473388672, -27.3282527923584, -25.286090850830078, -23.243927001953125, -21.201765060424805, -19.159603118896484, -17.11743927001953, -15.075277328491211, -13.03311538696289, -10.99095344543457, -8.948790550231934, -6.906628131866455, -4.864465713500977, -2.8223037719726562, -0.7801408767700195, 1.2620220184326172, 3.3041763305664062, 5.346338748931885, 7.388501167297363, 9.4306640625, 11.47282600402832, 13.51498794555664, 15.557150840759277, 17.599313735961914, 19.641475677490234, 21.683637619018555, 23.725799560546875, 25.767963409423828, 27.81012535095215, 29.85228729248047, 31.894451141357422, 33.936614990234375, 35.97877502441406, 38.020938873291016, 40.0630989074707, 42.105262756347656, 44.147422790527344, 46.1895866394043, 48.23175048828125, 50.27391052246094, 52.31607437133789, 54.358238220214844, 56.40039825439453, 58.442562103271484, 60.48472595214844, 62.526885986328125, 64.56904602050781, 66.61121368408203, 68.65337371826172]}, "gradients/decoder.cls.predictions.transform.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 4.0, 1.0, 7.0, 8.0, 17.0, 20.0, 39.0, 44.0, 83.0, 103.0, 185.0, 287.0, 467.0, 682.0, 1036.0, 1589.0, 2461.0, 3733.0, 5655.0, 8615.0, 13184.0, 20458.0, 30955.0, 46610.0, 71287.0, 114712.0, 229867.0, 200377.0, 104240.0, 65853.0, 43386.0, 28427.0, 18748.0, 12257.0, 8043.0, 5278.0, 3425.0, 2203.0, 1447.0, 931.0, 621.0, 409.0, 279.0, 188.0, 116.0, 82.0, 46.0, 39.0, 18.0, 19.0, 8.0, 9.0, 2.0, 3.0, 2.0, 3.0], "bins": [-204.125, -198.27734375, -192.4296875, -186.58203125, -180.734375, -174.88671875, -169.0390625, -163.19140625, -157.34375, -151.49609375, -145.6484375, -139.80078125, -133.953125, -128.10546875, -122.2578125, -116.41015625, -110.5625, -104.71484375, -98.8671875, -93.01953125, -87.171875, -81.32421875, -75.4765625, -69.62890625, -63.78125, -57.93359375, -52.0859375, -46.23828125, -40.390625, -34.54296875, -28.6953125, -22.84765625, -17.0, -11.15234375, -5.3046875, 0.54296875, 6.390625, 12.23828125, 18.0859375, 23.93359375, 29.78125, 35.62890625, 41.4765625, 47.32421875, 53.171875, 59.01953125, 64.8671875, 70.71484375, 76.5625, 82.41015625, 88.2578125, 94.10546875, 99.953125, 105.80078125, 111.6484375, 117.49609375, 123.34375, 129.19140625, 135.0390625, 140.88671875, 146.734375, 152.58203125, 158.4296875, 164.27734375, 170.125]}, "gradients/decoder.cls.predictions.transform.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 8.0, 3.0, 3.0, 3.0, 6.0, 7.0, 6.0, 5.0, 7.0, 10.0, 13.0, 13.0, 19.0, 18.0, 29.0, 23.0, 27.0, 25.0, 40.0, 36.0, 67.0, 63.0, 88.0, 84.0, 71.0, 65.0, 33.0, 34.0, 30.0, 32.0, 24.0, 19.0, 15.0, 15.0, 18.0, 8.0, 6.0, 11.0, 9.0, 12.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-79.875, -77.451171875, -75.02734375, -72.603515625, -70.1796875, -67.755859375, -65.33203125, -62.908203125, -60.484375, -58.060546875, -55.63671875, -53.212890625, -50.7890625, -48.365234375, -45.94140625, -43.517578125, -41.09375, -38.669921875, -36.24609375, -33.822265625, -31.3984375, -28.974609375, -26.55078125, -24.126953125, -21.703125, -19.279296875, -16.85546875, -14.431640625, -12.0078125, -9.583984375, -7.16015625, -4.736328125, -2.3125, 0.111328125, 2.53515625, 4.958984375, 7.3828125, 9.806640625, 12.23046875, 14.654296875, 17.078125, 19.501953125, 21.92578125, 24.349609375, 26.7734375, 29.197265625, 31.62109375, 34.044921875, 36.46875, 38.892578125, 41.31640625, 43.740234375, 46.1640625, 48.587890625, 51.01171875, 53.435546875, 55.859375, 58.283203125, 60.70703125, 63.130859375, 65.5546875, 67.978515625, 70.40234375, 72.826171875, 75.25]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 2.0, 4.0, 6.0, 8.0, 9.0, 12.0, 17.0, 21.0, 20.0, 21.0, 29.0, 37.0, 48.0, 55.0, 49.0, 75.0, 50.0, 73.0, 63.0, 63.0, 39.0, 48.0, 51.0, 32.0, 23.0, 37.0, 28.0, 17.0, 21.0, 11.0, 8.0, 7.0, 6.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.38386535644531, -48.77256774902344, -47.16127395629883, -45.54998016357422, -43.938682556152344, -42.32738494873047, -40.71609115600586, -39.10479736328125, -37.493499755859375, -35.8822021484375, -34.27090835571289, -32.65961456298828, -31.048316955566406, -29.437021255493164, -27.825725555419922, -26.21442985534668, -24.603134155273438, -22.991838455200195, -21.380542755126953, -19.76924705505371, -18.15795135498047, -16.546655654907227, -14.935359954833984, -13.324064254760742, -11.7127685546875, -10.101472854614258, -8.490177154541016, -6.878881454467773, -5.267585754394531, -3.656290054321289, -2.044994354248047, -0.4336986541748047, 1.1776008605957031, 2.7888965606689453, 4.4001922607421875, 6.01148796081543, 7.622783660888672, 9.234079360961914, 10.845375061035156, 12.456670761108398, 14.06796646118164, 15.679262161254883, 17.290557861328125, 18.901853561401367, 20.51314926147461, 22.12444496154785, 23.735740661621094, 25.347036361694336, 26.958332061767578, 28.56962776184082, 30.180923461914062, 31.792219161987305, 33.40351486206055, 35.014808654785156, 36.62610626220703, 38.237403869628906, 39.848697662353516, 41.459991455078125, 43.0712890625, 44.682586669921875, 46.293880462646484, 47.905174255371094, 49.51647186279297, 51.127769470214844, 52.73906326293945]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 8.0, 5.0, 11.0, 10.0, 13.0, 12.0, 12.0, 10.0, 20.0, 28.0, 23.0, 22.0, 35.0, 26.0, 30.0, 29.0, 33.0, 39.0, 46.0, 46.0, 37.0, 34.0, 35.0, 28.0, 42.0, 41.0, 34.0, 26.0, 37.0, 21.0, 26.0, 24.0, 26.0, 18.0, 23.0, 18.0, 14.0, 8.0, 8.0, 13.0, 7.0, 6.0, 3.0, 4.0, 6.0, 3.0, 2.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-36.74040222167969, -35.52992630004883, -34.3194465637207, -33.108970642089844, -31.898494720458984, -30.688016891479492, -29.4775390625, -28.26706314086914, -27.05658721923828, -25.84610939025879, -24.63563346862793, -23.425155639648438, -22.214679718017578, -21.004201889038086, -19.793724060058594, -18.583248138427734, -17.372770309448242, -16.16229248046875, -14.95181655883789, -13.741338729858398, -12.530862808227539, -11.320384979248047, -10.109908103942871, -8.899431228637695, -7.6889543533325195, -6.478477478027344, -5.268000602722168, -4.057523250579834, -2.847046375274658, -1.6365694999694824, -0.42609214782714844, 0.7843847274780273, 1.9948616027832031, 3.205338478088379, 4.415815353393555, 5.626292705535889, 6.8367695808410645, 8.047246932983398, 9.257723808288574, 10.46820068359375, 11.678677558898926, 12.889154434204102, 14.099631309509277, 15.310108184814453, 16.520586013793945, 17.731061935424805, 18.941539764404297, 20.152015686035156, 21.36249351501465, 22.57297134399414, 23.783447265625, 24.993925094604492, 26.20440101623535, 27.414878845214844, 28.625354766845703, 29.835832595825195, 31.046310424804688, 32.25678634643555, 33.46726608276367, 34.67774200439453, 35.88821792602539, 37.09869384765625, 38.309173583984375, 39.519649505615234, 40.730125427246094]}, "gradients/decoder.bert.encoder.layer.23.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 6.0, 6.0, 4.0, 13.0, 12.0, 21.0, 38.0, 48.0, 62.0, 125.0, 189.0, 320.0, 442.0, 751.0, 1083.0, 1809.0, 2774.0, 4480.0, 7099.0, 11589.0, 19156.0, 31775.0, 53682.0, 96417.0, 183315.0, 385481.0, 771205.0, 1051964.0, 779449.0, 380478.0, 180476.0, 94606.0, 53603.0, 30644.0, 18678.0, 11660.0, 7148.0, 4624.0, 3059.0, 2026.0, 1299.0, 895.0, 607.0, 380.0, 244.0, 179.0, 126.0, 77.0, 56.0, 36.0, 34.0, 13.0, 13.0, 7.0, 8.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-36.5, -35.30322265625, -34.1064453125, -32.90966796875, -31.712890625, -30.51611328125, -29.3193359375, -28.12255859375, -26.92578125, -25.72900390625, -24.5322265625, -23.33544921875, -22.138671875, -20.94189453125, -19.7451171875, -18.54833984375, -17.3515625, -16.15478515625, -14.9580078125, -13.76123046875, -12.564453125, -11.36767578125, -10.1708984375, -8.97412109375, -7.77734375, -6.58056640625, -5.3837890625, -4.18701171875, -2.990234375, -1.79345703125, -0.5966796875, 0.60009765625, 1.796875, 2.99365234375, 4.1904296875, 5.38720703125, 6.583984375, 7.78076171875, 8.9775390625, 10.17431640625, 11.37109375, 12.56787109375, 13.7646484375, 14.96142578125, 16.158203125, 17.35498046875, 18.5517578125, 19.74853515625, 20.9453125, 22.14208984375, 23.3388671875, 24.53564453125, 25.732421875, 26.92919921875, 28.1259765625, 29.32275390625, 30.51953125, 31.71630859375, 32.9130859375, 34.10986328125, 35.306640625, 36.50341796875, 37.7001953125, 38.89697265625, 40.09375]}, "gradients/decoder.bert.encoder.layer.23.output.dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 5.0, 1.0, 3.0, 6.0, 8.0, 5.0, 6.0, 7.0, 10.0, 12.0, 13.0, 19.0, 16.0, 14.0, 19.0, 21.0, 28.0, 29.0, 37.0, 29.0, 30.0, 23.0, 44.0, 48.0, 48.0, 34.0, 25.0, 40.0, 39.0, 31.0, 32.0, 44.0, 31.0, 23.0, 23.0, 29.0, 19.0, 22.0, 20.0, 15.0, 18.0, 8.0, 17.0, 10.0, 8.0, 7.0, 9.0, 6.0, 5.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 5.0, 1.0, 3.0, 0.0, 1.0], "bins": [-23.109375, -22.345947265625, -21.58251953125, -20.819091796875, -20.0556640625, -19.292236328125, -18.52880859375, -17.765380859375, -17.001953125, -16.238525390625, -15.47509765625, -14.711669921875, -13.9482421875, -13.184814453125, -12.42138671875, -11.657958984375, -10.89453125, -10.131103515625, -9.36767578125, -8.604248046875, -7.8408203125, -7.077392578125, -6.31396484375, -5.550537109375, -4.787109375, -4.023681640625, -3.26025390625, -2.496826171875, -1.7333984375, -0.969970703125, -0.20654296875, 0.556884765625, 1.3203125, 2.083740234375, 2.84716796875, 3.610595703125, 4.3740234375, 5.137451171875, 5.90087890625, 6.664306640625, 7.427734375, 8.191162109375, 8.95458984375, 9.718017578125, 10.4814453125, 11.244873046875, 12.00830078125, 12.771728515625, 13.53515625, 14.298583984375, 15.06201171875, 15.825439453125, 16.5888671875, 17.352294921875, 18.11572265625, 18.879150390625, 19.642578125, 20.406005859375, 21.16943359375, 21.932861328125, 22.6962890625, 23.459716796875, 24.22314453125, 24.986572265625, 25.75]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 5.0, 8.0, 19.0, 27.0, 32.0, 54.0, 71.0, 125.0, 197.0, 256.0, 414.0, 669.0, 955.0, 1531.0, 2363.0, 3525.0, 5638.0, 8611.0, 13962.0, 22293.0, 35956.0, 58900.0, 97027.0, 159595.0, 263076.0, 427195.0, 680334.0, 831018.0, 607938.0, 377825.0, 231557.0, 140493.0, 85309.0, 51776.0, 31900.0, 19530.0, 12055.0, 7797.0, 4977.0, 3178.0, 2117.0, 1408.0, 835.0, 615.0, 393.0, 253.0, 163.0, 103.0, 87.0, 37.0, 29.0, 28.0, 13.0, 6.0, 8.0, 7.0, 1.0, 0.0, 1.0, 1.0], "bins": [-29.609375, -28.66552734375, -27.7216796875, -26.77783203125, -25.833984375, -24.89013671875, -23.9462890625, -23.00244140625, -22.05859375, -21.11474609375, -20.1708984375, -19.22705078125, -18.283203125, -17.33935546875, -16.3955078125, -15.45166015625, -14.5078125, -13.56396484375, -12.6201171875, -11.67626953125, -10.732421875, -9.78857421875, -8.8447265625, -7.90087890625, -6.95703125, -6.01318359375, -5.0693359375, -4.12548828125, -3.181640625, -2.23779296875, -1.2939453125, -0.35009765625, 0.59375, 1.53759765625, 2.4814453125, 3.42529296875, 4.369140625, 5.31298828125, 6.2568359375, 7.20068359375, 8.14453125, 9.08837890625, 10.0322265625, 10.97607421875, 11.919921875, 12.86376953125, 13.8076171875, 14.75146484375, 15.6953125, 16.63916015625, 17.5830078125, 18.52685546875, 19.470703125, 20.41455078125, 21.3583984375, 22.30224609375, 23.24609375, 24.18994140625, 25.1337890625, 26.07763671875, 27.021484375, 27.96533203125, 28.9091796875, 29.85302734375, 30.796875]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 5.0, 12.0, 7.0, 11.0, 8.0, 12.0, 10.0, 19.0, 29.0, 37.0, 37.0, 33.0, 52.0, 59.0, 81.0, 101.0, 91.0, 120.0, 124.0, 193.0, 212.0, 244.0, 291.0, 293.0, 328.0, 273.0, 221.0, 208.0, 166.0, 147.0, 127.0, 97.0, 86.0, 76.0, 52.0, 44.0, 32.0, 36.0, 25.0, 21.0, 19.0, 13.0, 5.0, 4.0, 6.0, 3.0, 3.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.734375, -12.3365478515625, -11.938720703125, -11.5408935546875, -11.14306640625, -10.7452392578125, -10.347412109375, -9.9495849609375, -9.5517578125, -9.1539306640625, -8.756103515625, -8.3582763671875, -7.96044921875, -7.5626220703125, -7.164794921875, -6.7669677734375, -6.369140625, -5.9713134765625, -5.573486328125, -5.1756591796875, -4.77783203125, -4.3800048828125, -3.982177734375, -3.5843505859375, -3.1865234375, -2.7886962890625, -2.390869140625, -1.9930419921875, -1.59521484375, -1.1973876953125, -0.799560546875, -0.4017333984375, -0.00390625, 0.3939208984375, 0.791748046875, 1.1895751953125, 1.58740234375, 1.9852294921875, 2.383056640625, 2.7808837890625, 3.1787109375, 3.5765380859375, 3.974365234375, 4.3721923828125, 4.77001953125, 5.1678466796875, 5.565673828125, 5.9635009765625, 6.361328125, 6.7591552734375, 7.156982421875, 7.5548095703125, 7.95263671875, 8.3504638671875, 8.748291015625, 9.1461181640625, 9.5439453125, 9.9417724609375, 10.339599609375, 10.7374267578125, 11.13525390625, 11.5330810546875, 11.930908203125, 12.3287353515625, 12.7265625]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 3.0, 7.0, 5.0, 6.0, 4.0, 13.0, 7.0, 12.0, 17.0, 13.0, 26.0, 15.0, 35.0, 29.0, 32.0, 41.0, 36.0, 56.0, 46.0, 50.0, 60.0, 64.0, 41.0, 43.0, 50.0, 43.0, 35.0, 27.0, 34.0, 25.0, 30.0, 23.0, 13.0, 18.0, 7.0, 8.0, 8.0, 3.0, 3.0, 4.0, 3.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-32.98836898803711, -32.030860900878906, -31.073352813720703, -30.1158447265625, -29.158336639404297, -28.200828552246094, -27.24332046508789, -26.285812377929688, -25.328304290771484, -24.37079620361328, -23.413288116455078, -22.455780029296875, -21.498271942138672, -20.54076385498047, -19.583255767822266, -18.625747680664062, -17.668237686157227, -16.710729598999023, -15.75322151184082, -14.795713424682617, -13.838205337524414, -12.880697250366211, -11.923188209533691, -10.965680122375488, -10.008172035217285, -9.050663948059082, -8.093155860900879, -7.135647296905518, -6.1781392097473145, -5.220631122589111, -4.26312255859375, -3.305614471435547, -2.3481063842773438, -1.390598177909851, -0.4330899715423584, 0.5244183540344238, 1.481926441192627, 2.43943452835083, 3.3969430923461914, 4.3544511795043945, 5.311959266662598, 6.269467353820801, 7.226975440979004, 8.184484481811523, 9.141992568969727, 10.09950065612793, 11.057008743286133, 12.014516830444336, 12.972024917602539, 13.929533004760742, 14.887041091918945, 15.844549179077148, 16.80205726623535, 17.759565353393555, 18.71707534790039, 19.674583435058594, 20.632091522216797, 21.589599609375, 22.547107696533203, 23.504615783691406, 24.46212387084961, 25.419631958007812, 26.377140045166016, 27.33464813232422, 28.292156219482422]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 1.0, 8.0, 5.0, 4.0, 3.0, 10.0, 16.0, 26.0, 14.0, 19.0, 15.0, 21.0, 21.0, 31.0, 34.0, 23.0, 37.0, 35.0, 45.0, 34.0, 48.0, 49.0, 30.0, 41.0, 32.0, 53.0, 37.0, 37.0, 39.0, 34.0, 22.0, 22.0, 27.0, 24.0, 19.0, 12.0, 10.0, 13.0, 10.0, 7.0, 7.0, 11.0, 6.0, 5.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.612638473510742, -27.6652889251709, -26.717939376831055, -25.77058982849121, -24.823240280151367, -23.875890731811523, -22.928543090820312, -21.98119354248047, -21.033843994140625, -20.08649444580078, -19.139144897460938, -18.191795349121094, -17.24444580078125, -16.297096252441406, -15.349747657775879, -14.402398109436035, -13.455047607421875, -12.507698059082031, -11.560348510742188, -10.612998962402344, -9.6656494140625, -8.718299865722656, -7.770951271057129, -6.823601722717285, -5.876252174377441, -4.928902626037598, -3.981553316116333, -3.0342040061950684, -2.0868544578552246, -1.1395049095153809, -0.1921558380126953, 0.7551937103271484, 1.7025413513183594, 2.649890899658203, 3.5972402095794678, 4.544589519500732, 5.491939067840576, 6.43928861618042, 7.3866376876831055, 8.33398723602295, 9.281336784362793, 10.228686332702637, 11.17603588104248, 12.123384475708008, 13.070734024047852, 14.018083572387695, 14.965433120727539, 15.912782669067383, 16.860132217407227, 17.80748176574707, 18.754831314086914, 19.702180862426758, 20.6495304107666, 21.596879959106445, 22.544227600097656, 23.4915771484375, 24.438926696777344, 25.386276245117188, 26.33362579345703, 27.280975341796875, 28.22832489013672, 29.175674438476562, 30.123023986816406, 31.07037353515625, 32.017723083496094]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 10.0, 7.0, 11.0, 32.0, 24.0, 44.0, 53.0, 83.0, 102.0, 161.0, 274.0, 469.0, 805.0, 1664.0, 3310.0, 7099.0, 17123.0, 46530.0, 136836.0, 373005.0, 298807.0, 101682.0, 35470.0, 13347.0, 5701.0, 2690.0, 1419.0, 699.0, 388.0, 236.0, 146.0, 106.0, 79.0, 44.0, 34.0, 28.0, 12.0, 9.0, 5.0, 2.0, 5.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.46875, -28.5439453125, -27.619140625, -26.6943359375, -25.76953125, -24.8447265625, -23.919921875, -22.9951171875, -22.0703125, -21.1455078125, -20.220703125, -19.2958984375, -18.37109375, -17.4462890625, -16.521484375, -15.5966796875, -14.671875, -13.7470703125, -12.822265625, -11.8974609375, -10.97265625, -10.0478515625, -9.123046875, -8.1982421875, -7.2734375, -6.3486328125, -5.423828125, -4.4990234375, -3.57421875, -2.6494140625, -1.724609375, -0.7998046875, 0.125, 1.0498046875, 1.974609375, 2.8994140625, 3.82421875, 4.7490234375, 5.673828125, 6.5986328125, 7.5234375, 8.4482421875, 9.373046875, 10.2978515625, 11.22265625, 12.1474609375, 13.072265625, 13.9970703125, 14.921875, 15.8466796875, 16.771484375, 17.6962890625, 18.62109375, 19.5458984375, 20.470703125, 21.3955078125, 22.3203125, 23.2451171875, 24.169921875, 25.0947265625, 26.01953125, 26.9443359375, 27.869140625, 28.7939453125, 29.71875]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 8.0, 6.0, 7.0, 11.0, 11.0, 17.0, 14.0, 23.0, 23.0, 23.0, 24.0, 32.0, 28.0, 33.0, 38.0, 40.0, 38.0, 49.0, 38.0, 46.0, 36.0, 42.0, 52.0, 43.0, 26.0, 27.0, 28.0, 45.0, 38.0, 21.0, 29.0, 22.0, 11.0, 13.0, 14.0, 8.0, 6.0, 5.0, 5.0, 4.0, 6.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.484375, -25.528564453125, -24.57275390625, -23.616943359375, -22.6611328125, -21.705322265625, -20.74951171875, -19.793701171875, -18.837890625, -17.882080078125, -16.92626953125, -15.970458984375, -15.0146484375, -14.058837890625, -13.10302734375, -12.147216796875, -11.19140625, -10.235595703125, -9.27978515625, -8.323974609375, -7.3681640625, -6.412353515625, -5.45654296875, -4.500732421875, -3.544921875, -2.589111328125, -1.63330078125, -0.677490234375, 0.2783203125, 1.234130859375, 2.18994140625, 3.145751953125, 4.1015625, 5.057373046875, 6.01318359375, 6.968994140625, 7.9248046875, 8.880615234375, 9.83642578125, 10.792236328125, 11.748046875, 12.703857421875, 13.65966796875, 14.615478515625, 15.5712890625, 16.527099609375, 17.48291015625, 18.438720703125, 19.39453125, 20.350341796875, 21.30615234375, 22.261962890625, 23.2177734375, 24.173583984375, 25.12939453125, 26.085205078125, 27.041015625, 27.996826171875, 28.95263671875, 29.908447265625, 30.8642578125, 31.820068359375, 32.77587890625, 33.731689453125, 34.6875]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 6.0, 6.0, 9.0, 5.0, 8.0, 14.0, 13.0, 24.0, 42.0, 66.0, 75.0, 95.0, 161.0, 269.0, 458.0, 804.0, 1500.0, 2870.0, 5635.0, 12593.0, 29733.0, 72656.0, 185306.0, 368667.0, 218039.0, 86300.0, 34525.0, 14820.0, 6658.0, 3264.0, 1650.0, 874.0, 547.0, 278.0, 189.0, 113.0, 85.0, 55.0, 40.0, 41.0, 22.0, 7.0, 15.0, 10.0, 4.0, 7.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.3828125, -12.97216796875, -12.5615234375, -12.15087890625, -11.740234375, -11.32958984375, -10.9189453125, -10.50830078125, -10.09765625, -9.68701171875, -9.2763671875, -8.86572265625, -8.455078125, -8.04443359375, -7.6337890625, -7.22314453125, -6.8125, -6.40185546875, -5.9912109375, -5.58056640625, -5.169921875, -4.75927734375, -4.3486328125, -3.93798828125, -3.52734375, -3.11669921875, -2.7060546875, -2.29541015625, -1.884765625, -1.47412109375, -1.0634765625, -0.65283203125, -0.2421875, 0.16845703125, 0.5791015625, 0.98974609375, 1.400390625, 1.81103515625, 2.2216796875, 2.63232421875, 3.04296875, 3.45361328125, 3.8642578125, 4.27490234375, 4.685546875, 5.09619140625, 5.5068359375, 5.91748046875, 6.328125, 6.73876953125, 7.1494140625, 7.56005859375, 7.970703125, 8.38134765625, 8.7919921875, 9.20263671875, 9.61328125, 10.02392578125, 10.4345703125, 10.84521484375, 11.255859375, 11.66650390625, 12.0771484375, 12.48779296875, 12.8984375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 6.0, 4.0, 5.0, 8.0, 11.0, 9.0, 9.0, 13.0, 14.0, 17.0, 28.0, 25.0, 27.0, 36.0, 22.0, 37.0, 28.0, 46.0, 50.0, 46.0, 30.0, 42.0, 33.0, 45.0, 39.0, 43.0, 37.0, 37.0, 35.0, 32.0, 24.0, 30.0, 16.0, 27.0, 24.0, 14.0, 15.0, 13.0, 7.0, 5.0, 7.0, 3.0, 3.0, 2.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-21.203125, -20.576904296875, -19.95068359375, -19.324462890625, -18.6982421875, -18.072021484375, -17.44580078125, -16.819580078125, -16.193359375, -15.567138671875, -14.94091796875, -14.314697265625, -13.6884765625, -13.062255859375, -12.43603515625, -11.809814453125, -11.18359375, -10.557373046875, -9.93115234375, -9.304931640625, -8.6787109375, -8.052490234375, -7.42626953125, -6.800048828125, -6.173828125, -5.547607421875, -4.92138671875, -4.295166015625, -3.6689453125, -3.042724609375, -2.41650390625, -1.790283203125, -1.1640625, -0.537841796875, 0.08837890625, 0.714599609375, 1.3408203125, 1.967041015625, 2.59326171875, 3.219482421875, 3.845703125, 4.471923828125, 5.09814453125, 5.724365234375, 6.3505859375, 6.976806640625, 7.60302734375, 8.229248046875, 8.85546875, 9.481689453125, 10.10791015625, 10.734130859375, 11.3603515625, 11.986572265625, 12.61279296875, 13.239013671875, 13.865234375, 14.491455078125, 15.11767578125, 15.743896484375, 16.3701171875, 16.996337890625, 17.62255859375, 18.248779296875, 18.875]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 6.0, 8.0, 11.0, 16.0, 20.0, 26.0, 28.0, 41.0, 58.0, 85.0, 110.0, 162.0, 235.0, 375.0, 492.0, 812.0, 1315.0, 2088.0, 3668.0, 7114.0, 16840.0, 69126.0, 577572.0, 300733.0, 41070.0, 12514.0, 5654.0, 3208.0, 1827.0, 1084.0, 692.0, 504.0, 296.0, 215.0, 141.0, 126.0, 71.0, 52.0, 52.0, 30.0, 21.0, 15.0, 10.0, 11.0, 5.0, 7.0, 5.0, 5.0, 3.0, 3.0, 0.0, 1.0], "bins": [-6.9375, -6.7384033203125, -6.539306640625, -6.3402099609375, -6.14111328125, -5.9420166015625, -5.742919921875, -5.5438232421875, -5.3447265625, -5.1456298828125, -4.946533203125, -4.7474365234375, -4.54833984375, -4.3492431640625, -4.150146484375, -3.9510498046875, -3.751953125, -3.5528564453125, -3.353759765625, -3.1546630859375, -2.95556640625, -2.7564697265625, -2.557373046875, -2.3582763671875, -2.1591796875, -1.9600830078125, -1.760986328125, -1.5618896484375, -1.36279296875, -1.1636962890625, -0.964599609375, -0.7655029296875, -0.56640625, -0.3673095703125, -0.168212890625, 0.0308837890625, 0.22998046875, 0.4290771484375, 0.628173828125, 0.8272705078125, 1.0263671875, 1.2254638671875, 1.424560546875, 1.6236572265625, 1.82275390625, 2.0218505859375, 2.220947265625, 2.4200439453125, 2.619140625, 2.8182373046875, 3.017333984375, 3.2164306640625, 3.41552734375, 3.6146240234375, 3.813720703125, 4.0128173828125, 4.2119140625, 4.4110107421875, 4.610107421875, 4.8092041015625, 5.00830078125, 5.2073974609375, 5.406494140625, 5.6055908203125, 5.8046875]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 5.0, 11.0, 8.0, 21.0, 35.0, 54.0, 86.0, 182.0, 247.0, 158.0, 82.0, 37.0, 26.0, 15.0, 11.0, 12.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007305145263671875, -0.0006980001926422119, -0.0006654858589172363, -0.0006329715251922607, -0.0006004571914672852, -0.0005679428577423096, -0.000535428524017334, -0.0005029141902923584, -0.0004703998565673828, -0.0004378855228424072, -0.00040537118911743164, -0.00037285685539245605, -0.00034034252166748047, -0.0003078281879425049, -0.0002753138542175293, -0.0002427995204925537, -0.00021028518676757812, -0.00017777085304260254, -0.00014525651931762695, -0.00011274218559265137, -8.022785186767578e-05, -4.7713518142700195e-05, -1.519918441772461e-05, 1.7315149307250977e-05, 4.982948303222656e-05, 8.234381675720215e-05, 0.00011485815048217773, 0.00014737248420715332, 0.0001798868179321289, 0.0002124011516571045, 0.0002449154853820801, 0.00027742981910705566, 0.00030994415283203125, 0.00034245848655700684, 0.0003749728202819824, 0.000407487154006958, 0.0004400014877319336, 0.0004725158214569092, 0.0005050301551818848, 0.0005375444889068604, 0.0005700588226318359, 0.0006025731563568115, 0.0006350874900817871, 0.0006676018238067627, 0.0007001161575317383, 0.0007326304912567139, 0.0007651448249816895, 0.000797659158706665, 0.0008301734924316406, 0.0008626878261566162, 0.0008952021598815918, 0.0009277164936065674, 0.000960230827331543, 0.0009927451610565186, 0.0010252594947814941, 0.0010577738285064697, 0.0010902881622314453, 0.001122802495956421, 0.0011553168296813965, 0.001187831163406372, 0.0012203454971313477, 0.0012528598308563232, 0.0012853741645812988, 0.0013178884983062744, 0.00135040283203125]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 6.0, 4.0, 7.0, 12.0, 33.0, 29.0, 53.0, 101.0, 137.0, 215.0, 309.0, 492.0, 585.0, 1010.0, 1468.0, 2415.0, 4036.0, 8881.0, 28437.0, 161650.0, 664559.0, 130885.0, 24760.0, 8123.0, 3785.0, 2269.0, 1424.0, 960.0, 620.0, 434.0, 305.0, 180.0, 146.0, 90.0, 48.0, 38.0, 20.0, 17.0, 6.0, 6.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.8203125, -9.508056640625, -9.19580078125, -8.883544921875, -8.5712890625, -8.259033203125, -7.94677734375, -7.634521484375, -7.322265625, -7.010009765625, -6.69775390625, -6.385498046875, -6.0732421875, -5.760986328125, -5.44873046875, -5.136474609375, -4.82421875, -4.511962890625, -4.19970703125, -3.887451171875, -3.5751953125, -3.262939453125, -2.95068359375, -2.638427734375, -2.326171875, -2.013916015625, -1.70166015625, -1.389404296875, -1.0771484375, -0.764892578125, -0.45263671875, -0.140380859375, 0.171875, 0.484130859375, 0.79638671875, 1.108642578125, 1.4208984375, 1.733154296875, 2.04541015625, 2.357666015625, 2.669921875, 2.982177734375, 3.29443359375, 3.606689453125, 3.9189453125, 4.231201171875, 4.54345703125, 4.855712890625, 5.16796875, 5.480224609375, 5.79248046875, 6.104736328125, 6.4169921875, 6.729248046875, 7.04150390625, 7.353759765625, 7.666015625, 7.978271484375, 8.29052734375, 8.602783203125, 8.9150390625, 9.227294921875, 9.53955078125, 9.851806640625, 10.1640625]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 2.0, 14.0, 22.0, 26.0, 34.0, 65.0, 170.0, 231.0, 200.0, 93.0, 40.0, 23.0, 19.0, 9.0, 11.0, 3.0, 2.0, 3.0, 4.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.431640625, -2.3570556640625, -2.282470703125, -2.2078857421875, -2.13330078125, -2.0587158203125, -1.984130859375, -1.9095458984375, -1.8349609375, -1.7603759765625, -1.685791015625, -1.6112060546875, -1.53662109375, -1.4620361328125, -1.387451171875, -1.3128662109375, -1.23828125, -1.1636962890625, -1.089111328125, -1.0145263671875, -0.93994140625, -0.8653564453125, -0.790771484375, -0.7161865234375, -0.6416015625, -0.5670166015625, -0.492431640625, -0.4178466796875, -0.34326171875, -0.2686767578125, -0.194091796875, -0.1195068359375, -0.044921875, 0.0296630859375, 0.104248046875, 0.1788330078125, 0.25341796875, 0.3280029296875, 0.402587890625, 0.4771728515625, 0.5517578125, 0.6263427734375, 0.700927734375, 0.7755126953125, 0.85009765625, 0.9246826171875, 0.999267578125, 1.0738525390625, 1.1484375, 1.2230224609375, 1.297607421875, 1.3721923828125, 1.44677734375, 1.5213623046875, 1.595947265625, 1.6705322265625, 1.7451171875, 1.8197021484375, 1.894287109375, 1.9688720703125, 2.04345703125, 2.1180419921875, 2.192626953125, 2.2672119140625, 2.341796875]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 8.0, 4.0, 4.0, 7.0, 5.0, 4.0, 7.0, 11.0, 15.0, 21.0, 10.0, 11.0, 22.0, 29.0, 31.0, 33.0, 41.0, 36.0, 45.0, 56.0, 40.0, 50.0, 47.0, 63.0, 47.0, 46.0, 48.0, 36.0, 32.0, 25.0, 23.0, 28.0, 25.0, 18.0, 20.0, 12.0, 6.0, 9.0, 6.0, 3.0, 1.0, 6.0, 4.0, 5.0, 1.0, 0.0, 2.0, 2.0, 3.0], "bins": [-31.633893966674805, -30.776430130004883, -29.91896629333496, -29.061500549316406, -28.204036712646484, -27.346572875976562, -26.48910903930664, -25.63164520263672, -24.774179458618164, -23.916715621948242, -23.05925178527832, -22.201786041259766, -21.344322204589844, -20.486858367919922, -19.62939453125, -18.771930694580078, -17.914466857910156, -17.057003021240234, -16.199539184570312, -15.342074394226074, -14.484609603881836, -13.627145767211914, -12.769681930541992, -11.912217140197754, -11.054752349853516, -10.197288513183594, -9.339823722839355, -8.482359886169434, -7.624895095825195, -6.767431259155273, -5.909966945648193, -5.052502632141113, -4.195037841796875, -3.337573528289795, -2.480109214782715, -1.6226451396942139, -0.7651808261871338, 0.09228324890136719, 0.9497475624084473, 1.8072118759155273, 2.6646761894226074, 3.5221405029296875, 4.379604816436768, 5.237069129943848, 6.0945329666137695, 6.95199728012085, 7.80946159362793, 8.666925430297852, 9.52439022064209, 10.381854057312012, 11.23931884765625, 12.096782684326172, 12.95424747467041, 13.811711311340332, 14.66917610168457, 15.526639938354492, 16.384103775024414, 17.241567611694336, 18.099031448364258, 18.956497192382812, 19.813961029052734, 20.671424865722656, 21.528888702392578, 22.3863525390625, 23.243818283081055]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 5.0, 5.0, 4.0, 6.0, 9.0, 13.0, 26.0, 13.0, 18.0, 17.0, 23.0, 21.0, 29.0, 32.0, 26.0, 38.0, 31.0, 43.0, 38.0, 47.0, 43.0, 35.0, 39.0, 46.0, 43.0, 38.0, 42.0, 32.0, 35.0, 30.0, 17.0, 29.0, 16.0, 24.0, 12.0, 14.0, 12.0, 7.0, 11.0, 4.0, 11.0, 8.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.001211166381836, -26.108997344970703, -25.216781616210938, -24.324567794799805, -23.43235206604004, -22.540138244628906, -21.64792251586914, -20.755708694458008, -19.863492965698242, -18.97127914428711, -18.079063415527344, -17.18684959411621, -16.294633865356445, -15.402420043945312, -14.510204315185547, -13.617990493774414, -12.725775718688965, -11.833560943603516, -10.941346168518066, -10.049131393432617, -9.156916618347168, -8.264701843261719, -7.372487545013428, -6.4802727699279785, -5.588057994842529, -4.69584321975708, -3.803628444671631, -2.9114139080047607, -2.0191991329193115, -1.1269845962524414, -0.2347698211669922, 0.657444953918457, 1.5496597290039062, 2.4418745040893555, 3.3340892791748047, 4.226304054260254, 5.118518829345703, 6.010733127593994, 6.902947902679443, 7.795162677764893, 8.6873779296875, 9.57959270477295, 10.471807479858398, 11.364022254943848, 12.256237030029297, 13.14845085144043, 14.040666580200195, 14.932880401611328, 15.825095176696777, 16.717309951782227, 17.60952377319336, 18.501739501953125, 19.393953323364258, 20.286169052124023, 21.178382873535156, 22.070598602294922, 22.962812423706055, 23.855026245117188, 24.747241973876953, 25.639455795288086, 26.53167152404785, 27.423885345458984, 28.31610107421875, 29.208314895629883, 30.10053062438965]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 5.0, 9.0, 3.0, 14.0, 18.0, 20.0, 46.0, 53.0, 101.0, 135.0, 209.0, 353.0, 540.0, 776.0, 1241.0, 2091.0, 3279.0, 5350.0, 8902.0, 14572.0, 24577.0, 40552.0, 65332.0, 99648.0, 138200.0, 161441.0, 152456.0, 117861.0, 80800.0, 51069.0, 31281.0, 18624.0, 11216.0, 6768.0, 4115.0, 2500.0, 1596.0, 980.0, 645.0, 408.0, 262.0, 155.0, 127.0, 78.0, 43.0, 32.0, 23.0, 17.0, 14.0, 7.0, 11.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0], "bins": [-34.0625, -33.02197265625, -31.9814453125, -30.94091796875, -29.900390625, -28.85986328125, -27.8193359375, -26.77880859375, -25.73828125, -24.69775390625, -23.6572265625, -22.61669921875, -21.576171875, -20.53564453125, -19.4951171875, -18.45458984375, -17.4140625, -16.37353515625, -15.3330078125, -14.29248046875, -13.251953125, -12.21142578125, -11.1708984375, -10.13037109375, -9.08984375, -8.04931640625, -7.0087890625, -5.96826171875, -4.927734375, -3.88720703125, -2.8466796875, -1.80615234375, -0.765625, 0.27490234375, 1.3154296875, 2.35595703125, 3.396484375, 4.43701171875, 5.4775390625, 6.51806640625, 7.55859375, 8.59912109375, 9.6396484375, 10.68017578125, 11.720703125, 12.76123046875, 13.8017578125, 14.84228515625, 15.8828125, 16.92333984375, 17.9638671875, 19.00439453125, 20.044921875, 21.08544921875, 22.1259765625, 23.16650390625, 24.20703125, 25.24755859375, 26.2880859375, 27.32861328125, 28.369140625, 29.40966796875, 30.4501953125, 31.49072265625, 32.53125]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 7.0, 6.0, 6.0, 8.0, 5.0, 9.0, 10.0, 16.0, 18.0, 20.0, 20.0, 14.0, 26.0, 28.0, 31.0, 39.0, 24.0, 35.0, 35.0, 35.0, 39.0, 42.0, 30.0, 41.0, 43.0, 39.0, 44.0, 37.0, 37.0, 33.0, 24.0, 23.0, 30.0, 30.0, 18.0, 18.0, 13.0, 8.0, 11.0, 10.0, 8.0, 5.0, 11.0, 7.0, 6.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.71875, -21.953125, -21.1875, -20.421875, -19.65625, -18.890625, -18.125, -17.359375, -16.59375, -15.828125, -15.0625, -14.296875, -13.53125, -12.765625, -12.0, -11.234375, -10.46875, -9.703125, -8.9375, -8.171875, -7.40625, -6.640625, -5.875, -5.109375, -4.34375, -3.578125, -2.8125, -2.046875, -1.28125, -0.515625, 0.25, 1.015625, 1.78125, 2.546875, 3.3125, 4.078125, 4.84375, 5.609375, 6.375, 7.140625, 7.90625, 8.671875, 9.4375, 10.203125, 10.96875, 11.734375, 12.5, 13.265625, 14.03125, 14.796875, 15.5625, 16.328125, 17.09375, 17.859375, 18.625, 19.390625, 20.15625, 20.921875, 21.6875, 22.453125, 23.21875, 23.984375, 24.75, 25.515625, 26.28125]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 5.0, 5.0, 4.0, 17.0, 15.0, 43.0, 47.0, 78.0, 110.0, 154.0, 248.0, 369.0, 549.0, 818.0, 1195.0, 1873.0, 2829.0, 4303.0, 6571.0, 10080.0, 15766.0, 24520.0, 38350.0, 59935.0, 88508.0, 121930.0, 146183.0, 145991.0, 121704.0, 88888.0, 59658.0, 38281.0, 24434.0, 15821.0, 10181.0, 6423.0, 4278.0, 2790.0, 1827.0, 1234.0, 826.0, 548.0, 368.0, 265.0, 209.0, 108.0, 90.0, 55.0, 33.0, 13.0, 6.0, 8.0, 9.0, 2.0, 6.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-29.515625, -28.5634765625, -27.611328125, -26.6591796875, -25.70703125, -24.7548828125, -23.802734375, -22.8505859375, -21.8984375, -20.9462890625, -19.994140625, -19.0419921875, -18.08984375, -17.1376953125, -16.185546875, -15.2333984375, -14.28125, -13.3291015625, -12.376953125, -11.4248046875, -10.47265625, -9.5205078125, -8.568359375, -7.6162109375, -6.6640625, -5.7119140625, -4.759765625, -3.8076171875, -2.85546875, -1.9033203125, -0.951171875, 0.0009765625, 0.953125, 1.9052734375, 2.857421875, 3.8095703125, 4.76171875, 5.7138671875, 6.666015625, 7.6181640625, 8.5703125, 9.5224609375, 10.474609375, 11.4267578125, 12.37890625, 13.3310546875, 14.283203125, 15.2353515625, 16.1875, 17.1396484375, 18.091796875, 19.0439453125, 19.99609375, 20.9482421875, 21.900390625, 22.8525390625, 23.8046875, 24.7568359375, 25.708984375, 26.6611328125, 27.61328125, 28.5654296875, 29.517578125, 30.4697265625, 31.421875]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 3.0, 9.0, 6.0, 7.0, 8.0, 16.0, 12.0, 10.0, 15.0, 17.0, 14.0, 25.0, 19.0, 32.0, 30.0, 34.0, 28.0, 36.0, 45.0, 36.0, 38.0, 36.0, 39.0, 41.0, 30.0, 38.0, 40.0, 46.0, 35.0, 32.0, 23.0, 21.0, 24.0, 27.0, 29.0, 18.0, 11.0, 13.0, 8.0, 9.0, 12.0, 11.0, 1.0, 6.0, 2.0, 5.0, 1.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-15.3671875, -14.8751220703125, -14.383056640625, -13.8909912109375, -13.39892578125, -12.9068603515625, -12.414794921875, -11.9227294921875, -11.4306640625, -10.9385986328125, -10.446533203125, -9.9544677734375, -9.46240234375, -8.9703369140625, -8.478271484375, -7.9862060546875, -7.494140625, -7.0020751953125, -6.510009765625, -6.0179443359375, -5.52587890625, -5.0338134765625, -4.541748046875, -4.0496826171875, -3.5576171875, -3.0655517578125, -2.573486328125, -2.0814208984375, -1.58935546875, -1.0972900390625, -0.605224609375, -0.1131591796875, 0.37890625, 0.8709716796875, 1.363037109375, 1.8551025390625, 2.34716796875, 2.8392333984375, 3.331298828125, 3.8233642578125, 4.3154296875, 4.8074951171875, 5.299560546875, 5.7916259765625, 6.28369140625, 6.7757568359375, 7.267822265625, 7.7598876953125, 8.251953125, 8.7440185546875, 9.236083984375, 9.7281494140625, 10.22021484375, 10.7122802734375, 11.204345703125, 11.6964111328125, 12.1884765625, 12.6805419921875, 13.172607421875, 13.6646728515625, 14.15673828125, 14.6488037109375, 15.140869140625, 15.6329345703125, 16.125]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 11.0, 3.0, 2.0, 4.0, 9.0, 18.0, 15.0, 19.0, 34.0, 60.0, 79.0, 110.0, 170.0, 270.0, 462.0, 706.0, 1148.0, 2107.0, 3790.0, 7645.0, 16357.0, 36915.0, 84360.0, 178003.0, 269863.0, 226793.0, 120709.0, 53419.0, 23364.0, 10627.0, 4977.0, 2738.0, 1466.0, 831.0, 484.0, 324.0, 201.0, 162.0, 93.0, 75.0, 40.0, 24.0, 18.0, 16.0, 14.0, 10.0, 3.0, 4.0, 3.0, 1.0, 1.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.9453125, -9.62158203125, -9.2978515625, -8.97412109375, -8.650390625, -8.32666015625, -8.0029296875, -7.67919921875, -7.35546875, -7.03173828125, -6.7080078125, -6.38427734375, -6.060546875, -5.73681640625, -5.4130859375, -5.08935546875, -4.765625, -4.44189453125, -4.1181640625, -3.79443359375, -3.470703125, -3.14697265625, -2.8232421875, -2.49951171875, -2.17578125, -1.85205078125, -1.5283203125, -1.20458984375, -0.880859375, -0.55712890625, -0.2333984375, 0.09033203125, 0.4140625, 0.73779296875, 1.0615234375, 1.38525390625, 1.708984375, 2.03271484375, 2.3564453125, 2.68017578125, 3.00390625, 3.32763671875, 3.6513671875, 3.97509765625, 4.298828125, 4.62255859375, 4.9462890625, 5.27001953125, 5.59375, 5.91748046875, 6.2412109375, 6.56494140625, 6.888671875, 7.21240234375, 7.5361328125, 7.85986328125, 8.18359375, 8.50732421875, 8.8310546875, 9.15478515625, 9.478515625, 9.80224609375, 10.1259765625, 10.44970703125, 10.7734375]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 4.0, 3.0, 6.0, 1.0, 6.0, 12.0, 11.0, 16.0, 12.0, 19.0, 22.0, 29.0, 27.0, 35.0, 42.0, 50.0, 61.0, 52.0, 52.0, 68.0, 72.0, 48.0, 57.0, 48.0, 57.0, 30.0, 27.0, 23.0, 22.0, 17.0, 16.0, 8.0, 13.0, 8.0, 10.0, 6.0, 2.0, 3.0, 2.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0006327629089355469, -0.0006127581000328064, -0.0005927532911300659, -0.0005727484822273254, -0.000552743673324585, -0.0005327388644218445, -0.000512734055519104, -0.0004927292466163635, -0.00047272443771362305, -0.00045271962881088257, -0.0004327148199081421, -0.0004127100110054016, -0.00039270520210266113, -0.00037270039319992065, -0.0003526955842971802, -0.0003326907753944397, -0.0003126859664916992, -0.00029268115758895874, -0.00027267634868621826, -0.0002526715397834778, -0.0002326667308807373, -0.00021266192197799683, -0.00019265711307525635, -0.00017265230417251587, -0.0001526474952697754, -0.0001326426863670349, -0.00011263787746429443, -9.263306856155396e-05, -7.262825965881348e-05, -5.2623450756073e-05, -3.261864185333252e-05, -1.2613832950592041e-05, 7.3909759521484375e-06, 2.7395784854888916e-05, 4.7400593757629395e-05, 6.740540266036987e-05, 8.741021156311035e-05, 0.00010741502046585083, 0.0001274198293685913, 0.0001474246382713318, 0.00016742944717407227, 0.00018743425607681274, 0.00020743906497955322, 0.0002274438738822937, 0.0002474486827850342, 0.00026745349168777466, 0.00028745830059051514, 0.0003074631094932556, 0.0003274679183959961, 0.00034747272729873657, 0.00036747753620147705, 0.00038748234510421753, 0.000407487154006958, 0.0004274919629096985, 0.00044749677181243896, 0.00046750158071517944, 0.0004875063896179199, 0.0005075111985206604, 0.0005275160074234009, 0.0005475208163261414, 0.0005675256252288818, 0.0005875304341316223, 0.0006075352430343628, 0.0006275400519371033, 0.0006475448608398438]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 16.0, 14.0, 22.0, 34.0, 37.0, 45.0, 82.0, 119.0, 186.0, 284.0, 397.0, 664.0, 939.0, 1475.0, 2242.0, 3474.0, 5651.0, 8912.0, 14861.0, 23932.0, 38435.0, 61462.0, 93520.0, 129658.0, 154977.0, 152149.0, 121845.0, 85316.0, 55912.0, 34908.0, 21381.0, 13075.0, 8082.0, 5194.0, 3278.0, 2136.0, 1271.0, 859.0, 549.0, 388.0, 242.0, 168.0, 95.0, 75.0, 73.0, 38.0, 21.0, 31.0, 10.0, 13.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-5.69140625, -5.512939453125, -5.33447265625, -5.156005859375, -4.9775390625, -4.799072265625, -4.62060546875, -4.442138671875, -4.263671875, -4.085205078125, -3.90673828125, -3.728271484375, -3.5498046875, -3.371337890625, -3.19287109375, -3.014404296875, -2.8359375, -2.657470703125, -2.47900390625, -2.300537109375, -2.1220703125, -1.943603515625, -1.76513671875, -1.586669921875, -1.408203125, -1.229736328125, -1.05126953125, -0.872802734375, -0.6943359375, -0.515869140625, -0.33740234375, -0.158935546875, 0.01953125, 0.197998046875, 0.37646484375, 0.554931640625, 0.7333984375, 0.911865234375, 1.09033203125, 1.268798828125, 1.447265625, 1.625732421875, 1.80419921875, 1.982666015625, 2.1611328125, 2.339599609375, 2.51806640625, 2.696533203125, 2.875, 3.053466796875, 3.23193359375, 3.410400390625, 3.5888671875, 3.767333984375, 3.94580078125, 4.124267578125, 4.302734375, 4.481201171875, 4.65966796875, 4.838134765625, 5.0166015625, 5.195068359375, 5.37353515625, 5.552001953125, 5.73046875]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 4.0, 7.0, 9.0, 4.0, 8.0, 11.0, 9.0, 17.0, 20.0, 27.0, 27.0, 31.0, 49.0, 38.0, 47.0, 42.0, 61.0, 54.0, 58.0, 60.0, 50.0, 56.0, 45.0, 45.0, 40.0, 29.0, 32.0, 28.0, 14.0, 23.0, 13.0, 14.0, 6.0, 4.0, 8.0, 3.0, 5.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0], "bins": [-2.884765625, -2.805572509765625, -2.72637939453125, -2.647186279296875, -2.5679931640625, -2.488800048828125, -2.40960693359375, -2.330413818359375, -2.251220703125, -2.172027587890625, -2.09283447265625, -2.013641357421875, -1.9344482421875, -1.855255126953125, -1.77606201171875, -1.696868896484375, -1.61767578125, -1.538482666015625, -1.45928955078125, -1.380096435546875, -1.3009033203125, -1.221710205078125, -1.14251708984375, -1.063323974609375, -0.984130859375, -0.904937744140625, -0.82574462890625, -0.746551513671875, -0.6673583984375, -0.588165283203125, -0.50897216796875, -0.429779052734375, -0.3505859375, -0.271392822265625, -0.19219970703125, -0.113006591796875, -0.0338134765625, 0.045379638671875, 0.12457275390625, 0.203765869140625, 0.282958984375, 0.362152099609375, 0.44134521484375, 0.520538330078125, 0.5997314453125, 0.678924560546875, 0.75811767578125, 0.837310791015625, 0.91650390625, 0.995697021484375, 1.07489013671875, 1.154083251953125, 1.2332763671875, 1.312469482421875, 1.39166259765625, 1.470855712890625, 1.550048828125, 1.629241943359375, 1.70843505859375, 1.787628173828125, 1.8668212890625, 1.946014404296875, 2.02520751953125, 2.104400634765625, 2.18359375]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 7.0, 2.0, 2.0, 4.0, 6.0, 5.0, 8.0, 7.0, 7.0, 19.0, 10.0, 18.0, 10.0, 23.0, 21.0, 23.0, 21.0, 30.0, 35.0, 36.0, 39.0, 51.0, 41.0, 44.0, 50.0, 47.0, 44.0, 47.0, 34.0, 35.0, 38.0, 29.0, 31.0, 36.0, 24.0, 23.0, 14.0, 18.0, 18.0, 12.0, 4.0, 6.0, 5.0, 6.0, 7.0, 3.0, 2.0, 3.0, 4.0, 3.0, 1.0, 0.0, 2.0], "bins": [-26.111114501953125, -25.375850677490234, -24.640588760375977, -23.905324935913086, -23.170061111450195, -22.434797286987305, -21.699535369873047, -20.964271545410156, -20.229007720947266, -19.493743896484375, -18.758481979370117, -18.023218154907227, -17.287954330444336, -16.552690505981445, -15.817428588867188, -15.082164764404297, -14.346901893615723, -13.611639022827148, -12.876375198364258, -12.141112327575684, -11.405848503112793, -10.670585632324219, -9.935321807861328, -9.200058937072754, -8.46479606628418, -7.729532718658447, -6.994269371032715, -6.259006500244141, -5.52374267578125, -4.788479804992676, -4.053216457366943, -3.317953109741211, -2.5826892852783203, -1.847425937652588, -1.112162709236145, -0.37689948081970215, 0.3583638668060303, 1.0936272144317627, 1.828890323638916, 2.5641536712646484, 3.299417018890381, 4.034680366516113, 4.769943714141846, 5.505207061767578, 6.240469932556152, 6.975733757019043, 7.710996627807617, 8.446260452270508, 9.181523323059082, 9.916786193847656, 10.652050018310547, 11.387312889099121, 12.122576713562012, 12.857839584350586, 13.593103408813477, 14.32836627960205, 15.063629150390625, 15.7988920211792, 16.534154891967773, 17.269418716430664, 18.004682540893555, 18.739946365356445, 19.475208282470703, 20.210472106933594, 20.945735931396484]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 3.0, 3.0, 7.0, 5.0, 6.0, 7.0, 11.0, 15.0, 14.0, 14.0, 23.0, 17.0, 32.0, 25.0, 29.0, 35.0, 39.0, 45.0, 43.0, 36.0, 51.0, 28.0, 53.0, 41.0, 41.0, 52.0, 42.0, 38.0, 30.0, 32.0, 31.0, 27.0, 25.0, 17.0, 14.0, 15.0, 11.0, 9.0, 8.0, 9.0, 10.0, 3.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.850770950317383, -26.979263305664062, -26.107755661010742, -25.236248016357422, -24.3647403717041, -23.49323272705078, -22.621723175048828, -21.75021743774414, -20.878707885742188, -20.007200241088867, -19.135692596435547, -18.264184951782227, -17.392677307128906, -16.521169662475586, -15.64966106414795, -14.778153419494629, -13.906646728515625, -13.035139083862305, -12.163631439208984, -11.292123794555664, -10.420616149902344, -9.549108505249023, -8.677599906921387, -7.806092262268066, -6.934584617614746, -6.063076972961426, -5.1915693283081055, -4.320061206817627, -3.4485535621643066, -2.5770459175109863, -1.7055377960205078, -0.8340301513671875, 0.037479400634765625, 0.9089871644973755, 1.7804949283599854, 2.6520028114318848, 3.523510456085205, 4.395018100738525, 5.266526222229004, 6.138033866882324, 7.0095415115356445, 7.881049156188965, 8.752556800842285, 9.624065399169922, 10.495573043823242, 11.367080688476562, 12.238588333129883, 13.110095977783203, 13.981603622436523, 14.853111267089844, 15.724618911743164, 16.596126556396484, 17.467634201049805, 18.339141845703125, 19.210651397705078, 20.082157135009766, 20.95366668701172, 21.82517433166504, 22.69668197631836, 23.56818962097168, 24.439697265625, 25.31120491027832, 26.18271255493164, 27.054222106933594, 27.92572784423828]}, "gradients/decoder.bert.encoder.layer.22.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 9.0, 16.0, 19.0, 29.0, 44.0, 68.0, 85.0, 131.0, 194.0, 303.0, 432.0, 712.0, 1093.0, 1642.0, 2530.0, 4008.0, 6309.0, 10255.0, 16271.0, 26443.0, 43319.0, 72788.0, 122876.0, 209738.0, 362195.0, 586805.0, 770826.0, 724285.0, 501361.0, 298156.0, 173080.0, 101618.0, 60584.0, 36765.0, 22082.0, 13829.0, 8680.0, 5331.0, 3447.0, 2102.0, 1382.0, 860.0, 525.0, 397.0, 228.0, 143.0, 102.0, 80.0, 43.0, 26.0, 17.0, 9.0, 6.0, 7.0, 3.0, 2.0], "bins": [-23.953125, -23.265380859375, -22.57763671875, -21.889892578125, -21.2021484375, -20.514404296875, -19.82666015625, -19.138916015625, -18.451171875, -17.763427734375, -17.07568359375, -16.387939453125, -15.7001953125, -15.012451171875, -14.32470703125, -13.636962890625, -12.94921875, -12.261474609375, -11.57373046875, -10.885986328125, -10.1982421875, -9.510498046875, -8.82275390625, -8.135009765625, -7.447265625, -6.759521484375, -6.07177734375, -5.384033203125, -4.6962890625, -4.008544921875, -3.32080078125, -2.633056640625, -1.9453125, -1.257568359375, -0.56982421875, 0.117919921875, 0.8056640625, 1.493408203125, 2.18115234375, 2.868896484375, 3.556640625, 4.244384765625, 4.93212890625, 5.619873046875, 6.3076171875, 6.995361328125, 7.68310546875, 8.370849609375, 9.05859375, 9.746337890625, 10.43408203125, 11.121826171875, 11.8095703125, 12.497314453125, 13.18505859375, 13.872802734375, 14.560546875, 15.248291015625, 15.93603515625, 16.623779296875, 17.3115234375, 17.999267578125, 18.68701171875, 19.374755859375, 20.0625]}, "gradients/decoder.bert.encoder.layer.22.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 6.0, 10.0, 5.0, 3.0, 5.0, 13.0, 17.0, 10.0, 20.0, 23.0, 14.0, 16.0, 23.0, 37.0, 33.0, 36.0, 42.0, 43.0, 39.0, 45.0, 45.0, 54.0, 33.0, 36.0, 42.0, 44.0, 42.0, 39.0, 36.0, 26.0, 25.0, 21.0, 18.0, 15.0, 21.0, 14.0, 9.0, 9.0, 6.0, 5.0, 9.0, 6.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.640625, -17.05908203125, -16.4775390625, -15.89599609375, -15.314453125, -14.73291015625, -14.1513671875, -13.56982421875, -12.98828125, -12.40673828125, -11.8251953125, -11.24365234375, -10.662109375, -10.08056640625, -9.4990234375, -8.91748046875, -8.3359375, -7.75439453125, -7.1728515625, -6.59130859375, -6.009765625, -5.42822265625, -4.8466796875, -4.26513671875, -3.68359375, -3.10205078125, -2.5205078125, -1.93896484375, -1.357421875, -0.77587890625, -0.1943359375, 0.38720703125, 0.96875, 1.55029296875, 2.1318359375, 2.71337890625, 3.294921875, 3.87646484375, 4.4580078125, 5.03955078125, 5.62109375, 6.20263671875, 6.7841796875, 7.36572265625, 7.947265625, 8.52880859375, 9.1103515625, 9.69189453125, 10.2734375, 10.85498046875, 11.4365234375, 12.01806640625, 12.599609375, 13.18115234375, 13.7626953125, 14.34423828125, 14.92578125, 15.50732421875, 16.0888671875, 16.67041015625, 17.251953125, 17.83349609375, 18.4150390625, 18.99658203125, 19.578125]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 6.0, 10.0, 30.0, 41.0, 54.0, 78.0, 131.0, 198.0, 308.0, 525.0, 879.0, 1374.0, 2292.0, 3840.0, 6427.0, 10387.0, 17633.0, 29903.0, 50559.0, 85602.0, 142121.0, 233281.0, 364447.0, 531082.0, 668355.0, 653671.0, 505968.0, 343979.0, 216611.0, 131586.0, 78539.0, 46323.0, 27460.0, 16112.0, 9634.0, 5861.0, 3509.0, 2093.0, 1276.0, 762.0, 489.0, 325.0, 194.0, 108.0, 76.0, 57.0, 31.0, 26.0, 18.0, 9.0, 6.0, 2.0, 0.0, 4.0, 0.0, 1.0, 2.0], "bins": [-19.34375, -18.73779296875, -18.1318359375, -17.52587890625, -16.919921875, -16.31396484375, -15.7080078125, -15.10205078125, -14.49609375, -13.89013671875, -13.2841796875, -12.67822265625, -12.072265625, -11.46630859375, -10.8603515625, -10.25439453125, -9.6484375, -9.04248046875, -8.4365234375, -7.83056640625, -7.224609375, -6.61865234375, -6.0126953125, -5.40673828125, -4.80078125, -4.19482421875, -3.5888671875, -2.98291015625, -2.376953125, -1.77099609375, -1.1650390625, -0.55908203125, 0.046875, 0.65283203125, 1.2587890625, 1.86474609375, 2.470703125, 3.07666015625, 3.6826171875, 4.28857421875, 4.89453125, 5.50048828125, 6.1064453125, 6.71240234375, 7.318359375, 7.92431640625, 8.5302734375, 9.13623046875, 9.7421875, 10.34814453125, 10.9541015625, 11.56005859375, 12.166015625, 12.77197265625, 13.3779296875, 13.98388671875, 14.58984375, 15.19580078125, 15.8017578125, 16.40771484375, 17.013671875, 17.61962890625, 18.2255859375, 18.83154296875, 19.4375]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 9.0, 7.0, 10.0, 7.0, 7.0, 18.0, 13.0, 26.0, 33.0, 29.0, 41.0, 54.0, 53.0, 84.0, 86.0, 118.0, 114.0, 134.0, 155.0, 193.0, 223.0, 222.0, 231.0, 263.0, 276.0, 232.0, 240.0, 197.0, 191.0, 142.0, 124.0, 108.0, 84.0, 92.0, 56.0, 48.0, 45.0, 36.0, 15.0, 20.0, 9.0, 12.0, 10.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0], "bins": [-10.7109375, -10.43408203125, -10.1572265625, -9.88037109375, -9.603515625, -9.32666015625, -9.0498046875, -8.77294921875, -8.49609375, -8.21923828125, -7.9423828125, -7.66552734375, -7.388671875, -7.11181640625, -6.8349609375, -6.55810546875, -6.28125, -6.00439453125, -5.7275390625, -5.45068359375, -5.173828125, -4.89697265625, -4.6201171875, -4.34326171875, -4.06640625, -3.78955078125, -3.5126953125, -3.23583984375, -2.958984375, -2.68212890625, -2.4052734375, -2.12841796875, -1.8515625, -1.57470703125, -1.2978515625, -1.02099609375, -0.744140625, -0.46728515625, -0.1904296875, 0.08642578125, 0.36328125, 0.64013671875, 0.9169921875, 1.19384765625, 1.470703125, 1.74755859375, 2.0244140625, 2.30126953125, 2.578125, 2.85498046875, 3.1318359375, 3.40869140625, 3.685546875, 3.96240234375, 4.2392578125, 4.51611328125, 4.79296875, 5.06982421875, 5.3466796875, 5.62353515625, 5.900390625, 6.17724609375, 6.4541015625, 6.73095703125, 7.0078125]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 4.0, 6.0, 7.0, 8.0, 1.0, 16.0, 16.0, 17.0, 20.0, 20.0, 16.0, 20.0, 35.0, 29.0, 33.0, 52.0, 48.0, 38.0, 51.0, 54.0, 49.0, 51.0, 38.0, 40.0, 52.0, 34.0, 36.0, 33.0, 35.0, 21.0, 13.0, 14.0, 26.0, 20.0, 11.0, 13.0, 8.0, 6.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-20.13215446472168, -19.525615692138672, -18.919078826904297, -18.31254005432129, -17.706003189086914, -17.099464416503906, -16.49292755126953, -15.886388778686523, -15.279850006103516, -14.673312187194824, -14.066774368286133, -13.460235595703125, -12.853697776794434, -12.247159957885742, -11.64062213897705, -11.03408432006836, -10.427546501159668, -9.821008682250977, -9.214470863342285, -8.607933044433594, -8.001394271850586, -7.3948564529418945, -6.788318634033203, -6.1817803382873535, -5.575242519378662, -4.968704700469971, -4.362166404724121, -3.7556285858154297, -3.149090528488159, -2.5425524711608887, -1.9360146522521973, -1.3294763565063477, -0.7229385375976562, -0.11640053987503052, 0.4901374578475952, 1.0966753959655762, 1.7032134532928467, 2.309751510620117, 2.9162893295288086, 3.522827625274658, 4.12936544418335, 4.735903263092041, 5.342441558837891, 5.948979377746582, 6.555517196655273, 7.162055492401123, 7.7685933113098145, 8.375131607055664, 8.981669425964355, 9.588207244873047, 10.194745063781738, 10.80128288269043, 11.407821655273438, 12.014359474182129, 12.62089729309082, 13.227436065673828, 13.833972930908203, 14.440510749816895, 15.047048568725586, 15.653587341308594, 16.26012420654297, 16.866662979125977, 17.473201751708984, 18.07973861694336, 18.686277389526367]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 0.0, 3.0, 5.0, 2.0, 4.0, 5.0, 7.0, 12.0, 9.0, 15.0, 24.0, 17.0, 23.0, 35.0, 37.0, 30.0, 24.0, 40.0, 34.0, 33.0, 38.0, 46.0, 38.0, 56.0, 41.0, 34.0, 43.0, 49.0, 37.0, 35.0, 32.0, 30.0, 30.0, 29.0, 14.0, 17.0, 13.0, 16.0, 12.0, 9.0, 8.0, 7.0, 8.0, 2.0, 4.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-23.753602981567383, -23.060516357421875, -22.367431640625, -21.674345016479492, -20.981260299682617, -20.28817367553711, -19.595088958740234, -18.902002334594727, -18.20891571044922, -17.51582908630371, -16.822744369506836, -16.129657745361328, -15.436572074890137, -14.743486404418945, -14.050400733947754, -13.357315063476562, -12.664229393005371, -11.97114372253418, -11.278058052062988, -10.584972381591797, -9.891885757446289, -9.198800086975098, -8.505714416503906, -7.812628269195557, -7.119542598724365, -6.426456928253174, -5.733370780944824, -5.040285110473633, -4.347199440002441, -3.654113292694092, -2.9610276222229004, -2.267941474914551, -1.5748558044433594, -0.8817699551582336, -0.1886841058731079, 0.504401683807373, 1.1974875926971436, 1.890573501586914, 2.5836591720581055, 3.276745319366455, 3.9698309898376465, 4.662916660308838, 5.3560028076171875, 6.049088478088379, 6.74217414855957, 7.43526029586792, 8.128345489501953, 8.821432113647461, 9.514517784118652, 10.207603454589844, 10.900689125061035, 11.593774795532227, 12.286861419677734, 12.979947090148926, 13.673032760620117, 14.366119384765625, 15.0592041015625, 15.752289772033691, 16.445375442504883, 17.13846206665039, 17.831546783447266, 18.524633407592773, 19.21772003173828, 19.910804748535156, 20.603891372680664]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.weight": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 2.0, 6.0, 5.0, 6.0, 13.0, 8.0, 17.0, 19.0, 35.0, 39.0, 44.0, 65.0, 90.0, 110.0, 146.0, 185.0, 247.0, 344.0, 508.0, 656.0, 882.0, 1335.0, 2201.0, 4480.0, 11271.0, 36920.0, 130208.0, 402761.0, 318263.0, 92213.0, 26915.0, 8782.0, 3535.0, 1865.0, 1211.0, 840.0, 579.0, 446.0, 326.0, 235.0, 195.0, 142.0, 106.0, 73.0, 68.0, 39.0, 30.0, 25.0, 20.0, 14.0, 9.0, 8.0, 7.0, 4.0, 3.0, 7.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-18.515625, -17.915771484375, -17.31591796875, -16.716064453125, -16.1162109375, -15.516357421875, -14.91650390625, -14.316650390625, -13.716796875, -13.116943359375, -12.51708984375, -11.917236328125, -11.3173828125, -10.717529296875, -10.11767578125, -9.517822265625, -8.91796875, -8.318115234375, -7.71826171875, -7.118408203125, -6.5185546875, -5.918701171875, -5.31884765625, -4.718994140625, -4.119140625, -3.519287109375, -2.91943359375, -2.319580078125, -1.7197265625, -1.119873046875, -0.52001953125, 0.079833984375, 0.6796875, 1.279541015625, 1.87939453125, 2.479248046875, 3.0791015625, 3.678955078125, 4.27880859375, 4.878662109375, 5.478515625, 6.078369140625, 6.67822265625, 7.278076171875, 7.8779296875, 8.477783203125, 9.07763671875, 9.677490234375, 10.27734375, 10.877197265625, 11.47705078125, 12.076904296875, 12.6767578125, 13.276611328125, 13.87646484375, 14.476318359375, 15.076171875, 15.676025390625, 16.27587890625, 16.875732421875, 17.4755859375, 18.075439453125, 18.67529296875, 19.275146484375, 19.875]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 2.0, 2.0, 3.0, 6.0, 8.0, 7.0, 16.0, 13.0, 16.0, 18.0, 19.0, 21.0, 41.0, 27.0, 30.0, 37.0, 47.0, 43.0, 36.0, 35.0, 42.0, 49.0, 51.0, 28.0, 46.0, 44.0, 39.0, 38.0, 40.0, 44.0, 22.0, 17.0, 22.0, 14.0, 15.0, 11.0, 13.0, 11.0, 5.0, 11.0, 4.0, 3.0, 5.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-24.921875, -24.22021484375, -23.5185546875, -22.81689453125, -22.115234375, -21.41357421875, -20.7119140625, -20.01025390625, -19.30859375, -18.60693359375, -17.9052734375, -17.20361328125, -16.501953125, -15.80029296875, -15.0986328125, -14.39697265625, -13.6953125, -12.99365234375, -12.2919921875, -11.59033203125, -10.888671875, -10.18701171875, -9.4853515625, -8.78369140625, -8.08203125, -7.38037109375, -6.6787109375, -5.97705078125, -5.275390625, -4.57373046875, -3.8720703125, -3.17041015625, -2.46875, -1.76708984375, -1.0654296875, -0.36376953125, 0.337890625, 1.03955078125, 1.7412109375, 2.44287109375, 3.14453125, 3.84619140625, 4.5478515625, 5.24951171875, 5.951171875, 6.65283203125, 7.3544921875, 8.05615234375, 8.7578125, 9.45947265625, 10.1611328125, 10.86279296875, 11.564453125, 12.26611328125, 12.9677734375, 13.66943359375, 14.37109375, 15.07275390625, 15.7744140625, 16.47607421875, 17.177734375, 17.87939453125, 18.5810546875, 19.28271484375, 19.984375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 4.0, 5.0, 8.0, 4.0, 6.0, 13.0, 15.0, 15.0, 28.0, 36.0, 40.0, 60.0, 83.0, 135.0, 214.0, 293.0, 446.0, 842.0, 1781.0, 4771.0, 14581.0, 51163.0, 194700.0, 479267.0, 217087.0, 57152.0, 16390.0, 5084.0, 1905.0, 972.0, 469.0, 288.0, 213.0, 140.0, 95.0, 60.0, 37.0, 36.0, 29.0, 27.0, 24.0, 13.0, 5.0, 9.0, 5.0, 3.0, 2.0, 1.0, 3.0, 5.0, 0.0, 1.0, 1.0], "bins": [-13.0546875, -12.6767578125, -12.298828125, -11.9208984375, -11.54296875, -11.1650390625, -10.787109375, -10.4091796875, -10.03125, -9.6533203125, -9.275390625, -8.8974609375, -8.51953125, -8.1416015625, -7.763671875, -7.3857421875, -7.0078125, -6.6298828125, -6.251953125, -5.8740234375, -5.49609375, -5.1181640625, -4.740234375, -4.3623046875, -3.984375, -3.6064453125, -3.228515625, -2.8505859375, -2.47265625, -2.0947265625, -1.716796875, -1.3388671875, -0.9609375, -0.5830078125, -0.205078125, 0.1728515625, 0.55078125, 0.9287109375, 1.306640625, 1.6845703125, 2.0625, 2.4404296875, 2.818359375, 3.1962890625, 3.57421875, 3.9521484375, 4.330078125, 4.7080078125, 5.0859375, 5.4638671875, 5.841796875, 6.2197265625, 6.59765625, 6.9755859375, 7.353515625, 7.7314453125, 8.109375, 8.4873046875, 8.865234375, 9.2431640625, 9.62109375, 9.9990234375, 10.376953125, 10.7548828125, 11.1328125]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 4.0, 5.0, 9.0, 6.0, 9.0, 12.0, 14.0, 18.0, 20.0, 25.0, 24.0, 26.0, 34.0, 28.0, 45.0, 46.0, 45.0, 46.0, 33.0, 49.0, 40.0, 42.0, 53.0, 42.0, 46.0, 36.0, 42.0, 29.0, 28.0, 24.0, 22.0, 22.0, 14.0, 12.0, 12.0, 12.0, 6.0, 4.0, 7.0, 3.0, 5.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.4375, -13.948486328125, -13.45947265625, -12.970458984375, -12.4814453125, -11.992431640625, -11.50341796875, -11.014404296875, -10.525390625, -10.036376953125, -9.54736328125, -9.058349609375, -8.5693359375, -8.080322265625, -7.59130859375, -7.102294921875, -6.61328125, -6.124267578125, -5.63525390625, -5.146240234375, -4.6572265625, -4.168212890625, -3.67919921875, -3.190185546875, -2.701171875, -2.212158203125, -1.72314453125, -1.234130859375, -0.7451171875, -0.256103515625, 0.23291015625, 0.721923828125, 1.2109375, 1.699951171875, 2.18896484375, 2.677978515625, 3.1669921875, 3.656005859375, 4.14501953125, 4.634033203125, 5.123046875, 5.612060546875, 6.10107421875, 6.590087890625, 7.0791015625, 7.568115234375, 8.05712890625, 8.546142578125, 9.03515625, 9.524169921875, 10.01318359375, 10.502197265625, 10.9912109375, 11.480224609375, 11.96923828125, 12.458251953125, 12.947265625, 13.436279296875, 13.92529296875, 14.414306640625, 14.9033203125, 15.392333984375, 15.88134765625, 16.370361328125, 16.859375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 5.0, 3.0, 8.0, 12.0, 5.0, 27.0, 13.0, 42.0, 45.0, 58.0, 88.0, 139.0, 203.0, 370.0, 528.0, 907.0, 1493.0, 2616.0, 4876.0, 9259.0, 18208.0, 39220.0, 90723.0, 229883.0, 365744.0, 159472.0, 65213.0, 29281.0, 13990.0, 7132.0, 3609.0, 2143.0, 1218.0, 717.0, 454.0, 266.0, 182.0, 121.0, 99.0, 56.0, 45.0, 25.0, 25.0, 12.0, 15.0, 2.0, 9.0, 6.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.587890625, -1.5387420654296875, -1.489593505859375, -1.4404449462890625, -1.39129638671875, -1.3421478271484375, -1.292999267578125, -1.2438507080078125, -1.1947021484375, -1.1455535888671875, -1.096405029296875, -1.0472564697265625, -0.99810791015625, -0.9489593505859375, -0.899810791015625, -0.8506622314453125, -0.801513671875, -0.7523651123046875, -0.703216552734375, -0.6540679931640625, -0.60491943359375, -0.5557708740234375, -0.506622314453125, -0.4574737548828125, -0.4083251953125, -0.3591766357421875, -0.310028076171875, -0.2608795166015625, -0.21173095703125, -0.1625823974609375, -0.113433837890625, -0.0642852783203125, -0.01513671875, 0.0340118408203125, 0.083160400390625, 0.1323089599609375, 0.18145751953125, 0.2306060791015625, 0.279754638671875, 0.3289031982421875, 0.3780517578125, 0.4272003173828125, 0.476348876953125, 0.5254974365234375, 0.57464599609375, 0.6237945556640625, 0.672943115234375, 0.7220916748046875, 0.771240234375, 0.8203887939453125, 0.869537353515625, 0.9186859130859375, 0.96783447265625, 1.0169830322265625, 1.066131591796875, 1.1152801513671875, 1.1644287109375, 1.2135772705078125, 1.262725830078125, 1.3118743896484375, 1.36102294921875, 1.4101715087890625, 1.459320068359375, 1.5084686279296875, 1.5576171875]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 0.0, 4.0, 3.0, 1.0, 0.0, 2.0, 2.0, 7.0, 7.0, 5.0, 7.0, 7.0, 5.0, 8.0, 11.0, 17.0, 17.0, 33.0, 53.0, 69.0, 112.0, 151.0, 137.0, 101.0, 75.0, 50.0, 27.0, 16.0, 14.0, 9.0, 10.0, 6.0, 7.0, 7.0, 4.0, 3.0, 6.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0003731250762939453, -0.0003617480397224426, -0.00035037100315093994, -0.00033899396657943726, -0.00032761693000793457, -0.0003162398934364319, -0.0003048628568649292, -0.0002934858202934265, -0.00028210878372192383, -0.00027073174715042114, -0.00025935471057891846, -0.00024797767400741577, -0.00023660063743591309, -0.0002252236008644104, -0.00021384656429290771, -0.00020246952772140503, -0.00019109249114990234, -0.00017971545457839966, -0.00016833841800689697, -0.0001569613814353943, -0.0001455843448638916, -0.00013420730829238892, -0.00012283027172088623, -0.00011145323514938354, -0.00010007619857788086, -8.869916200637817e-05, -7.732212543487549e-05, -6.59450888633728e-05, -5.456805229187012e-05, -4.319101572036743e-05, -3.1813979148864746e-05, -2.043694257736206e-05, -9.059906005859375e-06, 2.3171305656433105e-06, 1.3694167137145996e-05, 2.507120370864868e-05, 3.644824028015137e-05, 4.782527685165405e-05, 5.920231342315674e-05, 7.057934999465942e-05, 8.195638656616211e-05, 9.33334231376648e-05, 0.00010471045970916748, 0.00011608749628067017, 0.00012746453285217285, 0.00013884156942367554, 0.00015021860599517822, 0.0001615956425666809, 0.0001729726791381836, 0.00018434971570968628, 0.00019572675228118896, 0.00020710378885269165, 0.00021848082542419434, 0.00022985786199569702, 0.0002412348985671997, 0.0002526119351387024, 0.0002639889717102051, 0.00027536600828170776, 0.00028674304485321045, 0.00029812008142471313, 0.0003094971179962158, 0.0003208741545677185, 0.0003322511911392212, 0.0003436282277107239, 0.00035500526428222656]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 5.0, 6.0, 11.0, 23.0, 23.0, 36.0, 52.0, 83.0, 115.0, 193.0, 266.0, 429.0, 649.0, 912.0, 1353.0, 2176.0, 3073.0, 4903.0, 8134.0, 14300.0, 25834.0, 51517.0, 117330.0, 308363.0, 289250.0, 110671.0, 48700.0, 24651.0, 13683.0, 7949.0, 4860.0, 3006.0, 1985.0, 1282.0, 886.0, 621.0, 427.0, 265.0, 176.0, 134.0, 79.0, 47.0, 33.0, 21.0, 16.0, 9.0, 5.0, 8.0, 5.0, 3.0, 4.0, 1.0, 1.0, 0.0, 3.0], "bins": [-2.501953125, -2.426055908203125, -2.35015869140625, -2.274261474609375, -2.1983642578125, -2.122467041015625, -2.04656982421875, -1.970672607421875, -1.894775390625, -1.818878173828125, -1.74298095703125, -1.667083740234375, -1.5911865234375, -1.515289306640625, -1.43939208984375, -1.363494873046875, -1.28759765625, -1.211700439453125, -1.13580322265625, -1.059906005859375, -0.9840087890625, -0.908111572265625, -0.83221435546875, -0.756317138671875, -0.680419921875, -0.604522705078125, -0.52862548828125, -0.452728271484375, -0.3768310546875, -0.300933837890625, -0.22503662109375, -0.149139404296875, -0.0732421875, 0.002655029296875, 0.07855224609375, 0.154449462890625, 0.2303466796875, 0.306243896484375, 0.38214111328125, 0.458038330078125, 0.533935546875, 0.609832763671875, 0.68572998046875, 0.761627197265625, 0.8375244140625, 0.913421630859375, 0.98931884765625, 1.065216064453125, 1.14111328125, 1.217010498046875, 1.29290771484375, 1.368804931640625, 1.4447021484375, 1.520599365234375, 1.59649658203125, 1.672393798828125, 1.748291015625, 1.824188232421875, 1.90008544921875, 1.975982666015625, 2.0518798828125, 2.127777099609375, 2.20367431640625, 2.279571533203125, 2.35546875]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 6.0, 2.0, 9.0, 5.0, 10.0, 12.0, 18.0, 19.0, 11.0, 25.0, 24.0, 39.0, 59.0, 62.0, 87.0, 115.0, 120.0, 79.0, 61.0, 48.0, 34.0, 29.0, 28.0, 16.0, 14.0, 15.0, 8.0, 13.0, 8.0, 8.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6533203125, -0.6334381103515625, -0.613555908203125, -0.5936737060546875, -0.57379150390625, -0.5539093017578125, -0.534027099609375, -0.5141448974609375, -0.4942626953125, -0.4743804931640625, -0.454498291015625, -0.4346160888671875, -0.41473388671875, -0.3948516845703125, -0.374969482421875, -0.3550872802734375, -0.335205078125, -0.3153228759765625, -0.295440673828125, -0.2755584716796875, -0.25567626953125, -0.2357940673828125, -0.215911865234375, -0.1960296630859375, -0.1761474609375, -0.1562652587890625, -0.136383056640625, -0.1165008544921875, -0.09661865234375, -0.0767364501953125, -0.056854248046875, -0.0369720458984375, -0.01708984375, 0.0027923583984375, 0.022674560546875, 0.0425567626953125, 0.06243896484375, 0.0823211669921875, 0.102203369140625, 0.1220855712890625, 0.1419677734375, 0.1618499755859375, 0.181732177734375, 0.2016143798828125, 0.22149658203125, 0.2413787841796875, 0.261260986328125, 0.2811431884765625, 0.301025390625, 0.3209075927734375, 0.340789794921875, 0.3606719970703125, 0.38055419921875, 0.4004364013671875, 0.420318603515625, 0.4402008056640625, 0.4600830078125, 0.4799652099609375, 0.499847412109375, 0.5197296142578125, 0.53961181640625, 0.5594940185546875, 0.579376220703125, 0.5992584228515625, 0.619140625]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 1.0, 4.0, 5.0, 6.0, 7.0, 6.0, 10.0, 8.0, 29.0, 18.0, 19.0, 21.0, 22.0, 35.0, 34.0, 44.0, 44.0, 48.0, 51.0, 60.0, 48.0, 59.0, 49.0, 52.0, 49.0, 43.0, 32.0, 35.0, 28.0, 23.0, 16.0, 22.0, 19.0, 15.0, 15.0, 8.0, 8.0, 2.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.031953811645508, -20.401432037353516, -19.770912170410156, -19.140390396118164, -18.509868621826172, -17.879348754882812, -17.24882698059082, -16.618305206298828, -15.987785339355469, -15.357264518737793, -14.7267427444458, -14.096221923828125, -13.46570110321045, -12.835180282592773, -12.204658508300781, -11.574137687683105, -10.943615913391113, -10.313095092773438, -9.682573318481445, -9.05205249786377, -8.421531677246094, -7.79101037979126, -7.160489082336426, -6.52996826171875, -5.899446964263916, -5.268925666809082, -4.638404846191406, -4.007883548736572, -3.3773624897003174, -2.7468414306640625, -2.1163201332092285, -1.4857993125915527, -0.8552780151367188, -0.2247568964958191, 0.40576422214508057, 1.036285400390625, 1.6668064594268799, 2.2973275184631348, 2.9278488159179688, 3.5583696365356445, 4.1888909339904785, 4.8194122314453125, 5.449933052062988, 6.080454349517822, 6.710975646972656, 7.341496467590332, 7.972017765045166, 8.6025390625, 9.233059883117676, 9.863580703735352, 10.494102478027344, 11.12462329864502, 11.755144119262695, 12.385665893554688, 13.016186714172363, 13.646707534790039, 14.277229309082031, 14.907750129699707, 15.5382719039917, 16.168792724609375, 16.799314498901367, 17.429834365844727, 18.06035614013672, 18.690876007080078, 19.32139778137207]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 0.0, 5.0, 3.0, 3.0, 3.0, 6.0, 8.0, 10.0, 11.0, 14.0, 29.0, 13.0, 27.0, 32.0, 35.0, 32.0, 29.0, 36.0, 37.0, 30.0, 40.0, 41.0, 48.0, 48.0, 38.0, 40.0, 47.0, 47.0, 33.0, 37.0, 33.0, 25.0, 30.0, 29.0, 14.0, 19.0, 12.0, 15.0, 11.0, 9.0, 8.0, 8.0, 5.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-22.777612686157227, -22.109800338745117, -21.441987991333008, -20.774173736572266, -20.106361389160156, -19.438549041748047, -18.770736694335938, -18.102924346923828, -17.43511199951172, -16.76729965209961, -16.0994873046875, -15.431674003601074, -14.763860702514648, -14.096048355102539, -13.42823600769043, -12.76042366027832, -12.092609405517578, -11.424797058105469, -10.756983757019043, -10.089171409606934, -9.421358108520508, -8.753545761108398, -8.085733413696289, -7.4179205894470215, -6.750107765197754, -6.082294940948486, -5.414482116699219, -4.746669769287109, -4.078856945037842, -3.411044120788574, -2.743231773376465, -2.0754189491271973, -1.4076080322265625, -0.7397953271865845, -0.07198262214660645, 0.595829963684082, 1.2636427879333496, 1.9314556121826172, 2.5992679595947266, 3.267080783843994, 3.9348936080932617, 4.602706432342529, 5.270519256591797, 5.938331604003906, 6.606144428253174, 7.273957252502441, 7.941769599914551, 8.609582901000977, 9.277395248413086, 9.945207595825195, 10.613020896911621, 11.28083324432373, 11.948646545410156, 12.616458892822266, 13.284271240234375, 13.952083587646484, 14.61989688873291, 15.28770923614502, 15.955522537231445, 16.623334884643555, 17.291147232055664, 17.958961486816406, 18.626773834228516, 19.294586181640625, 19.962398529052734]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 10.0, 14.0, 7.0, 27.0, 33.0, 49.0, 87.0, 96.0, 187.0, 325.0, 462.0, 733.0, 1146.0, 1836.0, 3146.0, 4815.0, 8065.0, 12798.0, 20948.0, 33083.0, 51346.0, 75246.0, 104146.0, 130155.0, 140793.0, 130762.0, 106978.0, 77894.0, 52798.0, 33878.0, 21691.0, 13189.0, 8285.0, 5128.0, 3197.0, 1965.0, 1188.0, 709.0, 493.0, 307.0, 178.0, 119.0, 86.0, 47.0, 49.0, 29.0, 16.0, 3.0, 10.0, 3.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-19.734375, -19.108642578125, -18.48291015625, -17.857177734375, -17.2314453125, -16.605712890625, -15.97998046875, -15.354248046875, -14.728515625, -14.102783203125, -13.47705078125, -12.851318359375, -12.2255859375, -11.599853515625, -10.97412109375, -10.348388671875, -9.72265625, -9.096923828125, -8.47119140625, -7.845458984375, -7.2197265625, -6.593994140625, -5.96826171875, -5.342529296875, -4.716796875, -4.091064453125, -3.46533203125, -2.839599609375, -2.2138671875, -1.588134765625, -0.96240234375, -0.336669921875, 0.2890625, 0.914794921875, 1.54052734375, 2.166259765625, 2.7919921875, 3.417724609375, 4.04345703125, 4.669189453125, 5.294921875, 5.920654296875, 6.54638671875, 7.172119140625, 7.7978515625, 8.423583984375, 9.04931640625, 9.675048828125, 10.30078125, 10.926513671875, 11.55224609375, 12.177978515625, 12.8037109375, 13.429443359375, 14.05517578125, 14.680908203125, 15.306640625, 15.932373046875, 16.55810546875, 17.183837890625, 17.8095703125, 18.435302734375, 19.06103515625, 19.686767578125, 20.3125]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 5.0, 5.0, 4.0, 3.0, 9.0, 15.0, 10.0, 16.0, 20.0, 21.0, 29.0, 34.0, 41.0, 33.0, 29.0, 33.0, 34.0, 44.0, 39.0, 40.0, 43.0, 48.0, 47.0, 46.0, 43.0, 37.0, 36.0, 30.0, 39.0, 22.0, 28.0, 16.0, 24.0, 15.0, 18.0, 11.0, 7.0, 6.0, 7.0, 7.0, 5.0, 4.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.9375, -21.30517578125, -20.6728515625, -20.04052734375, -19.408203125, -18.77587890625, -18.1435546875, -17.51123046875, -16.87890625, -16.24658203125, -15.6142578125, -14.98193359375, -14.349609375, -13.71728515625, -13.0849609375, -12.45263671875, -11.8203125, -11.18798828125, -10.5556640625, -9.92333984375, -9.291015625, -8.65869140625, -8.0263671875, -7.39404296875, -6.76171875, -6.12939453125, -5.4970703125, -4.86474609375, -4.232421875, -3.60009765625, -2.9677734375, -2.33544921875, -1.703125, -1.07080078125, -0.4384765625, 0.19384765625, 0.826171875, 1.45849609375, 2.0908203125, 2.72314453125, 3.35546875, 3.98779296875, 4.6201171875, 5.25244140625, 5.884765625, 6.51708984375, 7.1494140625, 7.78173828125, 8.4140625, 9.04638671875, 9.6787109375, 10.31103515625, 10.943359375, 11.57568359375, 12.2080078125, 12.84033203125, 13.47265625, 14.10498046875, 14.7373046875, 15.36962890625, 16.001953125, 16.63427734375, 17.2666015625, 17.89892578125, 18.53125]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 3.0, 4.0, 9.0, 9.0, 18.0, 26.0, 31.0, 57.0, 75.0, 141.0, 196.0, 286.0, 447.0, 695.0, 1093.0, 1596.0, 2640.0, 4321.0, 7099.0, 11200.0, 18030.0, 28504.0, 45422.0, 68904.0, 98973.0, 127713.0, 144514.0, 137690.0, 113320.0, 83289.0, 55679.0, 36159.0, 22859.0, 14053.0, 8825.0, 5388.0, 3458.0, 2069.0, 1348.0, 846.0, 552.0, 354.0, 233.0, 144.0, 103.0, 64.0, 46.0, 26.0, 13.0, 15.0, 14.0, 3.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-19.703125, -19.062255859375, -18.42138671875, -17.780517578125, -17.1396484375, -16.498779296875, -15.85791015625, -15.217041015625, -14.576171875, -13.935302734375, -13.29443359375, -12.653564453125, -12.0126953125, -11.371826171875, -10.73095703125, -10.090087890625, -9.44921875, -8.808349609375, -8.16748046875, -7.526611328125, -6.8857421875, -6.244873046875, -5.60400390625, -4.963134765625, -4.322265625, -3.681396484375, -3.04052734375, -2.399658203125, -1.7587890625, -1.117919921875, -0.47705078125, 0.163818359375, 0.8046875, 1.445556640625, 2.08642578125, 2.727294921875, 3.3681640625, 4.009033203125, 4.64990234375, 5.290771484375, 5.931640625, 6.572509765625, 7.21337890625, 7.854248046875, 8.4951171875, 9.135986328125, 9.77685546875, 10.417724609375, 11.05859375, 11.699462890625, 12.34033203125, 12.981201171875, 13.6220703125, 14.262939453125, 14.90380859375, 15.544677734375, 16.185546875, 16.826416015625, 17.46728515625, 18.108154296875, 18.7490234375, 19.389892578125, 20.03076171875, 20.671630859375, 21.3125]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 5.0, 1.0, 0.0, 5.0, 5.0, 7.0, 16.0, 16.0, 9.0, 15.0, 20.0, 21.0, 23.0, 32.0, 32.0, 38.0, 36.0, 37.0, 45.0, 40.0, 43.0, 55.0, 31.0, 55.0, 45.0, 43.0, 32.0, 36.0, 34.0, 33.0, 38.0, 25.0, 22.0, 20.0, 14.0, 13.0, 12.0, 11.0, 16.0, 8.0, 9.0, 9.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-14.0078125, -13.5943603515625, -13.180908203125, -12.7674560546875, -12.35400390625, -11.9405517578125, -11.527099609375, -11.1136474609375, -10.7001953125, -10.2867431640625, -9.873291015625, -9.4598388671875, -9.04638671875, -8.6329345703125, -8.219482421875, -7.8060302734375, -7.392578125, -6.9791259765625, -6.565673828125, -6.1522216796875, -5.73876953125, -5.3253173828125, -4.911865234375, -4.4984130859375, -4.0849609375, -3.6715087890625, -3.258056640625, -2.8446044921875, -2.43115234375, -2.0177001953125, -1.604248046875, -1.1907958984375, -0.77734375, -0.3638916015625, 0.049560546875, 0.4630126953125, 0.87646484375, 1.2899169921875, 1.703369140625, 2.1168212890625, 2.5302734375, 2.9437255859375, 3.357177734375, 3.7706298828125, 4.18408203125, 4.5975341796875, 5.010986328125, 5.4244384765625, 5.837890625, 6.2513427734375, 6.664794921875, 7.0782470703125, 7.49169921875, 7.9051513671875, 8.318603515625, 8.7320556640625, 9.1455078125, 9.5589599609375, 9.972412109375, 10.3858642578125, 10.79931640625, 11.2127685546875, 11.626220703125, 12.0396728515625, 12.453125]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 5.0, 2.0, 7.0, 13.0, 10.0, 23.0, 48.0, 54.0, 72.0, 119.0, 160.0, 275.0, 447.0, 750.0, 1256.0, 1999.0, 3342.0, 5463.0, 9286.0, 15929.0, 27114.0, 45764.0, 75108.0, 115328.0, 157881.0, 173558.0, 147568.0, 103591.0, 65929.0, 40057.0, 23469.0, 13820.0, 8039.0, 4787.0, 2766.0, 1700.0, 1063.0, 626.0, 421.0, 252.0, 165.0, 102.0, 74.0, 45.0, 27.0, 14.0, 14.0, 8.0, 7.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.265625, -5.0863037109375, -4.906982421875, -4.7276611328125, -4.54833984375, -4.3690185546875, -4.189697265625, -4.0103759765625, -3.8310546875, -3.6517333984375, -3.472412109375, -3.2930908203125, -3.11376953125, -2.9344482421875, -2.755126953125, -2.5758056640625, -2.396484375, -2.2171630859375, -2.037841796875, -1.8585205078125, -1.67919921875, -1.4998779296875, -1.320556640625, -1.1412353515625, -0.9619140625, -0.7825927734375, -0.603271484375, -0.4239501953125, -0.24462890625, -0.0653076171875, 0.114013671875, 0.2933349609375, 0.47265625, 0.6519775390625, 0.831298828125, 1.0106201171875, 1.18994140625, 1.3692626953125, 1.548583984375, 1.7279052734375, 1.9072265625, 2.0865478515625, 2.265869140625, 2.4451904296875, 2.62451171875, 2.8038330078125, 2.983154296875, 3.1624755859375, 3.341796875, 3.5211181640625, 3.700439453125, 3.8797607421875, 4.05908203125, 4.2384033203125, 4.417724609375, 4.5970458984375, 4.7763671875, 4.9556884765625, 5.135009765625, 5.3143310546875, 5.49365234375, 5.6729736328125, 5.852294921875, 6.0316162109375, 6.2109375]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 3.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 4.0, 7.0, 11.0, 10.0, 11.0, 5.0, 28.0, 24.0, 35.0, 35.0, 37.0, 37.0, 66.0, 58.0, 69.0, 59.0, 85.0, 65.0, 47.0, 47.0, 39.0, 38.0, 33.0, 36.0, 24.0, 18.0, 14.0, 14.0, 11.0, 10.0, 8.0, 6.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0006766319274902344, -0.0006583631038665771, -0.0006400942802429199, -0.0006218254566192627, -0.0006035566329956055, -0.0005852878093719482, -0.000567018985748291, -0.0005487501621246338, -0.0005304813385009766, -0.0005122125148773193, -0.0004939436912536621, -0.0004756748676300049, -0.00045740604400634766, -0.00043913722038269043, -0.0004208683967590332, -0.000402599573135376, -0.00038433074951171875, -0.0003660619258880615, -0.0003477931022644043, -0.00032952427864074707, -0.00031125545501708984, -0.0002929866313934326, -0.0002747178077697754, -0.00025644898414611816, -0.00023818016052246094, -0.0002199113368988037, -0.00020164251327514648, -0.00018337368965148926, -0.00016510486602783203, -0.0001468360424041748, -0.00012856721878051758, -0.00011029839515686035, -9.202957153320312e-05, -7.37607479095459e-05, -5.549192428588867e-05, -3.7223100662231445e-05, -1.895427703857422e-05, -6.854534149169922e-07, 1.7583370208740234e-05, 3.585219383239746e-05, 5.412101745605469e-05, 7.238984107971191e-05, 9.065866470336914e-05, 0.00010892748832702637, 0.0001271963119506836, 0.00014546513557434082, 0.00016373395919799805, 0.00018200278282165527, 0.0002002716064453125, 0.00021854043006896973, 0.00023680925369262695, 0.0002550780773162842, 0.0002733469009399414, 0.00029161572456359863, 0.00030988454818725586, 0.0003281533718109131, 0.0003464221954345703, 0.00036469101905822754, 0.00038295984268188477, 0.000401228666305542, 0.0004194974899291992, 0.00043776631355285645, 0.00045603513717651367, 0.0004743039608001709, 0.0004925727844238281]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 5.0, 5.0, 4.0, 8.0, 8.0, 8.0, 18.0, 39.0, 37.0, 48.0, 87.0, 133.0, 192.0, 249.0, 421.0, 658.0, 1085.0, 1579.0, 2375.0, 3842.0, 5830.0, 9224.0, 14802.0, 22856.0, 36248.0, 55656.0, 82548.0, 114791.0, 142052.0, 147771.0, 127001.0, 94783.0, 65516.0, 42587.0, 27614.0, 17436.0, 11167.0, 7109.0, 4575.0, 2852.0, 1808.0, 1226.0, 821.0, 526.0, 343.0, 212.0, 136.0, 100.0, 52.0, 44.0, 27.0, 19.0, 13.0, 6.0, 3.0, 7.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-4.6953125, -4.5447998046875, -4.394287109375, -4.2437744140625, -4.09326171875, -3.9427490234375, -3.792236328125, -3.6417236328125, -3.4912109375, -3.3406982421875, -3.190185546875, -3.0396728515625, -2.88916015625, -2.7386474609375, -2.588134765625, -2.4376220703125, -2.287109375, -2.1365966796875, -1.986083984375, -1.8355712890625, -1.68505859375, -1.5345458984375, -1.384033203125, -1.2335205078125, -1.0830078125, -0.9324951171875, -0.781982421875, -0.6314697265625, -0.48095703125, -0.3304443359375, -0.179931640625, -0.0294189453125, 0.12109375, 0.2716064453125, 0.422119140625, 0.5726318359375, 0.72314453125, 0.8736572265625, 1.024169921875, 1.1746826171875, 1.3251953125, 1.4757080078125, 1.626220703125, 1.7767333984375, 1.92724609375, 2.0777587890625, 2.228271484375, 2.3787841796875, 2.529296875, 2.6798095703125, 2.830322265625, 2.9808349609375, 3.13134765625, 3.2818603515625, 3.432373046875, 3.5828857421875, 3.7333984375, 3.8839111328125, 4.034423828125, 4.1849365234375, 4.33544921875, 4.4859619140625, 4.636474609375, 4.7869873046875, 4.9375]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 3.0, 3.0, 5.0, 8.0, 6.0, 12.0, 15.0, 18.0, 11.0, 27.0, 32.0, 42.0, 39.0, 62.0, 72.0, 69.0, 70.0, 65.0, 65.0, 65.0, 52.0, 51.0, 44.0, 41.0, 34.0, 22.0, 12.0, 17.0, 7.0, 11.0, 3.0, 6.0, 10.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.705078125, -2.6207275390625, -2.536376953125, -2.4520263671875, -2.36767578125, -2.2833251953125, -2.198974609375, -2.1146240234375, -2.0302734375, -1.9459228515625, -1.861572265625, -1.7772216796875, -1.69287109375, -1.6085205078125, -1.524169921875, -1.4398193359375, -1.35546875, -1.2711181640625, -1.186767578125, -1.1024169921875, -1.01806640625, -0.9337158203125, -0.849365234375, -0.7650146484375, -0.6806640625, -0.5963134765625, -0.511962890625, -0.4276123046875, -0.34326171875, -0.2589111328125, -0.174560546875, -0.0902099609375, -0.005859375, 0.0784912109375, 0.162841796875, 0.2471923828125, 0.33154296875, 0.4158935546875, 0.500244140625, 0.5845947265625, 0.6689453125, 0.7532958984375, 0.837646484375, 0.9219970703125, 1.00634765625, 1.0906982421875, 1.175048828125, 1.2593994140625, 1.34375, 1.4281005859375, 1.512451171875, 1.5968017578125, 1.68115234375, 1.7655029296875, 1.849853515625, 1.9342041015625, 2.0185546875, 2.1029052734375, 2.187255859375, 2.2716064453125, 2.35595703125, 2.4403076171875, 2.524658203125, 2.6090087890625, 2.693359375]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 3.0, 8.0, 3.0, 9.0, 14.0, 11.0, 11.0, 21.0, 20.0, 20.0, 23.0, 23.0, 32.0, 42.0, 46.0, 53.0, 43.0, 55.0, 59.0, 45.0, 61.0, 51.0, 46.0, 48.0, 49.0, 29.0, 27.0, 27.0, 25.0, 19.0, 15.0, 14.0, 15.0, 8.0, 5.0, 7.0, 7.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-21.220605850219727, -20.625181198120117, -20.029754638671875, -19.434329986572266, -18.838905334472656, -18.243478775024414, -17.648054122924805, -17.052627563476562, -16.457202911376953, -15.861777305603027, -15.266351699829102, -14.670927047729492, -14.075501441955566, -13.48007583618164, -12.884651184082031, -12.289225578308105, -11.69379997253418, -11.098374366760254, -10.502948760986328, -9.907524108886719, -9.312098503112793, -8.716672897338867, -8.121248245239258, -7.525822639465332, -6.930397033691406, -6.3349714279174805, -5.739546298980713, -5.144121170043945, -4.5486955642700195, -3.953270196914673, -3.357844829559326, -2.7624197006225586, -2.166994094848633, -1.5715687274932861, -0.9761433601379395, -0.3807179927825928, 0.2147073745727539, 0.8101327419281006, 1.4055581092834473, 2.000983238220215, 2.5964088439941406, 3.1918342113494873, 3.787259578704834, 4.382684707641602, 4.978110313415527, 5.573535919189453, 6.168961048126221, 6.764386177062988, 7.359811782836914, 7.95523738861084, 8.550662994384766, 9.146087646484375, 9.7415132522583, 10.336938858032227, 10.932363510131836, 11.527789115905762, 12.123214721679688, 12.718640327453613, 13.314065933227539, 13.909490585327148, 14.504916191101074, 15.100341796875, 15.69576644897461, 16.29119110107422, 16.88661766052246]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 6.0, 4.0, 0.0, 3.0, 2.0, 11.0, 15.0, 9.0, 13.0, 10.0, 15.0, 18.0, 25.0, 31.0, 21.0, 23.0, 34.0, 37.0, 33.0, 36.0, 34.0, 37.0, 47.0, 42.0, 40.0, 37.0, 42.0, 38.0, 31.0, 44.0, 33.0, 27.0, 31.0, 29.0, 33.0, 20.0, 16.0, 14.0, 9.0, 9.0, 12.0, 9.0, 12.0, 7.0, 6.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.57160186767578, -17.947532653808594, -17.32346534729004, -16.69939613342285, -16.075326919555664, -15.451258659362793, -14.827190399169922, -14.203121185302734, -13.579052925109863, -12.954984664916992, -12.330915451049805, -11.706847190856934, -11.082778930664062, -10.458709716796875, -9.834641456604004, -9.210573196411133, -8.586503982543945, -7.962435245513916, -7.338366508483887, -6.714298248291016, -6.090229511260986, -5.466160774230957, -4.842092514038086, -4.218023777008057, -3.5939550399780273, -2.969886302947998, -2.345817804336548, -1.721749186515808, -1.0976805686950684, -0.47361183166503906, 0.15045666694641113, 0.7745251655578613, 1.3985919952392578, 2.022660732269287, 2.6467292308807373, 3.2707977294921875, 3.894866466522217, 4.518935203552246, 5.143003463745117, 5.7670722007751465, 6.391140937805176, 7.015209674835205, 7.639278411865234, 8.263346672058105, 8.887414932250977, 9.511484146118164, 10.135552406311035, 10.759620666503906, 11.383689880371094, 12.007758140563965, 12.631827354431152, 13.255895614624023, 13.879964828491211, 14.504033088684082, 15.128101348876953, 15.75217056274414, 16.376239776611328, 17.000308990478516, 17.62437629699707, 18.248445510864258, 18.872514724731445, 19.49658203125, 20.120651245117188, 20.744720458984375, 21.36878776550293]}, "gradients/decoder.bert.encoder.layer.21.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 6.0, 5.0, 16.0, 18.0, 40.0, 41.0, 50.0, 118.0, 166.0, 305.0, 428.0, 717.0, 1104.0, 1719.0, 2808.0, 4696.0, 7631.0, 12465.0, 20624.0, 34278.0, 57570.0, 98139.0, 166068.0, 278816.0, 445903.0, 631116.0, 713375.0, 618757.0, 431761.0, 269410.0, 159539.0, 94940.0, 56552.0, 33677.0, 20138.0, 12341.0, 7238.0, 4512.0, 2787.0, 1716.0, 1040.0, 650.0, 389.0, 244.0, 147.0, 97.0, 53.0, 33.0, 26.0, 9.0, 4.0, 8.0, 5.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.15625, -15.673583984375, -15.19091796875, -14.708251953125, -14.2255859375, -13.742919921875, -13.26025390625, -12.777587890625, -12.294921875, -11.812255859375, -11.32958984375, -10.846923828125, -10.3642578125, -9.881591796875, -9.39892578125, -8.916259765625, -8.43359375, -7.950927734375, -7.46826171875, -6.985595703125, -6.5029296875, -6.020263671875, -5.53759765625, -5.054931640625, -4.572265625, -4.089599609375, -3.60693359375, -3.124267578125, -2.6416015625, -2.158935546875, -1.67626953125, -1.193603515625, -0.7109375, -0.228271484375, 0.25439453125, 0.737060546875, 1.2197265625, 1.702392578125, 2.18505859375, 2.667724609375, 3.150390625, 3.633056640625, 4.11572265625, 4.598388671875, 5.0810546875, 5.563720703125, 6.04638671875, 6.529052734375, 7.01171875, 7.494384765625, 7.97705078125, 8.459716796875, 8.9423828125, 9.425048828125, 9.90771484375, 10.390380859375, 10.873046875, 11.355712890625, 11.83837890625, 12.321044921875, 12.8037109375, 13.286376953125, 13.76904296875, 14.251708984375, 14.734375]}, "gradients/decoder.bert.encoder.layer.21.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 2.0, 2.0, 4.0, 2.0, 8.0, 4.0, 11.0, 10.0, 10.0, 18.0, 13.0, 9.0, 20.0, 22.0, 17.0, 29.0, 26.0, 29.0, 42.0, 27.0, 38.0, 34.0, 32.0, 40.0, 48.0, 49.0, 40.0, 30.0, 38.0, 43.0, 30.0, 30.0, 30.0, 35.0, 30.0, 21.0, 22.0, 11.0, 16.0, 13.0, 10.0, 9.0, 9.0, 15.0, 10.0, 8.0, 5.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.8046875, -12.4061279296875, -12.007568359375, -11.6090087890625, -11.21044921875, -10.8118896484375, -10.413330078125, -10.0147705078125, -9.6162109375, -9.2176513671875, -8.819091796875, -8.4205322265625, -8.02197265625, -7.6234130859375, -7.224853515625, -6.8262939453125, -6.427734375, -6.0291748046875, -5.630615234375, -5.2320556640625, -4.83349609375, -4.4349365234375, -4.036376953125, -3.6378173828125, -3.2392578125, -2.8406982421875, -2.442138671875, -2.0435791015625, -1.64501953125, -1.2464599609375, -0.847900390625, -0.4493408203125, -0.05078125, 0.3477783203125, 0.746337890625, 1.1448974609375, 1.54345703125, 1.9420166015625, 2.340576171875, 2.7391357421875, 3.1376953125, 3.5362548828125, 3.934814453125, 4.3333740234375, 4.73193359375, 5.1304931640625, 5.529052734375, 5.9276123046875, 6.326171875, 6.7247314453125, 7.123291015625, 7.5218505859375, 7.92041015625, 8.3189697265625, 8.717529296875, 9.1160888671875, 9.5146484375, 9.9132080078125, 10.311767578125, 10.7103271484375, 11.10888671875, 11.5074462890625, 11.906005859375, 12.3045654296875, 12.703125]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 8.0, 13.0, 13.0, 23.0, 34.0, 47.0, 72.0, 134.0, 195.0, 273.0, 420.0, 698.0, 1063.0, 1711.0, 2644.0, 4270.0, 6723.0, 10926.0, 17696.0, 28958.0, 46054.0, 74031.0, 117706.0, 182226.0, 270297.0, 379566.0, 488633.0, 552718.0, 539856.0, 455516.0, 343846.0, 239830.0, 158859.0, 101302.0, 63899.0, 39741.0, 24431.0, 15079.0, 9372.0, 5676.0, 3590.0, 2230.0, 1443.0, 868.0, 580.0, 389.0, 227.0, 159.0, 102.0, 61.0, 40.0, 25.0, 11.0, 7.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.2109375, -10.835205078125, -10.45947265625, -10.083740234375, -9.7080078125, -9.332275390625, -8.95654296875, -8.580810546875, -8.205078125, -7.829345703125, -7.45361328125, -7.077880859375, -6.7021484375, -6.326416015625, -5.95068359375, -5.574951171875, -5.19921875, -4.823486328125, -4.44775390625, -4.072021484375, -3.6962890625, -3.320556640625, -2.94482421875, -2.569091796875, -2.193359375, -1.817626953125, -1.44189453125, -1.066162109375, -0.6904296875, -0.314697265625, 0.06103515625, 0.436767578125, 0.8125, 1.188232421875, 1.56396484375, 1.939697265625, 2.3154296875, 2.691162109375, 3.06689453125, 3.442626953125, 3.818359375, 4.194091796875, 4.56982421875, 4.945556640625, 5.3212890625, 5.697021484375, 6.07275390625, 6.448486328125, 6.82421875, 7.199951171875, 7.57568359375, 7.951416015625, 8.3271484375, 8.702880859375, 9.07861328125, 9.454345703125, 9.830078125, 10.205810546875, 10.58154296875, 10.957275390625, 11.3330078125, 11.708740234375, 12.08447265625, 12.460205078125, 12.8359375]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 6.0, 5.0, 7.0, 7.0, 6.0, 19.0, 19.0, 19.0, 33.0, 30.0, 30.0, 48.0, 68.0, 96.0, 80.0, 103.0, 120.0, 132.0, 145.0, 136.0, 169.0, 187.0, 186.0, 194.0, 206.0, 227.0, 202.0, 194.0, 202.0, 185.0, 165.0, 133.0, 131.0, 83.0, 102.0, 81.0, 57.0, 57.0, 39.0, 38.0, 38.0, 23.0, 17.0, 13.0, 9.0, 3.0, 11.0, 10.0, 3.0, 2.0, 1.0, 3.0, 4.0, 1.0, 1.0, 1.0], "bins": [-6.0546875, -5.8720703125, -5.689453125, -5.5068359375, -5.32421875, -5.1416015625, -4.958984375, -4.7763671875, -4.59375, -4.4111328125, -4.228515625, -4.0458984375, -3.86328125, -3.6806640625, -3.498046875, -3.3154296875, -3.1328125, -2.9501953125, -2.767578125, -2.5849609375, -2.40234375, -2.2197265625, -2.037109375, -1.8544921875, -1.671875, -1.4892578125, -1.306640625, -1.1240234375, -0.94140625, -0.7587890625, -0.576171875, -0.3935546875, -0.2109375, -0.0283203125, 0.154296875, 0.3369140625, 0.51953125, 0.7021484375, 0.884765625, 1.0673828125, 1.25, 1.4326171875, 1.615234375, 1.7978515625, 1.98046875, 2.1630859375, 2.345703125, 2.5283203125, 2.7109375, 2.8935546875, 3.076171875, 3.2587890625, 3.44140625, 3.6240234375, 3.806640625, 3.9892578125, 4.171875, 4.3544921875, 4.537109375, 4.7197265625, 4.90234375, 5.0849609375, 5.267578125, 5.4501953125, 5.6328125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 7.0, 6.0, 9.0, 15.0, 13.0, 18.0, 13.0, 19.0, 19.0, 34.0, 31.0, 37.0, 59.0, 52.0, 54.0, 51.0, 66.0, 68.0, 69.0, 47.0, 44.0, 52.0, 37.0, 28.0, 33.0, 24.0, 23.0, 17.0, 13.0, 3.0, 12.0, 9.0, 4.0, 4.0, 3.0, 5.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.218477249145508, -18.69745445251465, -18.176429748535156, -17.655406951904297, -17.134384155273438, -16.613359451293945, -16.092336654663086, -15.57131290435791, -15.050289154052734, -14.529265403747559, -14.008241653442383, -13.487218856811523, -12.966195106506348, -12.445171356201172, -11.924148559570312, -11.403124809265137, -10.882101058959961, -10.361077308654785, -9.84005355834961, -9.31903076171875, -8.798007011413574, -8.276983261108398, -7.755959987640381, -7.234936714172363, -6.7139129638671875, -6.192889213562012, -5.671865940093994, -5.150842666625977, -4.629818916320801, -4.108795166015625, -3.5877718925476074, -3.0667483806610107, -2.5457258224487305, -2.024702310562134, -1.503678798675537, -0.9826552867889404, -0.46163177490234375, 0.05939173698425293, 0.5804152488708496, 1.1014387607574463, 1.622462272644043, 2.1434857845306396, 2.6645092964172363, 3.185532808303833, 3.7065563201904297, 4.2275800704956055, 4.748603343963623, 5.269626617431641, 5.790650367736816, 6.311674118041992, 6.83269739151001, 7.353720664978027, 7.874744415283203, 8.395768165588379, 8.916791915893555, 9.437814712524414, 9.95883846282959, 10.479862213134766, 11.000885009765625, 11.5219087600708, 12.042932510375977, 12.563956260681152, 13.084980010986328, 13.606002807617188, 14.127026557922363]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 0.0, 3.0, 5.0, 6.0, 5.0, 5.0, 5.0, 10.0, 11.0, 7.0, 13.0, 18.0, 13.0, 25.0, 23.0, 31.0, 18.0, 27.0, 34.0, 19.0, 43.0, 30.0, 35.0, 43.0, 22.0, 39.0, 27.0, 36.0, 37.0, 32.0, 35.0, 30.0, 38.0, 32.0, 36.0, 32.0, 25.0, 19.0, 25.0, 26.0, 11.0, 9.0, 14.0, 10.0, 8.0, 9.0, 8.0, 8.0, 1.0, 2.0, 2.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-15.207460403442383, -14.747198104858398, -14.286935806274414, -13.82667350769043, -13.366411209106445, -12.906148910522461, -12.445886611938477, -11.985624313354492, -11.525362014770508, -11.065099716186523, -10.604837417602539, -10.144575119018555, -9.68431282043457, -9.224050521850586, -8.763788223266602, -8.303525924682617, -7.843262672424316, -7.383000373840332, -6.922738075256348, -6.462475776672363, -6.002213478088379, -5.5419511795043945, -5.081688404083252, -4.621426105499268, -4.161163806915283, -3.700901508331299, -3.2406392097473145, -2.780376672744751, -2.3201143741607666, -1.8598520755767822, -1.3995895385742188, -0.9393272399902344, -0.4790658950805664, -0.018803536891937256, 0.4414588212966919, 0.9017212390899658, 1.3619835376739502, 1.8222458362579346, 2.282508373260498, 2.7427706718444824, 3.203032970428467, 3.663295269012451, 4.1235575675964355, 4.583820343017578, 5.0440826416015625, 5.504344940185547, 5.964607238769531, 6.424869537353516, 6.8851318359375, 7.345394134521484, 7.805656433105469, 8.265918731689453, 8.726181030273438, 9.186443328857422, 9.646705627441406, 10.10696792602539, 10.567230224609375, 11.02749252319336, 11.487754821777344, 11.948017120361328, 12.408279418945312, 12.868541717529297, 13.328804016113281, 13.789066314697266, 14.249329566955566]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 7.0, 14.0, 18.0, 29.0, 35.0, 45.0, 39.0, 110.0, 140.0, 173.0, 276.0, 459.0, 737.0, 1178.0, 1779.0, 2953.0, 4730.0, 8091.0, 13756.0, 23422.0, 40439.0, 71634.0, 124372.0, 204183.0, 220151.0, 139103.0, 80264.0, 45853.0, 26127.0, 15174.0, 9252.0, 5363.0, 3150.0, 2040.0, 1244.0, 748.0, 501.0, 304.0, 211.0, 142.0, 102.0, 73.0, 32.0, 39.0, 21.0, 19.0, 9.0, 10.0, 6.0, 3.0, 3.0, 0.0, 0.0, 3.0, 2.0], "bins": [-5.98046875, -5.7998046875, -5.619140625, -5.4384765625, -5.2578125, -5.0771484375, -4.896484375, -4.7158203125, -4.53515625, -4.3544921875, -4.173828125, -3.9931640625, -3.8125, -3.6318359375, -3.451171875, -3.2705078125, -3.08984375, -2.9091796875, -2.728515625, -2.5478515625, -2.3671875, -2.1865234375, -2.005859375, -1.8251953125, -1.64453125, -1.4638671875, -1.283203125, -1.1025390625, -0.921875, -0.7412109375, -0.560546875, -0.3798828125, -0.19921875, -0.0185546875, 0.162109375, 0.3427734375, 0.5234375, 0.7041015625, 0.884765625, 1.0654296875, 1.24609375, 1.4267578125, 1.607421875, 1.7880859375, 1.96875, 2.1494140625, 2.330078125, 2.5107421875, 2.69140625, 2.8720703125, 3.052734375, 3.2333984375, 3.4140625, 3.5947265625, 3.775390625, 3.9560546875, 4.13671875, 4.3173828125, 4.498046875, 4.6787109375, 4.859375, 5.0400390625, 5.220703125, 5.4013671875, 5.58203125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 6.0, 6.0, 6.0, 7.0, 14.0, 11.0, 12.0, 10.0, 20.0, 19.0, 26.0, 27.0, 22.0, 20.0, 33.0, 20.0, 36.0, 42.0, 40.0, 38.0, 45.0, 37.0, 34.0, 34.0, 37.0, 33.0, 35.0, 31.0, 36.0, 39.0, 32.0, 30.0, 34.0, 28.0, 18.0, 16.0, 13.0, 11.0, 8.0, 7.0, 8.0, 6.0, 7.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-16.875, -16.3800048828125, -15.885009765625, -15.3900146484375, -14.89501953125, -14.4000244140625, -13.905029296875, -13.4100341796875, -12.9150390625, -12.4200439453125, -11.925048828125, -11.4300537109375, -10.93505859375, -10.4400634765625, -9.945068359375, -9.4500732421875, -8.955078125, -8.4600830078125, -7.965087890625, -7.4700927734375, -6.97509765625, -6.4801025390625, -5.985107421875, -5.4901123046875, -4.9951171875, -4.5001220703125, -4.005126953125, -3.5101318359375, -3.01513671875, -2.5201416015625, -2.025146484375, -1.5301513671875, -1.03515625, -0.5401611328125, -0.045166015625, 0.4498291015625, 0.94482421875, 1.4398193359375, 1.934814453125, 2.4298095703125, 2.9248046875, 3.4197998046875, 3.914794921875, 4.4097900390625, 4.90478515625, 5.3997802734375, 5.894775390625, 6.3897705078125, 6.884765625, 7.3797607421875, 7.874755859375, 8.3697509765625, 8.86474609375, 9.3597412109375, 9.854736328125, 10.3497314453125, 10.8447265625, 11.3397216796875, 11.834716796875, 12.3297119140625, 12.82470703125, 13.3197021484375, 13.814697265625, 14.3096923828125, 14.8046875]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 3.0, 1.0, 3.0, 3.0, 9.0, 12.0, 20.0, 22.0, 32.0, 66.0, 116.0, 178.0, 286.0, 497.0, 843.0, 1443.0, 2689.0, 4736.0, 8992.0, 17068.0, 34516.0, 68840.0, 135501.0, 243271.0, 246461.0, 139103.0, 70472.0, 35074.0, 17732.0, 9393.0, 4817.0, 2582.0, 1598.0, 866.0, 511.0, 315.0, 178.0, 112.0, 73.0, 34.0, 34.0, 18.0, 13.0, 7.0, 8.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0], "bins": [-4.89453125, -4.74627685546875, -4.5980224609375, -4.44976806640625, -4.301513671875, -4.15325927734375, -4.0050048828125, -3.85675048828125, -3.70849609375, -3.56024169921875, -3.4119873046875, -3.26373291015625, -3.115478515625, -2.96722412109375, -2.8189697265625, -2.67071533203125, -2.5224609375, -2.37420654296875, -2.2259521484375, -2.07769775390625, -1.929443359375, -1.78118896484375, -1.6329345703125, -1.48468017578125, -1.33642578125, -1.18817138671875, -1.0399169921875, -0.89166259765625, -0.743408203125, -0.59515380859375, -0.4468994140625, -0.29864501953125, -0.150390625, -0.00213623046875, 0.1461181640625, 0.29437255859375, 0.442626953125, 0.59088134765625, 0.7391357421875, 0.88739013671875, 1.03564453125, 1.18389892578125, 1.3321533203125, 1.48040771484375, 1.628662109375, 1.77691650390625, 1.9251708984375, 2.07342529296875, 2.2216796875, 2.36993408203125, 2.5181884765625, 2.66644287109375, 2.814697265625, 2.96295166015625, 3.1112060546875, 3.25946044921875, 3.40771484375, 3.55596923828125, 3.7042236328125, 3.85247802734375, 4.000732421875, 4.14898681640625, 4.2972412109375, 4.44549560546875, 4.59375]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 4.0, 4.0, 2.0, 6.0, 4.0, 4.0, 3.0, 8.0, 13.0, 8.0, 11.0, 11.0, 14.0, 25.0, 26.0, 27.0, 39.0, 26.0, 28.0, 42.0, 34.0, 37.0, 53.0, 36.0, 46.0, 30.0, 55.0, 48.0, 41.0, 25.0, 29.0, 30.0, 25.0, 29.0, 26.0, 18.0, 25.0, 17.0, 20.0, 22.0, 14.0, 13.0, 5.0, 6.0, 4.0, 5.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.1640625, -10.80908203125, -10.4541015625, -10.09912109375, -9.744140625, -9.38916015625, -9.0341796875, -8.67919921875, -8.32421875, -7.96923828125, -7.6142578125, -7.25927734375, -6.904296875, -6.54931640625, -6.1943359375, -5.83935546875, -5.484375, -5.12939453125, -4.7744140625, -4.41943359375, -4.064453125, -3.70947265625, -3.3544921875, -2.99951171875, -2.64453125, -2.28955078125, -1.9345703125, -1.57958984375, -1.224609375, -0.86962890625, -0.5146484375, -0.15966796875, 0.1953125, 0.55029296875, 0.9052734375, 1.26025390625, 1.615234375, 1.97021484375, 2.3251953125, 2.68017578125, 3.03515625, 3.39013671875, 3.7451171875, 4.10009765625, 4.455078125, 4.81005859375, 5.1650390625, 5.52001953125, 5.875, 6.22998046875, 6.5849609375, 6.93994140625, 7.294921875, 7.64990234375, 8.0048828125, 8.35986328125, 8.71484375, 9.06982421875, 9.4248046875, 9.77978515625, 10.134765625, 10.48974609375, 10.8447265625, 11.19970703125, 11.5546875]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 7.0, 5.0, 11.0, 9.0, 25.0, 34.0, 41.0, 44.0, 80.0, 121.0, 179.0, 286.0, 413.0, 636.0, 935.0, 1594.0, 2560.0, 4322.0, 7675.0, 14412.0, 28094.0, 58789.0, 129384.0, 289155.0, 274057.0, 121112.0, 55468.0, 26920.0, 13813.0, 7393.0, 4233.0, 2499.0, 1518.0, 920.0, 613.0, 386.0, 271.0, 163.0, 133.0, 78.0, 49.0, 34.0, 33.0, 20.0, 11.0, 11.0, 3.0, 7.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.88134765625, -0.8528823852539062, -0.8244171142578125, -0.7959518432617188, -0.767486572265625, -0.7390213012695312, -0.7105560302734375, -0.6820907592773438, -0.65362548828125, -0.6251602172851562, -0.5966949462890625, -0.5682296752929688, -0.539764404296875, -0.5112991333007812, -0.4828338623046875, -0.45436859130859375, -0.4259033203125, -0.39743804931640625, -0.3689727783203125, -0.34050750732421875, -0.312042236328125, -0.28357696533203125, -0.2551116943359375, -0.22664642333984375, -0.19818115234375, -0.16971588134765625, -0.1412506103515625, -0.11278533935546875, -0.084320068359375, -0.05585479736328125, -0.0273895263671875, 0.00107574462890625, 0.029541015625, 0.05800628662109375, 0.0864715576171875, 0.11493682861328125, 0.143402099609375, 0.17186737060546875, 0.2003326416015625, 0.22879791259765625, 0.25726318359375, 0.28572845458984375, 0.3141937255859375, 0.34265899658203125, 0.371124267578125, 0.39958953857421875, 0.4280548095703125, 0.45652008056640625, 0.4849853515625, 0.5134506225585938, 0.5419158935546875, 0.5703811645507812, 0.598846435546875, 0.6273117065429688, 0.6557769775390625, 0.6842422485351562, 0.71270751953125, 0.7411727905273438, 0.7696380615234375, 0.7981033325195312, 0.826568603515625, 0.8550338745117188, 0.8834991455078125, 0.9119644165039062, 0.9404296875]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 3.0, 6.0, 5.0, 5.0, 9.0, 6.0, 9.0, 8.0, 25.0, 22.0, 39.0, 37.0, 63.0, 88.0, 109.0, 106.0, 115.0, 91.0, 62.0, 39.0, 32.0, 25.0, 24.0, 19.0, 15.0, 10.0, 7.0, 6.0, 6.0, 5.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00021314620971679688, -0.00020592659711837769, -0.0001987069845199585, -0.0001914873719215393, -0.00018426775932312012, -0.00017704814672470093, -0.00016982853412628174, -0.00016260892152786255, -0.00015538930892944336, -0.00014816969633102417, -0.00014095008373260498, -0.0001337304711341858, -0.0001265108585357666, -0.00011929124593734741, -0.00011207163333892822, -0.00010485202074050903, -9.763240814208984e-05, -9.041279554367065e-05, -8.319318294525146e-05, -7.597357034683228e-05, -6.875395774841309e-05, -6.15343451499939e-05, -5.431473255157471e-05, -4.709511995315552e-05, -3.987550735473633e-05, -3.265589475631714e-05, -2.543628215789795e-05, -1.821666955947876e-05, -1.099705696105957e-05, -3.777444362640381e-06, 3.4421682357788086e-06, 1.0661780834197998e-05, 1.7881393432617188e-05, 2.5101006031036377e-05, 3.2320618629455566e-05, 3.9540231227874756e-05, 4.6759843826293945e-05, 5.3979456424713135e-05, 6.119906902313232e-05, 6.841868162155151e-05, 7.56382942199707e-05, 8.285790681838989e-05, 9.007751941680908e-05, 9.729713201522827e-05, 0.00010451674461364746, 0.00011173635721206665, 0.00011895596981048584, 0.00012617558240890503, 0.00013339519500732422, 0.0001406148076057434, 0.0001478344202041626, 0.0001550540328025818, 0.00016227364540100098, 0.00016949325799942017, 0.00017671287059783936, 0.00018393248319625854, 0.00019115209579467773, 0.00019837170839309692, 0.0002055913209915161, 0.0002128109335899353, 0.0002200305461883545, 0.00022725015878677368, 0.00023446977138519287, 0.00024168938398361206, 0.00024890899658203125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 4.0, 6.0, 13.0, 20.0, 23.0, 37.0, 70.0, 107.0, 155.0, 297.0, 429.0, 719.0, 1109.0, 1916.0, 3427.0, 6191.0, 12241.0, 25949.0, 58272.0, 143000.0, 342665.0, 264375.0, 103040.0, 43171.0, 19701.0, 9656.0, 5012.0, 2778.0, 1564.0, 996.0, 620.0, 377.0, 206.0, 157.0, 102.0, 52.0, 29.0, 19.0, 20.0, 8.0, 8.0, 3.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.859375, -1.8009490966796875, -1.742523193359375, -1.6840972900390625, -1.62567138671875, -1.5672454833984375, -1.508819580078125, -1.4503936767578125, -1.3919677734375, -1.3335418701171875, -1.275115966796875, -1.2166900634765625, -1.15826416015625, -1.0998382568359375, -1.041412353515625, -0.9829864501953125, -0.924560546875, -0.8661346435546875, -0.807708740234375, -0.7492828369140625, -0.69085693359375, -0.6324310302734375, -0.574005126953125, -0.5155792236328125, -0.4571533203125, -0.3987274169921875, -0.340301513671875, -0.2818756103515625, -0.22344970703125, -0.1650238037109375, -0.106597900390625, -0.0481719970703125, 0.01025390625, 0.0686798095703125, 0.127105712890625, 0.1855316162109375, 0.24395751953125, 0.3023834228515625, 0.360809326171875, 0.4192352294921875, 0.4776611328125, 0.5360870361328125, 0.594512939453125, 0.6529388427734375, 0.71136474609375, 0.7697906494140625, 0.828216552734375, 0.8866424560546875, 0.945068359375, 1.0034942626953125, 1.061920166015625, 1.1203460693359375, 1.17877197265625, 1.2371978759765625, 1.295623779296875, 1.3540496826171875, 1.4124755859375, 1.4709014892578125, 1.529327392578125, 1.5877532958984375, 1.64617919921875, 1.7046051025390625, 1.763031005859375, 1.8214569091796875, 1.8798828125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 2.0, 1.0, 7.0, 2.0, 9.0, 11.0, 11.0, 16.0, 19.0, 40.0, 52.0, 102.0, 171.0, 167.0, 135.0, 85.0, 46.0, 34.0, 18.0, 15.0, 13.0, 5.0, 8.0, 1.0, 3.0, 6.0, 0.0, 1.0, 5.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.62255859375, -0.6006622314453125, -0.578765869140625, -0.5568695068359375, -0.53497314453125, -0.5130767822265625, -0.491180419921875, -0.4692840576171875, -0.4473876953125, -0.4254913330078125, -0.403594970703125, -0.3816986083984375, -0.35980224609375, -0.3379058837890625, -0.316009521484375, -0.2941131591796875, -0.272216796875, -0.2503204345703125, -0.228424072265625, -0.2065277099609375, -0.18463134765625, -0.1627349853515625, -0.140838623046875, -0.1189422607421875, -0.0970458984375, -0.0751495361328125, -0.053253173828125, -0.0313568115234375, -0.00946044921875, 0.0124359130859375, 0.034332275390625, 0.0562286376953125, 0.078125, 0.1000213623046875, 0.121917724609375, 0.1438140869140625, 0.16571044921875, 0.1876068115234375, 0.209503173828125, 0.2313995361328125, 0.2532958984375, 0.2751922607421875, 0.297088623046875, 0.3189849853515625, 0.34088134765625, 0.3627777099609375, 0.384674072265625, 0.4065704345703125, 0.428466796875, 0.4503631591796875, 0.472259521484375, 0.4941558837890625, 0.51605224609375, 0.5379486083984375, 0.559844970703125, 0.5817413330078125, 0.6036376953125, 0.6255340576171875, 0.647430419921875, 0.6693267822265625, 0.69122314453125, 0.7131195068359375, 0.735015869140625, 0.7569122314453125, 0.77880859375]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 5.0, 4.0, 6.0, 5.0, 8.0, 12.0, 15.0, 16.0, 11.0, 22.0, 22.0, 21.0, 38.0, 32.0, 56.0, 45.0, 60.0, 56.0, 58.0, 66.0, 65.0, 50.0, 46.0, 50.0, 47.0, 27.0, 31.0, 31.0, 21.0, 15.0, 17.0, 10.0, 11.0, 9.0, 5.0, 4.0, 3.0, 6.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-19.114295959472656, -18.61176872253418, -18.109243392944336, -17.60671615600586, -17.104188919067383, -16.60166358947754, -16.099136352539062, -15.596610069274902, -15.094083786010742, -14.591557502746582, -14.089030265808105, -13.586503982543945, -13.083977699279785, -12.581451416015625, -12.078924179077148, -11.576397895812988, -11.073870658874512, -10.571344375610352, -10.068817138671875, -9.566290855407715, -9.063764572143555, -8.561237335205078, -8.058711051940918, -7.556184768676758, -7.0536580085754395, -6.551131248474121, -6.048604965209961, -5.546078205108643, -5.043551445007324, -4.541025161743164, -4.038498401641846, -3.5359718799591064, -3.033444404602051, -2.5309178829193115, -2.0283913612365723, -1.525864601135254, -1.0233380794525146, -0.5208115577697754, -0.01828479766845703, 0.4842417240142822, 0.9867682456970215, 1.4892947673797607, 1.9918214082717896, 2.4943480491638184, 2.9968745708465576, 3.499401092529297, 4.001927852630615, 4.504454612731934, 5.006980895996094, 5.509507656097412, 6.012033939361572, 6.514560699462891, 7.017086982727051, 7.519613742828369, 8.022140502929688, 8.524666786193848, 9.027193069458008, 9.529719352722168, 10.032246589660645, 10.534772872924805, 11.037299156188965, 11.539825439453125, 12.042352676391602, 12.544878959655762, 13.047406196594238]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 5.0, 6.0, 5.0, 5.0, 5.0, 9.0, 10.0, 6.0, 14.0, 18.0, 16.0, 17.0, 27.0, 24.0, 25.0, 18.0, 36.0, 22.0, 37.0, 36.0, 35.0, 38.0, 35.0, 31.0, 26.0, 29.0, 41.0, 31.0, 36.0, 29.0, 39.0, 38.0, 28.0, 34.0, 30.0, 16.0, 28.0, 23.0, 17.0, 10.0, 9.0, 13.0, 7.0, 10.0, 8.0, 11.0, 1.0, 4.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0], "bins": [-14.888989448547363, -14.444135665893555, -13.999282836914062, -13.554429054260254, -13.109575271606445, -12.664722442626953, -12.219868659973145, -11.775014877319336, -11.330162048339844, -10.885308265686035, -10.440455436706543, -9.995601654052734, -9.550748825073242, -9.105895042419434, -8.661041259765625, -8.216188430786133, -7.771334648132324, -7.326481342315674, -6.881628036499023, -6.436774253845215, -5.9919209480285645, -5.547067642211914, -5.1022138595581055, -4.657360553741455, -4.212507247924805, -3.7676539421081543, -3.322800397872925, -2.8779468536376953, -2.433093547821045, -1.9882402420043945, -1.543386697769165, -1.0985331535339355, -0.6536808013916016, -0.20882737636566162, 0.23602604866027832, 0.6808794736862183, 1.1257328987121582, 1.5705862045288086, 2.015439748764038, 2.4602932929992676, 2.905146598815918, 3.3499999046325684, 3.794853448867798, 4.239706993103027, 4.684560298919678, 5.129413604736328, 5.574267387390137, 6.019120693206787, 6.4639739990234375, 6.908827304840088, 7.353680610656738, 7.798534393310547, 8.243387222290039, 8.688241004943848, 9.133094787597656, 9.577947616577148, 10.022801399230957, 10.467655181884766, 10.912508010864258, 11.357361793518066, 11.802215576171875, 12.247068405151367, 12.691922187805176, 13.136775970458984, 13.581628799438477]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.weight": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 4.0, 3.0, 5.0, 15.0, 16.0, 28.0, 32.0, 59.0, 66.0, 107.0, 167.0, 250.0, 320.0, 500.0, 711.0, 1170.0, 1687.0, 2571.0, 3827.0, 5681.0, 8317.0, 12439.0, 18298.0, 27030.0, 39222.0, 55427.0, 75800.0, 97947.0, 115806.0, 122375.0, 114855.0, 96201.0, 74314.0, 54024.0, 38322.0, 26038.0, 17737.0, 12473.0, 8222.0, 5502.0, 3676.0, 2421.0, 1602.0, 1100.0, 700.0, 467.0, 347.0, 215.0, 149.0, 92.0, 71.0, 48.0, 32.0, 21.0, 25.0, 14.0, 6.0, 6.0, 6.0, 1.0, 1.0], "bins": [-13.1171875, -12.713134765625, -12.30908203125, -11.905029296875, -11.5009765625, -11.096923828125, -10.69287109375, -10.288818359375, -9.884765625, -9.480712890625, -9.07666015625, -8.672607421875, -8.2685546875, -7.864501953125, -7.46044921875, -7.056396484375, -6.65234375, -6.248291015625, -5.84423828125, -5.440185546875, -5.0361328125, -4.632080078125, -4.22802734375, -3.823974609375, -3.419921875, -3.015869140625, -2.61181640625, -2.207763671875, -1.8037109375, -1.399658203125, -0.99560546875, -0.591552734375, -0.1875, 0.216552734375, 0.62060546875, 1.024658203125, 1.4287109375, 1.832763671875, 2.23681640625, 2.640869140625, 3.044921875, 3.448974609375, 3.85302734375, 4.257080078125, 4.6611328125, 5.065185546875, 5.46923828125, 5.873291015625, 6.27734375, 6.681396484375, 7.08544921875, 7.489501953125, 7.8935546875, 8.297607421875, 8.70166015625, 9.105712890625, 9.509765625, 9.913818359375, 10.31787109375, 10.721923828125, 11.1259765625, 11.530029296875, 11.93408203125, 12.338134765625, 12.7421875]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 5.0, 6.0, 5.0, 4.0, 7.0, 10.0, 10.0, 6.0, 13.0, 17.0, 16.0, 18.0, 23.0, 24.0, 15.0, 17.0, 25.0, 47.0, 25.0, 31.0, 30.0, 35.0, 40.0, 32.0, 35.0, 28.0, 37.0, 43.0, 30.0, 32.0, 39.0, 42.0, 25.0, 29.0, 29.0, 17.0, 22.0, 26.0, 18.0, 15.0, 16.0, 12.0, 5.0, 13.0, 8.0, 8.0, 3.0, 5.0, 1.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-13.6953125, -13.2691650390625, -12.843017578125, -12.4168701171875, -11.99072265625, -11.5645751953125, -11.138427734375, -10.7122802734375, -10.2861328125, -9.8599853515625, -9.433837890625, -9.0076904296875, -8.58154296875, -8.1553955078125, -7.729248046875, -7.3031005859375, -6.876953125, -6.4508056640625, -6.024658203125, -5.5985107421875, -5.17236328125, -4.7462158203125, -4.320068359375, -3.8939208984375, -3.4677734375, -3.0416259765625, -2.615478515625, -2.1893310546875, -1.76318359375, -1.3370361328125, -0.910888671875, -0.4847412109375, -0.05859375, 0.3675537109375, 0.793701171875, 1.2198486328125, 1.64599609375, 2.0721435546875, 2.498291015625, 2.9244384765625, 3.3505859375, 3.7767333984375, 4.202880859375, 4.6290283203125, 5.05517578125, 5.4813232421875, 5.907470703125, 6.3336181640625, 6.759765625, 7.1859130859375, 7.612060546875, 8.0382080078125, 8.46435546875, 8.8905029296875, 9.316650390625, 9.7427978515625, 10.1689453125, 10.5950927734375, 11.021240234375, 11.4473876953125, 11.87353515625, 12.2996826171875, 12.725830078125, 13.1519775390625, 13.578125]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 8.0, 10.0, 9.0, 33.0, 22.0, 40.0, 83.0, 126.0, 170.0, 257.0, 374.0, 635.0, 940.0, 1479.0, 2282.0, 3435.0, 5354.0, 8812.0, 13976.0, 22256.0, 34693.0, 54070.0, 80038.0, 110979.0, 136119.0, 143837.0, 128787.0, 100364.0, 70818.0, 46874.0, 30132.0, 18895.0, 11858.0, 7509.0, 4688.0, 2991.0, 1937.0, 1263.0, 839.0, 495.0, 366.0, 234.0, 166.0, 100.0, 71.0, 42.0, 27.0, 17.0, 22.0, 7.0, 7.0, 2.0, 6.0, 1.0, 1.0, 2.0], "bins": [-15.71875, -15.2471923828125, -14.775634765625, -14.3040771484375, -13.83251953125, -13.3609619140625, -12.889404296875, -12.4178466796875, -11.9462890625, -11.4747314453125, -11.003173828125, -10.5316162109375, -10.06005859375, -9.5885009765625, -9.116943359375, -8.6453857421875, -8.173828125, -7.7022705078125, -7.230712890625, -6.7591552734375, -6.28759765625, -5.8160400390625, -5.344482421875, -4.8729248046875, -4.4013671875, -3.9298095703125, -3.458251953125, -2.9866943359375, -2.51513671875, -2.0435791015625, -1.572021484375, -1.1004638671875, -0.62890625, -0.1573486328125, 0.314208984375, 0.7857666015625, 1.25732421875, 1.7288818359375, 2.200439453125, 2.6719970703125, 3.1435546875, 3.6151123046875, 4.086669921875, 4.5582275390625, 5.02978515625, 5.5013427734375, 5.972900390625, 6.4444580078125, 6.916015625, 7.3875732421875, 7.859130859375, 8.3306884765625, 8.80224609375, 9.2738037109375, 9.745361328125, 10.2169189453125, 10.6884765625, 11.1600341796875, 11.631591796875, 12.1031494140625, 12.57470703125, 13.0462646484375, 13.517822265625, 13.9893798828125, 14.4609375]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 8.0, 7.0, 10.0, 2.0, 8.0, 15.0, 14.0, 15.0, 24.0, 18.0, 22.0, 27.0, 20.0, 23.0, 25.0, 27.0, 37.0, 40.0, 36.0, 48.0, 48.0, 33.0, 35.0, 33.0, 46.0, 38.0, 32.0, 40.0, 29.0, 32.0, 30.0, 18.0, 18.0, 24.0, 21.0, 16.0, 13.0, 11.0, 14.0, 10.0, 10.0, 10.0, 7.0, 2.0, 3.0, 6.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.5625, -9.2626953125, -8.962890625, -8.6630859375, -8.36328125, -8.0634765625, -7.763671875, -7.4638671875, -7.1640625, -6.8642578125, -6.564453125, -6.2646484375, -5.96484375, -5.6650390625, -5.365234375, -5.0654296875, -4.765625, -4.4658203125, -4.166015625, -3.8662109375, -3.56640625, -3.2666015625, -2.966796875, -2.6669921875, -2.3671875, -2.0673828125, -1.767578125, -1.4677734375, -1.16796875, -0.8681640625, -0.568359375, -0.2685546875, 0.03125, 0.3310546875, 0.630859375, 0.9306640625, 1.23046875, 1.5302734375, 1.830078125, 2.1298828125, 2.4296875, 2.7294921875, 3.029296875, 3.3291015625, 3.62890625, 3.9287109375, 4.228515625, 4.5283203125, 4.828125, 5.1279296875, 5.427734375, 5.7275390625, 6.02734375, 6.3271484375, 6.626953125, 6.9267578125, 7.2265625, 7.5263671875, 7.826171875, 8.1259765625, 8.42578125, 8.7255859375, 9.025390625, 9.3251953125, 9.625]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 4.0, 4.0, 6.0, 7.0, 15.0, 16.0, 31.0, 40.0, 39.0, 80.0, 107.0, 161.0, 227.0, 370.0, 589.0, 878.0, 1361.0, 2229.0, 3644.0, 5635.0, 9383.0, 15194.0, 25164.0, 41815.0, 68161.0, 106358.0, 149732.0, 172437.0, 152491.0, 110288.0, 71001.0, 43615.0, 26166.0, 15668.0, 9634.0, 5921.0, 3595.0, 2341.0, 1454.0, 936.0, 588.0, 383.0, 264.0, 181.0, 96.0, 80.0, 49.0, 37.0, 22.0, 24.0, 16.0, 4.0, 4.0, 7.0, 7.0, 5.0, 1.0, 1.0, 3.0, 1.0, 2.0], "bins": [-4.453125, -4.30731201171875, -4.1614990234375, -4.01568603515625, -3.869873046875, -3.72406005859375, -3.5782470703125, -3.43243408203125, -3.28662109375, -3.14080810546875, -2.9949951171875, -2.84918212890625, -2.703369140625, -2.55755615234375, -2.4117431640625, -2.26593017578125, -2.1201171875, -1.97430419921875, -1.8284912109375, -1.68267822265625, -1.536865234375, -1.39105224609375, -1.2452392578125, -1.09942626953125, -0.95361328125, -0.80780029296875, -0.6619873046875, -0.51617431640625, -0.370361328125, -0.22454833984375, -0.0787353515625, 0.06707763671875, 0.212890625, 0.35870361328125, 0.5045166015625, 0.65032958984375, 0.796142578125, 0.94195556640625, 1.0877685546875, 1.23358154296875, 1.37939453125, 1.52520751953125, 1.6710205078125, 1.81683349609375, 1.962646484375, 2.10845947265625, 2.2542724609375, 2.40008544921875, 2.5458984375, 2.69171142578125, 2.8375244140625, 2.98333740234375, 3.129150390625, 3.27496337890625, 3.4207763671875, 3.56658935546875, 3.71240234375, 3.85821533203125, 4.0040283203125, 4.14984130859375, 4.295654296875, 4.44146728515625, 4.5872802734375, 4.73309326171875, 4.87890625]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 2.0, 6.0, 10.0, 16.0, 14.0, 20.0, 15.0, 22.0, 30.0, 31.0, 33.0, 40.0, 41.0, 47.0, 68.0, 66.0, 60.0, 53.0, 56.0, 56.0, 46.0, 32.0, 51.0, 32.0, 28.0, 24.0, 19.0, 20.0, 17.0, 6.0, 7.0, 7.0, 8.0, 5.0, 5.0, 3.0, 1.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0004067420959472656, -0.00039353594183921814, -0.00038032978773117065, -0.00036712363362312317, -0.0003539174795150757, -0.0003407113254070282, -0.0003275051712989807, -0.00031429901719093323, -0.00030109286308288574, -0.00028788670897483826, -0.00027468055486679077, -0.0002614744007587433, -0.0002482682466506958, -0.00023506209254264832, -0.00022185593843460083, -0.00020864978432655334, -0.00019544363021850586, -0.00018223747611045837, -0.0001690313220024109, -0.0001558251678943634, -0.00014261901378631592, -0.00012941285967826843, -0.00011620670557022095, -0.00010300055146217346, -8.979439735412598e-05, -7.658824324607849e-05, -6.3382089138031e-05, -5.017593502998352e-05, -3.6969780921936035e-05, -2.376362681388855e-05, -1.0557472705841064e-05, 2.648681402206421e-06, 1.5854835510253906e-05, 2.906098961830139e-05, 4.226714372634888e-05, 5.547329783439636e-05, 6.867945194244385e-05, 8.188560605049133e-05, 9.509176015853882e-05, 0.0001082979142665863, 0.00012150406837463379, 0.00013471022248268127, 0.00014791637659072876, 0.00016112253069877625, 0.00017432868480682373, 0.00018753483891487122, 0.0002007409930229187, 0.0002139471471309662, 0.00022715330123901367, 0.00024035945534706116, 0.00025356560945510864, 0.00026677176356315613, 0.0002799779176712036, 0.0002931840717792511, 0.0003063902258872986, 0.00031959637999534607, 0.00033280253410339355, 0.00034600868821144104, 0.0003592148423194885, 0.000372420996427536, 0.0003856271505355835, 0.000398833304643631, 0.00041203945875167847, 0.00042524561285972595, 0.00043845176696777344]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 7.0, 12.0, 10.0, 21.0, 33.0, 39.0, 65.0, 92.0, 143.0, 232.0, 336.0, 532.0, 836.0, 1351.0, 2029.0, 3419.0, 5315.0, 8502.0, 13850.0, 22081.0, 35553.0, 57035.0, 86963.0, 124301.0, 152779.0, 155129.0, 128494.0, 90378.0, 59583.0, 37807.0, 23338.0, 14185.0, 8969.0, 5542.0, 3555.0, 2196.0, 1334.0, 871.0, 579.0, 341.0, 244.0, 158.0, 108.0, 73.0, 42.0, 41.0, 25.0, 9.0, 9.0, 8.0, 8.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.1875, -4.04815673828125, -3.9088134765625, -3.76947021484375, -3.630126953125, -3.49078369140625, -3.3514404296875, -3.21209716796875, -3.07275390625, -2.93341064453125, -2.7940673828125, -2.65472412109375, -2.515380859375, -2.37603759765625, -2.2366943359375, -2.09735107421875, -1.9580078125, -1.81866455078125, -1.6793212890625, -1.53997802734375, -1.400634765625, -1.26129150390625, -1.1219482421875, -0.98260498046875, -0.84326171875, -0.70391845703125, -0.5645751953125, -0.42523193359375, -0.285888671875, -0.14654541015625, -0.0072021484375, 0.13214111328125, 0.271484375, 0.41082763671875, 0.5501708984375, 0.68951416015625, 0.828857421875, 0.96820068359375, 1.1075439453125, 1.24688720703125, 1.38623046875, 1.52557373046875, 1.6649169921875, 1.80426025390625, 1.943603515625, 2.08294677734375, 2.2222900390625, 2.36163330078125, 2.5009765625, 2.64031982421875, 2.7796630859375, 2.91900634765625, 3.058349609375, 3.19769287109375, 3.3370361328125, 3.47637939453125, 3.61572265625, 3.75506591796875, 3.8944091796875, 4.03375244140625, 4.173095703125, 4.31243896484375, 4.4517822265625, 4.59112548828125, 4.73046875]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 4.0, 4.0, 9.0, 4.0, 6.0, 8.0, 14.0, 9.0, 18.0, 13.0, 17.0, 19.0, 29.0, 34.0, 37.0, 36.0, 44.0, 39.0, 49.0, 50.0, 60.0, 46.0, 50.0, 47.0, 49.0, 42.0, 30.0, 46.0, 29.0, 24.0, 24.0, 17.0, 16.0, 19.0, 9.0, 11.0, 4.0, 4.0, 6.0, 9.0, 8.0, 3.0, 2.0, 1.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6083984375, -1.5534515380859375, -1.498504638671875, -1.4435577392578125, -1.38861083984375, -1.3336639404296875, -1.278717041015625, -1.2237701416015625, -1.1688232421875, -1.1138763427734375, -1.058929443359375, -1.0039825439453125, -0.94903564453125, -0.8940887451171875, -0.839141845703125, -0.7841949462890625, -0.729248046875, -0.6743011474609375, -0.619354248046875, -0.5644073486328125, -0.50946044921875, -0.4545135498046875, -0.399566650390625, -0.3446197509765625, -0.2896728515625, -0.2347259521484375, -0.179779052734375, -0.1248321533203125, -0.06988525390625, -0.0149383544921875, 0.040008544921875, 0.0949554443359375, 0.14990234375, 0.2048492431640625, 0.259796142578125, 0.3147430419921875, 0.36968994140625, 0.4246368408203125, 0.479583740234375, 0.5345306396484375, 0.5894775390625, 0.6444244384765625, 0.699371337890625, 0.7543182373046875, 0.80926513671875, 0.8642120361328125, 0.919158935546875, 0.9741058349609375, 1.029052734375, 1.0839996337890625, 1.138946533203125, 1.1938934326171875, 1.24884033203125, 1.3037872314453125, 1.358734130859375, 1.4136810302734375, 1.4686279296875, 1.5235748291015625, 1.578521728515625, 1.6334686279296875, 1.68841552734375, 1.7433624267578125, 1.798309326171875, 1.8532562255859375, 1.908203125]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 5.0, 5.0, 11.0, 9.0, 11.0, 21.0, 21.0, 25.0, 28.0, 39.0, 49.0, 44.0, 63.0, 64.0, 55.0, 61.0, 60.0, 63.0, 51.0, 67.0, 41.0, 32.0, 36.0, 24.0, 32.0, 18.0, 14.0, 12.0, 10.0, 5.0, 5.0, 3.0, 4.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.917743682861328, -17.398929595947266, -16.880115509033203, -16.36130142211914, -15.842487335205078, -15.323673248291016, -14.80486011505127, -14.286046028137207, -13.767231941223145, -13.248417854309082, -12.72960376739502, -12.210789680480957, -11.691976547241211, -11.173162460327148, -10.654348373413086, -10.135534286499023, -9.616720199584961, -9.097906112670898, -8.579092025756836, -8.060277938842773, -7.541464328765869, -7.022650241851807, -6.503836631774902, -5.98502254486084, -5.466208457946777, -4.947394371032715, -4.428580284118652, -3.909766674041748, -3.3909525871276855, -2.872138500213623, -2.3533246517181396, -1.8345108032226562, -1.3156976699829102, -0.7968837022781372, -0.27806973457336426, 0.2407442331314087, 0.7595582008361816, 1.2783722877502441, 1.7971861362457275, 2.315999984741211, 2.8348140716552734, 3.353628158569336, 3.8724420070648193, 4.391255855560303, 4.910069942474365, 5.428884029388428, 5.947697639465332, 6.4665117263793945, 6.985325813293457, 7.5041399002075195, 8.022953987121582, 8.541768074035645, 9.06058120727539, 9.579395294189453, 10.098209381103516, 10.617023468017578, 11.13583755493164, 11.654651641845703, 12.173465728759766, 12.692279815673828, 13.21109390258789, 13.729907989501953, 14.2487211227417, 14.767535209655762, 15.286349296569824]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 3.0, 8.0, 7.0, 6.0, 4.0, 12.0, 20.0, 9.0, 26.0, 19.0, 22.0, 19.0, 26.0, 21.0, 28.0, 47.0, 29.0, 30.0, 35.0, 34.0, 37.0, 44.0, 33.0, 33.0, 44.0, 29.0, 42.0, 37.0, 27.0, 44.0, 35.0, 30.0, 21.0, 17.0, 16.0, 18.0, 25.0, 15.0, 9.0, 6.0, 12.0, 7.0, 5.0, 1.0, 3.0, 4.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-15.75961971282959, -15.26988410949707, -14.78014850616455, -14.290412902832031, -13.800678253173828, -13.310941696166992, -12.821207046508789, -12.33147144317627, -11.84173583984375, -11.35200023651123, -10.862264633178711, -10.372529029846191, -9.882793426513672, -9.393058776855469, -8.90332317352295, -8.41358757019043, -7.92385196685791, -7.434116363525391, -6.944380760192871, -6.45464563369751, -5.96491003036499, -5.475174427032471, -4.985439300537109, -4.49570369720459, -4.00596809387207, -3.516232490539551, -3.0264971256256104, -2.53676176071167, -2.0470261573791504, -1.5572905540466309, -1.0675551891326904, -0.57781982421875, -0.08808422088623047, 0.4016512632369995, 0.8913867473602295, 1.3811222314834595, 1.8708577156066895, 2.360593318939209, 2.8503286838531494, 3.34006404876709, 3.8297996520996094, 4.319535255432129, 4.809270858764648, 5.29900598526001, 5.788741588592529, 6.278477191925049, 6.76821231842041, 7.25794792175293, 7.747683525085449, 8.237419128417969, 8.727154731750488, 9.216890335083008, 9.706624984741211, 10.196361541748047, 10.68609619140625, 11.17583179473877, 11.665567398071289, 12.155303001403809, 12.645038604736328, 13.134774208068848, 13.624509811401367, 14.11424446105957, 14.60398006439209, 15.09371566772461, 15.583451271057129]}, "gradients/decoder.bert.encoder.layer.20.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 6.0, 10.0, 14.0, 26.0, 29.0, 45.0, 62.0, 111.0, 186.0, 271.0, 473.0, 702.0, 1155.0, 1747.0, 2780.0, 4482.0, 7040.0, 10771.0, 17391.0, 27393.0, 42986.0, 69075.0, 108234.0, 172628.0, 267496.0, 401026.0, 544386.0, 624074.0, 578256.0, 448024.0, 309395.0, 202470.0, 129683.0, 82485.0, 51440.0, 32605.0, 20343.0, 12845.0, 8154.0, 5051.0, 3275.0, 2093.0, 1298.0, 845.0, 537.0, 321.0, 230.0, 136.0, 68.0, 54.0, 33.0, 17.0, 16.0, 10.0, 7.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-10.15625, -9.824951171875, -9.49365234375, -9.162353515625, -8.8310546875, -8.499755859375, -8.16845703125, -7.837158203125, -7.505859375, -7.174560546875, -6.84326171875, -6.511962890625, -6.1806640625, -5.849365234375, -5.51806640625, -5.186767578125, -4.85546875, -4.524169921875, -4.19287109375, -3.861572265625, -3.5302734375, -3.198974609375, -2.86767578125, -2.536376953125, -2.205078125, -1.873779296875, -1.54248046875, -1.211181640625, -0.8798828125, -0.548583984375, -0.21728515625, 0.114013671875, 0.4453125, 0.776611328125, 1.10791015625, 1.439208984375, 1.7705078125, 2.101806640625, 2.43310546875, 2.764404296875, 3.095703125, 3.427001953125, 3.75830078125, 4.089599609375, 4.4208984375, 4.752197265625, 5.08349609375, 5.414794921875, 5.74609375, 6.077392578125, 6.40869140625, 6.739990234375, 7.0712890625, 7.402587890625, 7.73388671875, 8.065185546875, 8.396484375, 8.727783203125, 9.05908203125, 9.390380859375, 9.7216796875, 10.052978515625, 10.38427734375, 10.715576171875, 11.046875]}, "gradients/decoder.bert.encoder.layer.20.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 1.0, 0.0, 5.0, 8.0, 5.0, 6.0, 9.0, 5.0, 6.0, 14.0, 10.0, 12.0, 17.0, 14.0, 17.0, 23.0, 22.0, 17.0, 20.0, 25.0, 33.0, 39.0, 34.0, 38.0, 34.0, 39.0, 27.0, 29.0, 37.0, 35.0, 40.0, 34.0, 34.0, 27.0, 36.0, 41.0, 11.0, 37.0, 18.0, 32.0, 15.0, 20.0, 17.0, 11.0, 8.0, 9.0, 10.0, 7.0, 9.0, 5.0, 5.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.1171875, -8.8170166015625, -8.516845703125, -8.2166748046875, -7.91650390625, -7.6163330078125, -7.316162109375, -7.0159912109375, -6.7158203125, -6.4156494140625, -6.115478515625, -5.8153076171875, -5.51513671875, -5.2149658203125, -4.914794921875, -4.6146240234375, -4.314453125, -4.0142822265625, -3.714111328125, -3.4139404296875, -3.11376953125, -2.8135986328125, -2.513427734375, -2.2132568359375, -1.9130859375, -1.6129150390625, -1.312744140625, -1.0125732421875, -0.71240234375, -0.4122314453125, -0.112060546875, 0.1881103515625, 0.48828125, 0.7884521484375, 1.088623046875, 1.3887939453125, 1.68896484375, 1.9891357421875, 2.289306640625, 2.5894775390625, 2.8896484375, 3.1898193359375, 3.489990234375, 3.7901611328125, 4.09033203125, 4.3905029296875, 4.690673828125, 4.9908447265625, 5.291015625, 5.5911865234375, 5.891357421875, 6.1915283203125, 6.49169921875, 6.7918701171875, 7.092041015625, 7.3922119140625, 7.6923828125, 7.9925537109375, 8.292724609375, 8.5928955078125, 8.89306640625, 9.1932373046875, 9.493408203125, 9.7935791015625, 10.09375]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 7.0, 12.0, 12.0, 33.0, 31.0, 69.0, 102.0, 183.0, 299.0, 477.0, 834.0, 1442.0, 2551.0, 4479.0, 7747.0, 13807.0, 25324.0, 44052.0, 78945.0, 137607.0, 230515.0, 364646.0, 518243.0, 637228.0, 643049.0, 533434.0, 377211.0, 240428.0, 143236.0, 82546.0, 46398.0, 25926.0, 14462.0, 8061.0, 4583.0, 2660.0, 1481.0, 883.0, 507.0, 307.0, 173.0, 107.0, 87.0, 34.0, 26.0, 17.0, 13.0, 4.0, 5.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-11.5390625, -11.1898193359375, -10.840576171875, -10.4913330078125, -10.14208984375, -9.7928466796875, -9.443603515625, -9.0943603515625, -8.7451171875, -8.3958740234375, -8.046630859375, -7.6973876953125, -7.34814453125, -6.9989013671875, -6.649658203125, -6.3004150390625, -5.951171875, -5.6019287109375, -5.252685546875, -4.9034423828125, -4.55419921875, -4.2049560546875, -3.855712890625, -3.5064697265625, -3.1572265625, -2.8079833984375, -2.458740234375, -2.1094970703125, -1.76025390625, -1.4110107421875, -1.061767578125, -0.7125244140625, -0.36328125, -0.0140380859375, 0.335205078125, 0.6844482421875, 1.03369140625, 1.3829345703125, 1.732177734375, 2.0814208984375, 2.4306640625, 2.7799072265625, 3.129150390625, 3.4783935546875, 3.82763671875, 4.1768798828125, 4.526123046875, 4.8753662109375, 5.224609375, 5.5738525390625, 5.923095703125, 6.2723388671875, 6.62158203125, 6.9708251953125, 7.320068359375, 7.6693115234375, 8.0185546875, 8.3677978515625, 8.717041015625, 9.0662841796875, 9.41552734375, 9.7647705078125, 10.114013671875, 10.4632568359375, 10.8125]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 5.0, 7.0, 7.0, 5.0, 8.0, 10.0, 8.0, 16.0, 21.0, 34.0, 45.0, 46.0, 61.0, 79.0, 76.0, 98.0, 112.0, 148.0, 130.0, 164.0, 175.0, 181.0, 216.0, 220.0, 216.0, 212.0, 215.0, 182.0, 201.0, 163.0, 168.0, 151.0, 115.0, 106.0, 81.0, 93.0, 69.0, 52.0, 36.0, 36.0, 32.0, 28.0, 11.0, 19.0, 5.0, 5.0, 6.0, 5.0, 1.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.26953125, -5.1107177734375, -4.951904296875, -4.7930908203125, -4.63427734375, -4.4754638671875, -4.316650390625, -4.1578369140625, -3.9990234375, -3.8402099609375, -3.681396484375, -3.5225830078125, -3.36376953125, -3.2049560546875, -3.046142578125, -2.8873291015625, -2.728515625, -2.5697021484375, -2.410888671875, -2.2520751953125, -2.09326171875, -1.9344482421875, -1.775634765625, -1.6168212890625, -1.4580078125, -1.2991943359375, -1.140380859375, -0.9815673828125, -0.82275390625, -0.6639404296875, -0.505126953125, -0.3463134765625, -0.1875, -0.0286865234375, 0.130126953125, 0.2889404296875, 0.44775390625, 0.6065673828125, 0.765380859375, 0.9241943359375, 1.0830078125, 1.2418212890625, 1.400634765625, 1.5594482421875, 1.71826171875, 1.8770751953125, 2.035888671875, 2.1947021484375, 2.353515625, 2.5123291015625, 2.671142578125, 2.8299560546875, 2.98876953125, 3.1475830078125, 3.306396484375, 3.4652099609375, 3.6240234375, 3.7828369140625, 3.941650390625, 4.1004638671875, 4.25927734375, 4.4180908203125, 4.576904296875, 4.7357177734375, 4.89453125]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 6.0, 2.0, 9.0, 7.0, 2.0, 7.0, 11.0, 13.0, 12.0, 15.0, 22.0, 25.0, 29.0, 37.0, 30.0, 50.0, 60.0, 43.0, 41.0, 55.0, 54.0, 53.0, 44.0, 60.0, 46.0, 61.0, 32.0, 42.0, 18.0, 20.0, 20.0, 15.0, 18.0, 9.0, 8.0, 10.0, 6.0, 7.0, 1.0, 3.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.890774726867676, -10.520845413208008, -10.150915145874023, -9.780985832214355, -9.411056518554688, -9.041126251220703, -8.671196937561035, -8.301267623901367, -7.931337356567383, -7.561407566070557, -7.1914777755737305, -6.8215484619140625, -6.451618671417236, -6.08168888092041, -5.711759567260742, -5.341829776763916, -4.97189998626709, -4.601970195770264, -4.2320404052734375, -3.8621110916137695, -3.4921813011169434, -3.122251510620117, -2.75232195854187, -2.382392406463623, -2.012462615966797, -1.6425329446792603, -1.2726032733917236, -0.902673602104187, -0.5327439308166504, -0.16281425952911377, 0.20711541175842285, 0.5770449638366699, 0.9469738006591797, 1.3169034719467163, 1.686833143234253, 2.0567626953125, 2.426692485809326, 2.7966222763061523, 3.1665518283843994, 3.5364813804626465, 3.9064111709594727, 4.276340961456299, 4.646270751953125, 5.016200065612793, 5.386129856109619, 5.756059646606445, 6.125988960266113, 6.4959187507629395, 6.865848541259766, 7.235778331756592, 7.605708122253418, 7.975637435913086, 8.34556770324707, 8.715497016906738, 9.085426330566406, 9.45535659790039, 9.825285911560059, 10.195215225219727, 10.565145492553711, 10.935074806213379, 11.305004119873047, 11.674934387207031, 12.0448637008667, 12.414793014526367, 12.784723281860352]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 3.0, 2.0, 5.0, 6.0, 1.0, 6.0, 9.0, 9.0, 13.0, 12.0, 13.0, 16.0, 20.0, 29.0, 25.0, 29.0, 27.0, 29.0, 26.0, 35.0, 36.0, 45.0, 31.0, 34.0, 36.0, 27.0, 26.0, 34.0, 36.0, 41.0, 30.0, 30.0, 37.0, 25.0, 36.0, 29.0, 22.0, 26.0, 17.0, 17.0, 14.0, 15.0, 8.0, 6.0, 6.0, 6.0, 5.0, 8.0, 3.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-12.173113822937012, -11.782267570495605, -11.3914213180542, -11.000574111938477, -10.60972785949707, -10.218881607055664, -9.828035354614258, -9.437189102172852, -9.046341896057129, -8.655495643615723, -8.264649391174316, -7.873802661895752, -7.4829559326171875, -7.092109680175781, -6.701263427734375, -6.3104166984558105, -5.919570446014404, -5.528724193572998, -5.137877464294434, -4.747031211853027, -4.356184482574463, -3.9653382301330566, -3.5744917392730713, -3.183645248413086, -2.7927987575531006, -2.4019522666931152, -2.01110577583313, -1.620259404182434, -1.2294129133224487, -0.8385664224624634, -0.4477200508117676, -0.05687355995178223, 0.3339729309082031, 0.7248194217681885, 1.1156659126281738, 1.5065122842788696, 1.897358775138855, 2.288205146789551, 2.679051637649536, 3.0698981285095215, 3.460744619369507, 3.851591110229492, 4.242437362670898, 4.633284091949463, 5.024130344390869, 5.414977073669434, 5.80582332611084, 6.196669578552246, 6.5875163078308105, 6.978362560272217, 7.369209289550781, 7.7600555419921875, 8.150901794433594, 8.541749000549316, 8.932595252990723, 9.323441505432129, 9.714287757873535, 10.105134010314941, 10.495980262756348, 10.88682746887207, 11.277673721313477, 11.668519973754883, 12.059366226196289, 12.450212478637695, 12.841059684753418]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 9.0, 11.0, 17.0, 20.0, 42.0, 40.0, 92.0, 101.0, 186.0, 276.0, 400.0, 573.0, 925.0, 1494.0, 2327.0, 3681.0, 5883.0, 9329.0, 15080.0, 24732.0, 40764.0, 65893.0, 105658.0, 163748.0, 196930.0, 153757.0, 98079.0, 60978.0, 37223.0, 22927.0, 14011.0, 8748.0, 5345.0, 3273.0, 2076.0, 1354.0, 855.0, 577.0, 381.0, 249.0, 159.0, 98.0, 87.0, 60.0, 33.0, 25.0, 16.0, 11.0, 12.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0], "bins": [-3.34765625, -3.244384765625, -3.14111328125, -3.037841796875, -2.9345703125, -2.831298828125, -2.72802734375, -2.624755859375, -2.521484375, -2.418212890625, -2.31494140625, -2.211669921875, -2.1083984375, -2.005126953125, -1.90185546875, -1.798583984375, -1.6953125, -1.592041015625, -1.48876953125, -1.385498046875, -1.2822265625, -1.178955078125, -1.07568359375, -0.972412109375, -0.869140625, -0.765869140625, -0.66259765625, -0.559326171875, -0.4560546875, -0.352783203125, -0.24951171875, -0.146240234375, -0.04296875, 0.060302734375, 0.16357421875, 0.266845703125, 0.3701171875, 0.473388671875, 0.57666015625, 0.679931640625, 0.783203125, 0.886474609375, 0.98974609375, 1.093017578125, 1.1962890625, 1.299560546875, 1.40283203125, 1.506103515625, 1.609375, 1.712646484375, 1.81591796875, 1.919189453125, 2.0224609375, 2.125732421875, 2.22900390625, 2.332275390625, 2.435546875, 2.538818359375, 2.64208984375, 2.745361328125, 2.8486328125, 2.951904296875, 3.05517578125, 3.158447265625, 3.26171875]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 5.0, 3.0, 4.0, 12.0, 5.0, 10.0, 7.0, 15.0, 9.0, 19.0, 15.0, 16.0, 16.0, 21.0, 28.0, 24.0, 35.0, 35.0, 37.0, 30.0, 42.0, 33.0, 34.0, 27.0, 35.0, 34.0, 34.0, 34.0, 40.0, 33.0, 35.0, 33.0, 27.0, 35.0, 29.0, 17.0, 30.0, 16.0, 19.0, 12.0, 10.0, 11.0, 7.0, 6.0, 11.0, 7.0, 1.0, 3.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-12.015625, -11.6214599609375, -11.227294921875, -10.8331298828125, -10.43896484375, -10.0447998046875, -9.650634765625, -9.2564697265625, -8.8623046875, -8.4681396484375, -8.073974609375, -7.6798095703125, -7.28564453125, -6.8914794921875, -6.497314453125, -6.1031494140625, -5.708984375, -5.3148193359375, -4.920654296875, -4.5264892578125, -4.13232421875, -3.7381591796875, -3.343994140625, -2.9498291015625, -2.5556640625, -2.1614990234375, -1.767333984375, -1.3731689453125, -0.97900390625, -0.5848388671875, -0.190673828125, 0.2034912109375, 0.59765625, 0.9918212890625, 1.385986328125, 1.7801513671875, 2.17431640625, 2.5684814453125, 2.962646484375, 3.3568115234375, 3.7509765625, 4.1451416015625, 4.539306640625, 4.9334716796875, 5.32763671875, 5.7218017578125, 6.115966796875, 6.5101318359375, 6.904296875, 7.2984619140625, 7.692626953125, 8.0867919921875, 8.48095703125, 8.8751220703125, 9.269287109375, 9.6634521484375, 10.0576171875, 10.4517822265625, 10.845947265625, 11.2401123046875, 11.63427734375, 12.0284423828125, 12.422607421875, 12.8167724609375, 13.2109375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 9.0, 11.0, 12.0, 24.0, 46.0, 68.0, 102.0, 178.0, 255.0, 462.0, 769.0, 1389.0, 2298.0, 4152.0, 6983.0, 12662.0, 23422.0, 42726.0, 79322.0, 141927.0, 228530.0, 215251.0, 129890.0, 71766.0, 38769.0, 20761.0, 11587.0, 6440.0, 3612.0, 2066.0, 1283.0, 711.0, 419.0, 258.0, 144.0, 90.0, 63.0, 33.0, 26.0, 16.0, 6.0, 6.0, 5.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-3.291015625, -3.1910400390625, -3.091064453125, -2.9910888671875, -2.89111328125, -2.7911376953125, -2.691162109375, -2.5911865234375, -2.4912109375, -2.3912353515625, -2.291259765625, -2.1912841796875, -2.09130859375, -1.9913330078125, -1.891357421875, -1.7913818359375, -1.69140625, -1.5914306640625, -1.491455078125, -1.3914794921875, -1.29150390625, -1.1915283203125, -1.091552734375, -0.9915771484375, -0.8916015625, -0.7916259765625, -0.691650390625, -0.5916748046875, -0.49169921875, -0.3917236328125, -0.291748046875, -0.1917724609375, -0.091796875, 0.0081787109375, 0.108154296875, 0.2081298828125, 0.30810546875, 0.4080810546875, 0.508056640625, 0.6080322265625, 0.7080078125, 0.8079833984375, 0.907958984375, 1.0079345703125, 1.10791015625, 1.2078857421875, 1.307861328125, 1.4078369140625, 1.5078125, 1.6077880859375, 1.707763671875, 1.8077392578125, 1.90771484375, 2.0076904296875, 2.107666015625, 2.2076416015625, 2.3076171875, 2.4075927734375, 2.507568359375, 2.6075439453125, 2.70751953125, 2.8074951171875, 2.907470703125, 3.0074462890625, 3.107421875]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 8.0, 10.0, 5.0, 8.0, 12.0, 19.0, 9.0, 19.0, 20.0, 22.0, 28.0, 20.0, 33.0, 32.0, 34.0, 28.0, 31.0, 39.0, 31.0, 43.0, 31.0, 44.0, 48.0, 23.0, 32.0, 38.0, 31.0, 25.0, 28.0, 28.0, 32.0, 29.0, 21.0, 19.0, 17.0, 23.0, 13.0, 9.0, 6.0, 13.0, 7.0, 2.0, 3.0, 5.0, 8.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 3.0], "bins": [-8.4453125, -8.180419921875, -7.91552734375, -7.650634765625, -7.3857421875, -7.120849609375, -6.85595703125, -6.591064453125, -6.326171875, -6.061279296875, -5.79638671875, -5.531494140625, -5.2666015625, -5.001708984375, -4.73681640625, -4.471923828125, -4.20703125, -3.942138671875, -3.67724609375, -3.412353515625, -3.1474609375, -2.882568359375, -2.61767578125, -2.352783203125, -2.087890625, -1.822998046875, -1.55810546875, -1.293212890625, -1.0283203125, -0.763427734375, -0.49853515625, -0.233642578125, 0.03125, 0.296142578125, 0.56103515625, 0.825927734375, 1.0908203125, 1.355712890625, 1.62060546875, 1.885498046875, 2.150390625, 2.415283203125, 2.68017578125, 2.945068359375, 3.2099609375, 3.474853515625, 3.73974609375, 4.004638671875, 4.26953125, 4.534423828125, 4.79931640625, 5.064208984375, 5.3291015625, 5.593994140625, 5.85888671875, 6.123779296875, 6.388671875, 6.653564453125, 6.91845703125, 7.183349609375, 7.4482421875, 7.713134765625, 7.97802734375, 8.242919921875, 8.5078125]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 7.0, 12.0, 11.0, 28.0, 35.0, 47.0, 89.0, 115.0, 151.0, 291.0, 394.0, 519.0, 959.0, 1347.0, 2278.0, 3830.0, 6488.0, 10998.0, 19991.0, 36109.0, 67521.0, 126344.0, 221558.0, 239469.0, 141079.0, 76118.0, 40604.0, 21825.0, 12250.0, 6968.0, 4226.0, 2558.0, 1580.0, 946.0, 606.0, 409.0, 256.0, 169.0, 105.0, 86.0, 51.0, 43.0, 30.0, 22.0, 10.0, 11.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.4296875, -0.41629791259765625, -0.4029083251953125, -0.38951873779296875, -0.376129150390625, -0.36273956298828125, -0.3493499755859375, -0.33596038818359375, -0.32257080078125, -0.30918121337890625, -0.2957916259765625, -0.28240203857421875, -0.269012451171875, -0.25562286376953125, -0.2422332763671875, -0.22884368896484375, -0.2154541015625, -0.20206451416015625, -0.1886749267578125, -0.17528533935546875, -0.161895751953125, -0.14850616455078125, -0.1351165771484375, -0.12172698974609375, -0.10833740234375, -0.09494781494140625, -0.0815582275390625, -0.06816864013671875, -0.054779052734375, -0.04138946533203125, -0.0279998779296875, -0.01461029052734375, -0.001220703125, 0.01216888427734375, 0.0255584716796875, 0.03894805908203125, 0.052337646484375, 0.06572723388671875, 0.0791168212890625, 0.09250640869140625, 0.10589599609375, 0.11928558349609375, 0.1326751708984375, 0.14606475830078125, 0.159454345703125, 0.17284393310546875, 0.1862335205078125, 0.19962310791015625, 0.2130126953125, 0.22640228271484375, 0.2397918701171875, 0.25318145751953125, 0.266571044921875, 0.27996063232421875, 0.2933502197265625, 0.30673980712890625, 0.32012939453125, 0.33351898193359375, 0.3469085693359375, 0.36029815673828125, 0.373687744140625, 0.38707733154296875, 0.4004669189453125, 0.41385650634765625, 0.42724609375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 3.0, 2.0, 1.0, 9.0, 9.0, 10.0, 11.0, 10.0, 20.0, 24.0, 21.0, 37.0, 47.0, 73.0, 94.0, 100.0, 121.0, 101.0, 80.0, 65.0, 34.0, 28.0, 17.0, 19.0, 11.0, 9.0, 7.0, 5.0, 11.0, 6.0, 9.0, 3.0, 3.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00012969970703125, -0.00012600235641002655, -0.0001223050057888031, -0.00011860765516757965, -0.0001149103045463562, -0.00011121295392513275, -0.0001075156033039093, -0.00010381825268268585, -0.0001001209020614624, -9.642355144023895e-05, -9.27262008190155e-05, -8.902885019779205e-05, -8.53314995765686e-05, -8.163414895534515e-05, -7.79367983341217e-05, -7.423944771289825e-05, -7.05420970916748e-05, -6.684474647045135e-05, -6.31473958492279e-05, -5.9450045228004456e-05, -5.5752694606781006e-05, -5.2055343985557556e-05, -4.8357993364334106e-05, -4.466064274311066e-05, -4.096329212188721e-05, -3.726594150066376e-05, -3.356859087944031e-05, -2.9871240258216858e-05, -2.6173889636993408e-05, -2.247653901576996e-05, -1.877918839454651e-05, -1.5081837773323059e-05, -1.138448715209961e-05, -7.68713653087616e-06, -3.98978590965271e-06, -2.9243528842926025e-07, 3.4049153327941895e-06, 7.102265954017639e-06, 1.0799616575241089e-05, 1.4496967196464539e-05, 1.8194317817687988e-05, 2.1891668438911438e-05, 2.5589019060134888e-05, 2.9286369681358337e-05, 3.298372030258179e-05, 3.668107092380524e-05, 4.0378421545028687e-05, 4.4075772166252136e-05, 4.7773122787475586e-05, 5.1470473408699036e-05, 5.5167824029922485e-05, 5.8865174651145935e-05, 6.256252527236938e-05, 6.625987589359283e-05, 6.995722651481628e-05, 7.365457713603973e-05, 7.735192775726318e-05, 8.104927837848663e-05, 8.474662899971008e-05, 8.844397962093353e-05, 9.214133024215698e-05, 9.583868086338043e-05, 9.953603148460388e-05, 0.00010323338210582733, 0.00010693073272705078]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.weight": {"_type": "histogram", "values": [4.0, 2.0, 3.0, 2.0, 3.0, 1.0, 11.0, 12.0, 19.0, 30.0, 43.0, 59.0, 113.0, 154.0, 210.0, 279.0, 459.0, 639.0, 1015.0, 1539.0, 2165.0, 3299.0, 4971.0, 7584.0, 11356.0, 17527.0, 27295.0, 42802.0, 67432.0, 105626.0, 165007.0, 198610.0, 140163.0, 89722.0, 57179.0, 35770.0, 23229.0, 14729.0, 9791.0, 6554.0, 4300.0, 2800.0, 1984.0, 1374.0, 893.0, 587.0, 404.0, 258.0, 170.0, 130.0, 93.0, 58.0, 37.0, 26.0, 20.0, 10.0, 5.0, 6.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.53662109375, -0.5194854736328125, -0.502349853515625, -0.4852142333984375, -0.46807861328125, -0.4509429931640625, -0.433807373046875, -0.4166717529296875, -0.3995361328125, -0.3824005126953125, -0.365264892578125, -0.3481292724609375, -0.33099365234375, -0.3138580322265625, -0.296722412109375, -0.2795867919921875, -0.262451171875, -0.2453155517578125, -0.228179931640625, -0.2110443115234375, -0.19390869140625, -0.1767730712890625, -0.159637451171875, -0.1425018310546875, -0.1253662109375, -0.1082305908203125, -0.091094970703125, -0.0739593505859375, -0.05682373046875, -0.0396881103515625, -0.022552490234375, -0.0054168701171875, 0.01171875, 0.0288543701171875, 0.045989990234375, 0.0631256103515625, 0.08026123046875, 0.0973968505859375, 0.114532470703125, 0.1316680908203125, 0.1488037109375, 0.1659393310546875, 0.183074951171875, 0.2002105712890625, 0.21734619140625, 0.2344818115234375, 0.251617431640625, 0.2687530517578125, 0.285888671875, 0.3030242919921875, 0.320159912109375, 0.3372955322265625, 0.35443115234375, 0.3715667724609375, 0.388702392578125, 0.4058380126953125, 0.4229736328125, 0.4401092529296875, 0.457244873046875, 0.4743804931640625, 0.49151611328125, 0.5086517333984375, 0.525787353515625, 0.5429229736328125, 0.56005859375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 4.0, 7.0, 14.0, 8.0, 14.0, 13.0, 17.0, 24.0, 24.0, 34.0, 39.0, 38.0, 43.0, 50.0, 53.0, 54.0, 52.0, 60.0, 63.0, 53.0, 61.0, 44.0, 42.0, 34.0, 29.0, 22.0, 20.0, 19.0, 12.0, 11.0, 8.0, 7.0, 4.0, 5.0, 7.0, 3.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.205078125, -0.19904708862304688, -0.19301605224609375, -0.18698501586914062, -0.1809539794921875, -0.17492294311523438, -0.16889190673828125, -0.16286087036132812, -0.156829833984375, -0.15079879760742188, -0.14476776123046875, -0.13873672485351562, -0.1327056884765625, -0.12667465209960938, -0.12064361572265625, -0.11461257934570312, -0.10858154296875, -0.10255050659179688, -0.09651947021484375, -0.09048843383789062, -0.0844573974609375, -0.07842636108398438, -0.07239532470703125, -0.06636428833007812, -0.060333251953125, -0.054302215576171875, -0.04827117919921875, -0.042240142822265625, -0.0362091064453125, -0.030178070068359375, -0.02414703369140625, -0.018115997314453125, -0.0120849609375, -0.006053924560546875, -2.288818359375e-05, 0.006008148193359375, 0.0120391845703125, 0.018070220947265625, 0.02410125732421875, 0.030132293701171875, 0.036163330078125, 0.042194366455078125, 0.04822540283203125, 0.054256439208984375, 0.0602874755859375, 0.06631851196289062, 0.07234954833984375, 0.07838058471679688, 0.08441162109375, 0.09044265747070312, 0.09647369384765625, 0.10250473022460938, 0.1085357666015625, 0.11456680297851562, 0.12059783935546875, 0.12662887573242188, 0.132659912109375, 0.13869094848632812, 0.14472198486328125, 0.15075302124023438, 0.1567840576171875, 0.16281509399414062, 0.16884613037109375, 0.17487716674804688, 0.180908203125]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 7.0, 8.0, 4.0, 10.0, 10.0, 9.0, 12.0, 13.0, 21.0, 26.0, 23.0, 47.0, 42.0, 42.0, 55.0, 42.0, 48.0, 62.0, 53.0, 61.0, 56.0, 52.0, 53.0, 52.0, 33.0, 31.0, 28.0, 15.0, 14.0, 18.0, 15.0, 11.0, 7.0, 6.0, 7.0, 5.0, 1.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.044512748718262, -10.664385795593262, -10.284258842468262, -9.904131889343262, -9.524004936218262, -9.143877029418945, -8.763750076293945, -8.383623123168945, -8.003496170043945, -7.623369216918945, -7.243242263793945, -6.863115310668945, -6.482987880706787, -6.102860927581787, -5.722733974456787, -5.342606544494629, -4.962480068206787, -4.582353115081787, -4.202226161956787, -3.822098970413208, -3.441971778869629, -3.061844825744629, -2.681717872619629, -2.30159068107605, -1.9214637279510498, -1.5413366556167603, -1.1612095832824707, -0.7810826301574707, -0.40095555782318115, -0.0208284854888916, 0.3592984676361084, 0.7394256591796875, 1.1195526123046875, 1.499679684638977, 1.8798067569732666, 2.2599337100982666, 2.6400609016418457, 3.0201878547668457, 3.4003148078918457, 3.780441999435425, 4.160569190979004, 4.540696144104004, 4.920823097229004, 5.300950050354004, 5.681077480316162, 6.061204433441162, 6.441331386566162, 6.82145881652832, 7.201585292816162, 7.581712245941162, 7.961839199066162, 8.34196662902832, 8.72209358215332, 9.10222053527832, 9.48234748840332, 9.86247444152832, 10.24260139465332, 10.62272834777832, 11.00285530090332, 11.38298225402832, 11.76310920715332, 12.14323616027832, 12.52336311340332, 12.903491020202637, 13.283617973327637]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 4.0, 3.0, 4.0, 6.0, 2.0, 4.0, 6.0, 13.0, 13.0, 12.0, 14.0, 15.0, 19.0, 31.0, 30.0, 25.0, 26.0, 32.0, 25.0, 31.0, 40.0, 42.0, 32.0, 37.0, 34.0, 28.0, 28.0, 30.0, 40.0, 35.0, 32.0, 34.0, 37.0, 26.0, 33.0, 31.0, 22.0, 27.0, 13.0, 17.0, 15.0, 15.0, 6.0, 6.0, 6.0, 8.0, 4.0, 7.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-12.044835090637207, -11.658997535705566, -11.273159980773926, -10.887322425842285, -10.501484870910645, -10.115647315979004, -9.72981071472168, -9.343973159790039, -8.958135604858398, -8.572298049926758, -8.186460494995117, -7.800622940063477, -7.414785385131836, -7.028947830200195, -6.643110752105713, -6.257273197174072, -5.871435165405273, -5.485597610473633, -5.099760055541992, -4.713922500610352, -4.328084945678711, -3.9422476291656494, -3.556410312652588, -3.1705727577209473, -2.7847352027893066, -2.398897647857666, -2.0130600929260254, -1.6272227764129639, -1.2413852214813232, -0.8555476665496826, -0.4697103500366211, -0.08387279510498047, 0.30196475982666016, 0.687802255153656, 1.0736397504806519, 1.459477186203003, 1.8453147411346436, 2.231152296066284, 2.6169896125793457, 3.0028271675109863, 3.388664722442627, 3.7745022773742676, 4.160339832305908, 4.546176910400391, 4.932014465332031, 5.317852020263672, 5.7036895751953125, 6.089527130126953, 6.475364685058594, 6.861202239990234, 7.247039794921875, 7.632877349853516, 8.018714904785156, 8.404552459716797, 8.790390014648438, 9.176227569580078, 9.562065124511719, 9.94790267944336, 10.333740234375, 10.71957778930664, 11.105415344238281, 11.491252899169922, 11.877090454101562, 12.262928009033203, 12.648764610290527]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 7.0, 4.0, 4.0, 12.0, 28.0, 33.0, 58.0, 96.0, 125.0, 216.0, 302.0, 499.0, 773.0, 1107.0, 1808.0, 2802.0, 4297.0, 6601.0, 10243.0, 15491.0, 23104.0, 34731.0, 49764.0, 69672.0, 92057.0, 112637.0, 123159.0, 120041.0, 104356.0, 83505.0, 61359.0, 43160.0, 29426.0, 19682.0, 13224.0, 8477.0, 5537.0, 3599.0, 2356.0, 1515.0, 905.0, 622.0, 421.0, 263.0, 186.0, 100.0, 63.0, 53.0, 36.0, 27.0, 11.0, 5.0, 2.0, 3.0, 3.0, 1.0], "bins": [-11.125, -10.8052978515625, -10.485595703125, -10.1658935546875, -9.84619140625, -9.5264892578125, -9.206787109375, -8.8870849609375, -8.5673828125, -8.2476806640625, -7.927978515625, -7.6082763671875, -7.28857421875, -6.9688720703125, -6.649169921875, -6.3294677734375, -6.009765625, -5.6900634765625, -5.370361328125, -5.0506591796875, -4.73095703125, -4.4112548828125, -4.091552734375, -3.7718505859375, -3.4521484375, -3.1324462890625, -2.812744140625, -2.4930419921875, -2.17333984375, -1.8536376953125, -1.533935546875, -1.2142333984375, -0.89453125, -0.5748291015625, -0.255126953125, 0.0645751953125, 0.38427734375, 0.7039794921875, 1.023681640625, 1.3433837890625, 1.6630859375, 1.9827880859375, 2.302490234375, 2.6221923828125, 2.94189453125, 3.2615966796875, 3.581298828125, 3.9010009765625, 4.220703125, 4.5404052734375, 4.860107421875, 5.1798095703125, 5.49951171875, 5.8192138671875, 6.138916015625, 6.4586181640625, 6.7783203125, 7.0980224609375, 7.417724609375, 7.7374267578125, 8.05712890625, 8.3768310546875, 8.696533203125, 9.0162353515625, 9.3359375]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 4.0, 5.0, 5.0, 5.0, 4.0, 3.0, 6.0, 12.0, 16.0, 11.0, 33.0, 19.0, 23.0, 23.0, 25.0, 23.0, 28.0, 34.0, 34.0, 49.0, 37.0, 28.0, 36.0, 36.0, 43.0, 29.0, 35.0, 27.0, 43.0, 33.0, 32.0, 30.0, 34.0, 39.0, 30.0, 24.0, 20.0, 18.0, 14.0, 9.0, 11.0, 5.0, 6.0, 5.0, 5.0, 6.0, 4.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.4453125, -11.063720703125, -10.68212890625, -10.300537109375, -9.9189453125, -9.537353515625, -9.15576171875, -8.774169921875, -8.392578125, -8.010986328125, -7.62939453125, -7.247802734375, -6.8662109375, -6.484619140625, -6.10302734375, -5.721435546875, -5.33984375, -4.958251953125, -4.57666015625, -4.195068359375, -3.8134765625, -3.431884765625, -3.05029296875, -2.668701171875, -2.287109375, -1.905517578125, -1.52392578125, -1.142333984375, -0.7607421875, -0.379150390625, 0.00244140625, 0.384033203125, 0.765625, 1.147216796875, 1.52880859375, 1.910400390625, 2.2919921875, 2.673583984375, 3.05517578125, 3.436767578125, 3.818359375, 4.199951171875, 4.58154296875, 4.963134765625, 5.3447265625, 5.726318359375, 6.10791015625, 6.489501953125, 6.87109375, 7.252685546875, 7.63427734375, 8.015869140625, 8.3974609375, 8.779052734375, 9.16064453125, 9.542236328125, 9.923828125, 10.305419921875, 10.68701171875, 11.068603515625, 11.4501953125, 11.831787109375, 12.21337890625, 12.594970703125, 12.9765625]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 6.0, 5.0, 11.0, 20.0, 25.0, 59.0, 89.0, 131.0, 245.0, 391.0, 646.0, 964.0, 1627.0, 2728.0, 4357.0, 7427.0, 12340.0, 20248.0, 33336.0, 53845.0, 83570.0, 120419.0, 150584.0, 156384.0, 133760.0, 97837.0, 64498.0, 40598.0, 24643.0, 14951.0, 9114.0, 5391.0, 3190.0, 2022.0, 1173.0, 725.0, 458.0, 296.0, 162.0, 119.0, 77.0, 34.0, 26.0, 11.0, 9.0, 6.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.4296875, -12.03125, -11.6328125, -11.234375, -10.8359375, -10.4375, -10.0390625, -9.640625, -9.2421875, -8.84375, -8.4453125, -8.046875, -7.6484375, -7.25, -6.8515625, -6.453125, -6.0546875, -5.65625, -5.2578125, -4.859375, -4.4609375, -4.0625, -3.6640625, -3.265625, -2.8671875, -2.46875, -2.0703125, -1.671875, -1.2734375, -0.875, -0.4765625, -0.078125, 0.3203125, 0.71875, 1.1171875, 1.515625, 1.9140625, 2.3125, 2.7109375, 3.109375, 3.5078125, 3.90625, 4.3046875, 4.703125, 5.1015625, 5.5, 5.8984375, 6.296875, 6.6953125, 7.09375, 7.4921875, 7.890625, 8.2890625, 8.6875, 9.0859375, 9.484375, 9.8828125, 10.28125, 10.6796875, 11.078125, 11.4765625, 11.875, 12.2734375, 12.671875, 13.0703125]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 9.0, 1.0, 6.0, 9.0, 14.0, 12.0, 10.0, 12.0, 13.0, 21.0, 15.0, 23.0, 29.0, 30.0, 33.0, 26.0, 54.0, 32.0, 39.0, 44.0, 38.0, 41.0, 40.0, 29.0, 33.0, 36.0, 30.0, 31.0, 28.0, 28.0, 33.0, 25.0, 20.0, 20.0, 22.0, 20.0, 10.0, 15.0, 17.0, 5.0, 14.0, 6.0, 4.0, 10.0, 7.0, 3.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0], "bins": [-8.125, -7.88507080078125, -7.6451416015625, -7.40521240234375, -7.165283203125, -6.92535400390625, -6.6854248046875, -6.44549560546875, -6.20556640625, -5.96563720703125, -5.7257080078125, -5.48577880859375, -5.245849609375, -5.00592041015625, -4.7659912109375, -4.52606201171875, -4.2861328125, -4.04620361328125, -3.8062744140625, -3.56634521484375, -3.326416015625, -3.08648681640625, -2.8465576171875, -2.60662841796875, -2.36669921875, -2.12677001953125, -1.8868408203125, -1.64691162109375, -1.406982421875, -1.16705322265625, -0.9271240234375, -0.68719482421875, -0.447265625, -0.20733642578125, 0.0325927734375, 0.27252197265625, 0.512451171875, 0.75238037109375, 0.9923095703125, 1.23223876953125, 1.47216796875, 1.71209716796875, 1.9520263671875, 2.19195556640625, 2.431884765625, 2.67181396484375, 2.9117431640625, 3.15167236328125, 3.3916015625, 3.63153076171875, 3.8714599609375, 4.11138916015625, 4.351318359375, 4.59124755859375, 4.8311767578125, 5.07110595703125, 5.31103515625, 5.55096435546875, 5.7908935546875, 6.03082275390625, 6.270751953125, 6.51068115234375, 6.7506103515625, 6.99053955078125, 7.23046875]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 3.0, 3.0, 3.0, 4.0, 6.0, 11.0, 8.0, 16.0, 27.0, 36.0, 62.0, 100.0, 126.0, 268.0, 368.0, 599.0, 1089.0, 1811.0, 3112.0, 5474.0, 10060.0, 18967.0, 35228.0, 66106.0, 118423.0, 182460.0, 209619.0, 168190.0, 102989.0, 57002.0, 30462.0, 15773.0, 8651.0, 4790.0, 2712.0, 1618.0, 955.0, 533.0, 312.0, 202.0, 133.0, 76.0, 50.0, 40.0, 24.0, 11.0, 14.0, 12.0, 7.0, 3.0, 1.0, 6.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0], "bins": [-5.2109375, -5.04998779296875, -4.8890380859375, -4.72808837890625, -4.567138671875, -4.40618896484375, -4.2452392578125, -4.08428955078125, -3.92333984375, -3.76239013671875, -3.6014404296875, -3.44049072265625, -3.279541015625, -3.11859130859375, -2.9576416015625, -2.79669189453125, -2.6357421875, -2.47479248046875, -2.3138427734375, -2.15289306640625, -1.991943359375, -1.83099365234375, -1.6700439453125, -1.50909423828125, -1.34814453125, -1.18719482421875, -1.0262451171875, -0.86529541015625, -0.704345703125, -0.54339599609375, -0.3824462890625, -0.22149658203125, -0.060546875, 0.10040283203125, 0.2613525390625, 0.42230224609375, 0.583251953125, 0.74420166015625, 0.9051513671875, 1.06610107421875, 1.22705078125, 1.38800048828125, 1.5489501953125, 1.70989990234375, 1.870849609375, 2.03179931640625, 2.1927490234375, 2.35369873046875, 2.5146484375, 2.67559814453125, 2.8365478515625, 2.99749755859375, 3.158447265625, 3.31939697265625, 3.4803466796875, 3.64129638671875, 3.80224609375, 3.96319580078125, 4.1241455078125, 4.28509521484375, 4.446044921875, 4.60699462890625, 4.7679443359375, 4.92889404296875, 5.08984375]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 1.0, 4.0, 3.0, 9.0, 2.0, 1.0, 3.0, 6.0, 11.0, 11.0, 11.0, 17.0, 19.0, 24.0, 30.0, 18.0, 28.0, 39.0, 33.0, 34.0, 43.0, 47.0, 51.0, 47.0, 59.0, 39.0, 62.0, 32.0, 47.0, 50.0, 30.0, 38.0, 23.0, 23.0, 22.0, 21.0, 15.0, 9.0, 6.0, 4.0, 7.0, 5.0, 4.0, 6.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.0003371238708496094, -0.0003277696669101715, -0.00031841546297073364, -0.0003090612590312958, -0.0002997070550918579, -0.00029035285115242004, -0.0002809986472129822, -0.0002716444432735443, -0.00026229023933410645, -0.0002529360353946686, -0.0002435818314552307, -0.00023422762751579285, -0.00022487342357635498, -0.00021551921963691711, -0.00020616501569747925, -0.00019681081175804138, -0.00018745660781860352, -0.00017810240387916565, -0.00016874819993972778, -0.00015939399600028992, -0.00015003979206085205, -0.00014068558812141418, -0.00013133138418197632, -0.00012197718024253845, -0.00011262297630310059, -0.00010326877236366272, -9.391456842422485e-05, -8.456036448478699e-05, -7.520616054534912e-05, -6.585195660591125e-05, -5.649775266647339e-05, -4.714354872703552e-05, -3.7789344787597656e-05, -2.843514084815979e-05, -1.9080936908721924e-05, -9.726732969284058e-06, -3.725290298461914e-07, 8.981674909591675e-06, 1.833587884902954e-05, 2.7690082788467407e-05, 3.7044286727905273e-05, 4.639849066734314e-05, 5.5752694606781006e-05, 6.510689854621887e-05, 7.446110248565674e-05, 8.38153064250946e-05, 9.316951036453247e-05, 0.00010252371430397034, 0.0001118779182434082, 0.00012123212218284607, 0.00013058632612228394, 0.0001399405300617218, 0.00014929473400115967, 0.00015864893794059753, 0.0001680031418800354, 0.00017735734581947327, 0.00018671154975891113, 0.000196065753698349, 0.00020541995763778687, 0.00021477416157722473, 0.0002241283655166626, 0.00023348256945610046, 0.00024283677339553833, 0.0002521909773349762, 0.00026154518127441406]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 5.0, 5.0, 8.0, 17.0, 18.0, 20.0, 30.0, 62.0, 88.0, 104.0, 188.0, 290.0, 457.0, 666.0, 1008.0, 1493.0, 2357.0, 3963.0, 6389.0, 10405.0, 17479.0, 30151.0, 52013.0, 86866.0, 135375.0, 179403.0, 177478.0, 133551.0, 84437.0, 50785.0, 29242.0, 17354.0, 10019.0, 6212.0, 3853.0, 2334.0, 1523.0, 991.0, 669.0, 408.0, 279.0, 183.0, 136.0, 84.0, 56.0, 46.0, 16.0, 20.0, 10.0, 12.0, 10.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.25, -4.10333251953125, -3.9566650390625, -3.80999755859375, -3.663330078125, -3.51666259765625, -3.3699951171875, -3.22332763671875, -3.07666015625, -2.92999267578125, -2.7833251953125, -2.63665771484375, -2.489990234375, -2.34332275390625, -2.1966552734375, -2.04998779296875, -1.9033203125, -1.75665283203125, -1.6099853515625, -1.46331787109375, -1.316650390625, -1.16998291015625, -1.0233154296875, -0.87664794921875, -0.72998046875, -0.58331298828125, -0.4366455078125, -0.28997802734375, -0.143310546875, 0.00335693359375, 0.1500244140625, 0.29669189453125, 0.443359375, 0.59002685546875, 0.7366943359375, 0.88336181640625, 1.030029296875, 1.17669677734375, 1.3233642578125, 1.47003173828125, 1.61669921875, 1.76336669921875, 1.9100341796875, 2.05670166015625, 2.203369140625, 2.35003662109375, 2.4967041015625, 2.64337158203125, 2.7900390625, 2.93670654296875, 3.0833740234375, 3.23004150390625, 3.376708984375, 3.52337646484375, 3.6700439453125, 3.81671142578125, 3.96337890625, 4.11004638671875, 4.2567138671875, 4.40338134765625, 4.550048828125, 4.69671630859375, 4.8433837890625, 4.99005126953125, 5.13671875]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 5.0, 5.0, 5.0, 5.0, 4.0, 7.0, 15.0, 10.0, 13.0, 21.0, 23.0, 27.0, 34.0, 36.0, 49.0, 52.0, 48.0, 44.0, 58.0, 51.0, 64.0, 46.0, 64.0, 50.0, 45.0, 37.0, 39.0, 30.0, 23.0, 18.0, 20.0, 11.0, 11.0, 5.0, 8.0, 6.0, 4.0, 3.0, 5.0, 2.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.107421875, -2.0464324951171875, -1.985443115234375, -1.9244537353515625, -1.86346435546875, -1.8024749755859375, -1.741485595703125, -1.6804962158203125, -1.6195068359375, -1.5585174560546875, -1.497528076171875, -1.4365386962890625, -1.37554931640625, -1.3145599365234375, -1.253570556640625, -1.1925811767578125, -1.131591796875, -1.0706024169921875, -1.009613037109375, -0.9486236572265625, -0.88763427734375, -0.8266448974609375, -0.765655517578125, -0.7046661376953125, -0.6436767578125, -0.5826873779296875, -0.521697998046875, -0.4607086181640625, -0.39971923828125, -0.3387298583984375, -0.277740478515625, -0.2167510986328125, -0.15576171875, -0.0947723388671875, -0.033782958984375, 0.0272064208984375, 0.08819580078125, 0.1491851806640625, 0.210174560546875, 0.2711639404296875, 0.3321533203125, 0.3931427001953125, 0.454132080078125, 0.5151214599609375, 0.57611083984375, 0.6371002197265625, 0.698089599609375, 0.7590789794921875, 0.820068359375, 0.8810577392578125, 0.942047119140625, 1.0030364990234375, 1.06402587890625, 1.1250152587890625, 1.186004638671875, 1.2469940185546875, 1.3079833984375, 1.3689727783203125, 1.429962158203125, 1.4909515380859375, 1.55194091796875, 1.6129302978515625, 1.673919677734375, 1.7349090576171875, 1.7958984375]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 2.0, 3.0, 3.0, 7.0, 7.0, 7.0, 13.0, 9.0, 7.0, 11.0, 20.0, 16.0, 32.0, 24.0, 34.0, 22.0, 37.0, 44.0, 56.0, 48.0, 44.0, 57.0, 42.0, 58.0, 52.0, 41.0, 39.0, 41.0, 26.0, 25.0, 34.0, 24.0, 30.0, 16.0, 16.0, 11.0, 9.0, 7.0, 6.0, 7.0, 5.0, 4.0, 2.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.165904998779297, -9.844802856445312, -9.523701667785645, -9.20259952545166, -8.881498336791992, -8.560396194458008, -8.23929500579834, -7.9181928634643555, -7.597091197967529, -7.275989532470703, -6.954887866973877, -6.633786201477051, -6.312684059143066, -5.991582870483398, -5.670480728149414, -5.349379062652588, -5.028277397155762, -4.7071757316589355, -4.386074066162109, -4.064972400665283, -3.743870496749878, -3.4227688312530518, -3.1016669273376465, -2.7805652618408203, -2.459463596343994, -2.138361930847168, -1.8172601461410522, -1.4961583614349365, -1.1750566959381104, -0.8539550304412842, -0.5328532457351685, -0.21175146102905273, 0.10934925079345703, 0.430450975894928, 0.7515527009963989, 1.0726544857025146, 1.3937561511993408, 1.714857816696167, 2.0359597206115723, 2.3570613861083984, 2.6781630516052246, 2.999264717102051, 3.320366382598877, 3.6414682865142822, 3.9625699520111084, 4.2836713790893555, 4.60477352142334, 4.925875186920166, 5.246976852416992, 5.568078517913818, 5.8891801834106445, 6.210281848907471, 6.531383514404297, 6.852485656738281, 7.173587322235107, 7.494688987731934, 7.81579065322876, 8.136892318725586, 8.45799446105957, 8.779095649719238, 9.100197792053223, 9.42129898071289, 9.742401123046875, 10.06350326538086, 10.384604454040527]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 0.0, 6.0, 8.0, 6.0, 0.0, 8.0, 10.0, 16.0, 20.0, 18.0, 18.0, 22.0, 23.0, 29.0, 29.0, 27.0, 32.0, 43.0, 39.0, 31.0, 45.0, 38.0, 41.0, 34.0, 42.0, 42.0, 40.0, 27.0, 45.0, 37.0, 41.0, 29.0, 23.0, 27.0, 18.0, 16.0, 16.0, 9.0, 13.0, 6.0, 12.0, 8.0, 3.0, 7.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-14.527395248413086, -14.108781814575195, -13.690168380737305, -13.271554946899414, -12.852941513061523, -12.434328079223633, -12.015714645385742, -11.597101211547852, -11.178487777709961, -10.75987434387207, -10.34126091003418, -9.922647476196289, -9.504034042358398, -9.085420608520508, -8.666807174682617, -8.248193740844727, -7.829580783843994, -7.4109673500061035, -6.992353916168213, -6.573740482330322, -6.155127048492432, -5.736514091491699, -5.317900657653809, -4.899287223815918, -4.480673789978027, -4.062060356140137, -3.643446922302246, -3.2248334884643555, -2.806220054626465, -2.3876068592071533, -1.9689934253692627, -1.550379991531372, -1.1317663192749023, -0.7131528854370117, -0.29453951120376587, 0.12407386302947998, 0.5426872968673706, 0.9613006114959717, 1.3799140453338623, 1.798527479171753, 2.2171409130096436, 2.635754346847534, 3.054367780685425, 3.4729809761047363, 3.891594409942627, 4.310207843780518, 4.728821277618408, 5.147434711456299, 5.5660481452941895, 5.98466157913208, 6.403275012969971, 6.821888446807861, 7.240501880645752, 7.659114837646484, 8.077728271484375, 8.496341705322266, 8.914955139160156, 9.333568572998047, 9.752182006835938, 10.170795440673828, 10.589408874511719, 11.00802230834961, 11.4266357421875, 11.84524917602539, 12.263862609863281]}, "gradients/decoder.bert.encoder.layer.19.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 2.0, 5.0, 5.0, 17.0, 19.0, 32.0, 40.0, 93.0, 136.0, 195.0, 355.0, 459.0, 751.0, 1217.0, 1860.0, 2917.0, 4516.0, 7158.0, 11396.0, 18352.0, 28887.0, 47338.0, 76895.0, 124669.0, 202194.0, 321455.0, 480628.0, 624163.0, 655135.0, 546431.0, 382897.0, 247302.0, 153888.0, 95505.0, 58808.0, 36630.0, 22895.0, 14460.0, 9044.0, 5708.0, 3602.0, 2308.0, 1443.0, 932.0, 581.0, 356.0, 245.0, 138.0, 81.0, 57.0, 42.0, 26.0, 8.0, 10.0, 1.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0], "bins": [-8.6875, -8.4093017578125, -8.131103515625, -7.8529052734375, -7.57470703125, -7.2965087890625, -7.018310546875, -6.7401123046875, -6.4619140625, -6.1837158203125, -5.905517578125, -5.6273193359375, -5.34912109375, -5.0709228515625, -4.792724609375, -4.5145263671875, -4.236328125, -3.9581298828125, -3.679931640625, -3.4017333984375, -3.12353515625, -2.8453369140625, -2.567138671875, -2.2889404296875, -2.0107421875, -1.7325439453125, -1.454345703125, -1.1761474609375, -0.89794921875, -0.6197509765625, -0.341552734375, -0.0633544921875, 0.21484375, 0.4930419921875, 0.771240234375, 1.0494384765625, 1.32763671875, 1.6058349609375, 1.884033203125, 2.1622314453125, 2.4404296875, 2.7186279296875, 2.996826171875, 3.2750244140625, 3.55322265625, 3.8314208984375, 4.109619140625, 4.3878173828125, 4.666015625, 4.9442138671875, 5.222412109375, 5.5006103515625, 5.77880859375, 6.0570068359375, 6.335205078125, 6.6134033203125, 6.8916015625, 7.1697998046875, 7.447998046875, 7.7261962890625, 8.00439453125, 8.2825927734375, 8.560791015625, 8.8389892578125, 9.1171875]}, "gradients/decoder.bert.encoder.layer.19.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 2.0, 6.0, 4.0, 3.0, 7.0, 12.0, 10.0, 18.0, 19.0, 16.0, 23.0, 21.0, 30.0, 28.0, 23.0, 37.0, 36.0, 36.0, 40.0, 47.0, 41.0, 44.0, 41.0, 43.0, 54.0, 36.0, 28.0, 31.0, 31.0, 44.0, 32.0, 24.0, 24.0, 26.0, 12.0, 17.0, 9.0, 11.0, 7.0, 5.0, 5.0, 9.0, 1.0, 3.0, 4.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-9.515625, -9.235595703125, -8.95556640625, -8.675537109375, -8.3955078125, -8.115478515625, -7.83544921875, -7.555419921875, -7.275390625, -6.995361328125, -6.71533203125, -6.435302734375, -6.1552734375, -5.875244140625, -5.59521484375, -5.315185546875, -5.03515625, -4.755126953125, -4.47509765625, -4.195068359375, -3.9150390625, -3.635009765625, -3.35498046875, -3.074951171875, -2.794921875, -2.514892578125, -2.23486328125, -1.954833984375, -1.6748046875, -1.394775390625, -1.11474609375, -0.834716796875, -0.5546875, -0.274658203125, 0.00537109375, 0.285400390625, 0.5654296875, 0.845458984375, 1.12548828125, 1.405517578125, 1.685546875, 1.965576171875, 2.24560546875, 2.525634765625, 2.8056640625, 3.085693359375, 3.36572265625, 3.645751953125, 3.92578125, 4.205810546875, 4.48583984375, 4.765869140625, 5.0458984375, 5.325927734375, 5.60595703125, 5.885986328125, 6.166015625, 6.446044921875, 6.72607421875, 7.006103515625, 7.2861328125, 7.566162109375, 7.84619140625, 8.126220703125, 8.40625]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 5.0, 3.0, 6.0, 10.0, 16.0, 28.0, 43.0, 67.0, 88.0, 126.0, 205.0, 332.0, 494.0, 697.0, 1168.0, 1871.0, 2840.0, 4373.0, 6982.0, 10958.0, 17110.0, 26945.0, 43192.0, 67240.0, 104896.0, 161008.0, 241150.0, 340689.0, 446485.0, 524990.0, 538427.0, 478375.0, 377982.0, 271735.0, 185884.0, 121733.0, 78465.0, 49776.0, 32052.0, 20188.0, 12628.0, 8242.0, 5225.0, 3330.0, 2194.0, 1391.0, 903.0, 564.0, 397.0, 280.0, 183.0, 113.0, 82.0, 46.0, 30.0, 24.0, 15.0, 8.0, 6.0, 4.0, 0.0, 2.0], "bins": [-7.31640625, -7.0889892578125, -6.861572265625, -6.6341552734375, -6.40673828125, -6.1793212890625, -5.951904296875, -5.7244873046875, -5.4970703125, -5.2696533203125, -5.042236328125, -4.8148193359375, -4.58740234375, -4.3599853515625, -4.132568359375, -3.9051513671875, -3.677734375, -3.4503173828125, -3.222900390625, -2.9954833984375, -2.76806640625, -2.5406494140625, -2.313232421875, -2.0858154296875, -1.8583984375, -1.6309814453125, -1.403564453125, -1.1761474609375, -0.94873046875, -0.7213134765625, -0.493896484375, -0.2664794921875, -0.0390625, 0.1883544921875, 0.415771484375, 0.6431884765625, 0.87060546875, 1.0980224609375, 1.325439453125, 1.5528564453125, 1.7802734375, 2.0076904296875, 2.235107421875, 2.4625244140625, 2.68994140625, 2.9173583984375, 3.144775390625, 3.3721923828125, 3.599609375, 3.8270263671875, 4.054443359375, 4.2818603515625, 4.50927734375, 4.7366943359375, 4.964111328125, 5.1915283203125, 5.4189453125, 5.6463623046875, 5.873779296875, 6.1011962890625, 6.32861328125, 6.5560302734375, 6.783447265625, 7.0108642578125, 7.23828125]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 4.0, 6.0, 12.0, 9.0, 8.0, 11.0, 9.0, 18.0, 20.0, 23.0, 16.0, 40.0, 47.0, 50.0, 57.0, 74.0, 83.0, 89.0, 127.0, 123.0, 139.0, 165.0, 177.0, 155.0, 189.0, 194.0, 187.0, 213.0, 199.0, 171.0, 190.0, 174.0, 156.0, 127.0, 130.0, 101.0, 93.0, 89.0, 75.0, 68.0, 54.0, 45.0, 33.0, 31.0, 22.0, 17.0, 16.0, 13.0, 11.0, 5.0, 5.0, 6.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-3.67578125, -3.558502197265625, -3.44122314453125, -3.323944091796875, -3.2066650390625, -3.089385986328125, -2.97210693359375, -2.854827880859375, -2.737548828125, -2.620269775390625, -2.50299072265625, -2.385711669921875, -2.2684326171875, -2.151153564453125, -2.03387451171875, -1.916595458984375, -1.79931640625, -1.682037353515625, -1.56475830078125, -1.447479248046875, -1.3302001953125, -1.212921142578125, -1.09564208984375, -0.978363037109375, -0.861083984375, -0.743804931640625, -0.62652587890625, -0.509246826171875, -0.3919677734375, -0.274688720703125, -0.15740966796875, -0.040130615234375, 0.0771484375, 0.194427490234375, 0.31170654296875, 0.428985595703125, 0.5462646484375, 0.663543701171875, 0.78082275390625, 0.898101806640625, 1.015380859375, 1.132659912109375, 1.24993896484375, 1.367218017578125, 1.4844970703125, 1.601776123046875, 1.71905517578125, 1.836334228515625, 1.95361328125, 2.070892333984375, 2.18817138671875, 2.305450439453125, 2.4227294921875, 2.540008544921875, 2.65728759765625, 2.774566650390625, 2.891845703125, 3.009124755859375, 3.12640380859375, 3.243682861328125, 3.3609619140625, 3.478240966796875, 3.59552001953125, 3.712799072265625, 3.830078125]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 0.0, 5.0, 3.0, 4.0, 9.0, 12.0, 9.0, 9.0, 16.0, 14.0, 21.0, 21.0, 36.0, 24.0, 36.0, 40.0, 39.0, 40.0, 57.0, 55.0, 53.0, 44.0, 73.0, 55.0, 48.0, 58.0, 31.0, 32.0, 24.0, 24.0, 23.0, 15.0, 11.0, 9.0, 8.0, 10.0, 13.0, 5.0, 4.0, 3.0, 6.0, 2.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.423018455505371, -9.117729187011719, -8.812440872192383, -8.50715160369873, -8.201862335205078, -7.896574020385742, -7.59128475189209, -7.285995960235596, -6.980707168579102, -6.675418376922607, -6.370129585266113, -6.064840316772461, -5.759551525115967, -5.454262733459473, -5.14897346496582, -4.843684673309326, -4.538395881652832, -4.233107089996338, -3.9278180599212646, -3.6225290298461914, -3.3172402381896973, -3.011951446533203, -2.70666241645813, -2.4013733863830566, -2.0960845947265625, -1.7907956838607788, -1.4855067729949951, -1.1802178621292114, -0.8749289512634277, -0.569640040397644, -0.26435112953186035, 0.04093790054321289, 0.34622669219970703, 0.6515156030654907, 0.9568045139312744, 1.262093424797058, 1.5673823356628418, 1.8726712465286255, 2.177960157394409, 2.4832491874694824, 2.7885379791259766, 3.0938267707824707, 3.399115800857544, 3.704404830932617, 4.009693622589111, 4.3149824142456055, 4.620271682739258, 4.925560474395752, 5.230849266052246, 5.53613805770874, 5.841426849365234, 6.146716117858887, 6.452004909515381, 6.757293701171875, 7.062582969665527, 7.3678717613220215, 7.673160552978516, 7.97844934463501, 8.283738136291504, 8.589027404785156, 8.894315719604492, 9.199604988098145, 9.504894256591797, 9.810182571411133, 10.115471839904785]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 4.0, 4.0, 4.0, 2.0, 12.0, 9.0, 8.0, 15.0, 14.0, 16.0, 11.0, 26.0, 22.0, 33.0, 25.0, 27.0, 39.0, 32.0, 33.0, 39.0, 45.0, 32.0, 37.0, 44.0, 41.0, 31.0, 47.0, 34.0, 39.0, 40.0, 27.0, 23.0, 29.0, 28.0, 22.0, 18.0, 26.0, 12.0, 18.0, 8.0, 5.0, 6.0, 4.0, 7.0, 6.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-12.422914505004883, -12.060384750366211, -11.697854995727539, -11.33532428741455, -10.972794532775879, -10.610264778137207, -10.247734069824219, -9.885204315185547, -9.522674560546875, -9.160144805908203, -8.797615051269531, -8.435084342956543, -8.072554588317871, -7.710024833679199, -7.347494602203369, -6.984964370727539, -6.622434616088867, -6.259904861450195, -5.897374629974365, -5.534844398498535, -5.172314643859863, -4.809784889221191, -4.447254657745361, -4.084724426269531, -3.7221946716308594, -3.3596646785736084, -2.9971346855163574, -2.6346046924591064, -2.2720746994018555, -1.9095447063446045, -1.5470147132873535, -1.1844847202301025, -0.8219537734985352, -0.4594237804412842, -0.0968937873840332, 0.2656362056732178, 0.6281661987304688, 0.9906961917877197, 1.3532261848449707, 1.7157561779022217, 2.0782861709594727, 2.4408161640167236, 2.8033461570739746, 3.1658761501312256, 3.5284061431884766, 3.8909361362457275, 4.2534661293029785, 4.615996360778809, 4.9785261154174805, 5.341055870056152, 5.703586101531982, 6.0661163330078125, 6.428646087646484, 6.791175842285156, 7.153706073760986, 7.516236305236816, 7.878766059875488, 8.24129581451416, 8.603826522827148, 8.96635627746582, 9.328886032104492, 9.691415786743164, 10.053945541381836, 10.416476249694824, 10.779006004333496]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 7.0, 4.0, 17.0, 12.0, 23.0, 38.0, 80.0, 102.0, 178.0, 274.0, 463.0, 755.0, 1283.0, 2183.0, 3824.0, 6610.0, 11271.0, 19019.0, 32860.0, 54986.0, 90038.0, 141933.0, 192940.0, 179188.0, 122123.0, 76527.0, 46158.0, 27258.0, 15807.0, 9523.0, 5454.0, 3107.0, 1793.0, 1044.0, 651.0, 370.0, 259.0, 152.0, 99.0, 52.0, 34.0, 22.0, 15.0, 13.0, 4.0, 4.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.29296875, -2.216094970703125, -2.13922119140625, -2.062347412109375, -1.9854736328125, -1.908599853515625, -1.83172607421875, -1.754852294921875, -1.677978515625, -1.601104736328125, -1.52423095703125, -1.447357177734375, -1.3704833984375, -1.293609619140625, -1.21673583984375, -1.139862060546875, -1.06298828125, -0.986114501953125, -0.90924072265625, -0.832366943359375, -0.7554931640625, -0.678619384765625, -0.60174560546875, -0.524871826171875, -0.447998046875, -0.371124267578125, -0.29425048828125, -0.217376708984375, -0.1405029296875, -0.063629150390625, 0.01324462890625, 0.090118408203125, 0.1669921875, 0.243865966796875, 0.32073974609375, 0.397613525390625, 0.4744873046875, 0.551361083984375, 0.62823486328125, 0.705108642578125, 0.781982421875, 0.858856201171875, 0.93572998046875, 1.012603759765625, 1.0894775390625, 1.166351318359375, 1.24322509765625, 1.320098876953125, 1.39697265625, 1.473846435546875, 1.55072021484375, 1.627593994140625, 1.7044677734375, 1.781341552734375, 1.85821533203125, 1.935089111328125, 2.011962890625, 2.088836669921875, 2.16571044921875, 2.242584228515625, 2.3194580078125, 2.396331787109375, 2.47320556640625, 2.550079345703125, 2.626953125]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 0.0, 0.0, 5.0, 1.0, 5.0, 12.0, 5.0, 10.0, 14.0, 17.0, 18.0, 12.0, 17.0, 25.0, 25.0, 24.0, 33.0, 37.0, 41.0, 31.0, 27.0, 44.0, 43.0, 35.0, 32.0, 39.0, 40.0, 44.0, 40.0, 30.0, 39.0, 25.0, 39.0, 24.0, 21.0, 25.0, 21.0, 18.0, 21.0, 14.0, 15.0, 8.0, 9.0, 9.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-12.4765625, -12.114013671875, -11.75146484375, -11.388916015625, -11.0263671875, -10.663818359375, -10.30126953125, -9.938720703125, -9.576171875, -9.213623046875, -8.85107421875, -8.488525390625, -8.1259765625, -7.763427734375, -7.40087890625, -7.038330078125, -6.67578125, -6.313232421875, -5.95068359375, -5.588134765625, -5.2255859375, -4.863037109375, -4.50048828125, -4.137939453125, -3.775390625, -3.412841796875, -3.05029296875, -2.687744140625, -2.3251953125, -1.962646484375, -1.60009765625, -1.237548828125, -0.875, -0.512451171875, -0.14990234375, 0.212646484375, 0.5751953125, 0.937744140625, 1.30029296875, 1.662841796875, 2.025390625, 2.387939453125, 2.75048828125, 3.113037109375, 3.4755859375, 3.838134765625, 4.20068359375, 4.563232421875, 4.92578125, 5.288330078125, 5.65087890625, 6.013427734375, 6.3759765625, 6.738525390625, 7.10107421875, 7.463623046875, 7.826171875, 8.188720703125, 8.55126953125, 8.913818359375, 9.2763671875, 9.638916015625, 10.00146484375, 10.364013671875, 10.7265625]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 9.0, 19.0, 18.0, 16.0, 43.0, 64.0, 80.0, 133.0, 181.0, 327.0, 512.0, 781.0, 1186.0, 1770.0, 2830.0, 4480.0, 7433.0, 11629.0, 18803.0, 29689.0, 47350.0, 74566.0, 114303.0, 165562.0, 181336.0, 137757.0, 90775.0, 58566.0, 36665.0, 22894.0, 14338.0, 8838.0, 5733.0, 3503.0, 2287.0, 1378.0, 961.0, 569.0, 383.0, 262.0, 180.0, 113.0, 76.0, 57.0, 46.0, 21.0, 12.0, 7.0, 5.0, 6.0, 5.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.7890625, -1.733551025390625, -1.67803955078125, -1.622528076171875, -1.5670166015625, -1.511505126953125, -1.45599365234375, -1.400482177734375, -1.344970703125, -1.289459228515625, -1.23394775390625, -1.178436279296875, -1.1229248046875, -1.067413330078125, -1.01190185546875, -0.956390380859375, -0.90087890625, -0.845367431640625, -0.78985595703125, -0.734344482421875, -0.6788330078125, -0.623321533203125, -0.56781005859375, -0.512298583984375, -0.456787109375, -0.401275634765625, -0.34576416015625, -0.290252685546875, -0.2347412109375, -0.179229736328125, -0.12371826171875, -0.068206787109375, -0.0126953125, 0.042816162109375, 0.09832763671875, 0.153839111328125, 0.2093505859375, 0.264862060546875, 0.32037353515625, 0.375885009765625, 0.431396484375, 0.486907958984375, 0.54241943359375, 0.597930908203125, 0.6534423828125, 0.708953857421875, 0.76446533203125, 0.819976806640625, 0.87548828125, 0.930999755859375, 0.98651123046875, 1.042022705078125, 1.0975341796875, 1.153045654296875, 1.20855712890625, 1.264068603515625, 1.319580078125, 1.375091552734375, 1.43060302734375, 1.486114501953125, 1.5416259765625, 1.597137451171875, 1.65264892578125, 1.708160400390625, 1.763671875]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 8.0, 8.0, 3.0, 9.0, 12.0, 15.0, 14.0, 16.0, 19.0, 22.0, 30.0, 28.0, 15.0, 37.0, 37.0, 26.0, 34.0, 38.0, 38.0, 41.0, 41.0, 39.0, 37.0, 44.0, 37.0, 44.0, 25.0, 33.0, 37.0, 25.0, 25.0, 20.0, 28.0, 30.0, 15.0, 21.0, 8.0, 9.0, 9.0, 6.0, 6.0, 6.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-7.8515625, -7.61962890625, -7.3876953125, -7.15576171875, -6.923828125, -6.69189453125, -6.4599609375, -6.22802734375, -5.99609375, -5.76416015625, -5.5322265625, -5.30029296875, -5.068359375, -4.83642578125, -4.6044921875, -4.37255859375, -4.140625, -3.90869140625, -3.6767578125, -3.44482421875, -3.212890625, -2.98095703125, -2.7490234375, -2.51708984375, -2.28515625, -2.05322265625, -1.8212890625, -1.58935546875, -1.357421875, -1.12548828125, -0.8935546875, -0.66162109375, -0.4296875, -0.19775390625, 0.0341796875, 0.26611328125, 0.498046875, 0.72998046875, 0.9619140625, 1.19384765625, 1.42578125, 1.65771484375, 1.8896484375, 2.12158203125, 2.353515625, 2.58544921875, 2.8173828125, 3.04931640625, 3.28125, 3.51318359375, 3.7451171875, 3.97705078125, 4.208984375, 4.44091796875, 4.6728515625, 4.90478515625, 5.13671875, 5.36865234375, 5.6005859375, 5.83251953125, 6.064453125, 6.29638671875, 6.5283203125, 6.76025390625, 6.9921875]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 5.0, 5.0, 10.0, 5.0, 12.0, 12.0, 29.0, 39.0, 43.0, 94.0, 125.0, 161.0, 197.0, 321.0, 544.0, 894.0, 1278.0, 2069.0, 4014.0, 9089.0, 29518.0, 137581.0, 533713.0, 252277.0, 51194.0, 13227.0, 5181.0, 2572.0, 1542.0, 954.0, 596.0, 395.0, 286.0, 178.0, 115.0, 86.0, 57.0, 44.0, 29.0, 24.0, 17.0, 11.0, 7.0, 3.0, 4.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5576171875, -0.5388336181640625, -0.520050048828125, -0.5012664794921875, -0.48248291015625, -0.4636993408203125, -0.444915771484375, -0.4261322021484375, -0.4073486328125, -0.3885650634765625, -0.369781494140625, -0.3509979248046875, -0.33221435546875, -0.3134307861328125, -0.294647216796875, -0.2758636474609375, -0.257080078125, -0.2382965087890625, -0.219512939453125, -0.2007293701171875, -0.18194580078125, -0.1631622314453125, -0.144378662109375, -0.1255950927734375, -0.1068115234375, -0.0880279541015625, -0.069244384765625, -0.0504608154296875, -0.03167724609375, -0.0128936767578125, 0.005889892578125, 0.0246734619140625, 0.04345703125, 0.0622406005859375, 0.081024169921875, 0.0998077392578125, 0.11859130859375, 0.1373748779296875, 0.156158447265625, 0.1749420166015625, 0.1937255859375, 0.2125091552734375, 0.231292724609375, 0.2500762939453125, 0.26885986328125, 0.2876434326171875, 0.306427001953125, 0.3252105712890625, 0.343994140625, 0.3627777099609375, 0.381561279296875, 0.4003448486328125, 0.41912841796875, 0.4379119873046875, 0.456695556640625, 0.4754791259765625, 0.4942626953125, 0.5130462646484375, 0.531829833984375, 0.5506134033203125, 0.56939697265625, 0.5881805419921875, 0.606964111328125, 0.6257476806640625, 0.64453125]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 3.0, 3.0, 2.0, 2.0, 4.0, 10.0, 20.0, 40.0, 67.0, 126.0, 167.0, 185.0, 173.0, 84.0, 51.0, 31.0, 15.0, 8.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.106231689453125e-05, -7.798522710800171e-05, -7.490813732147217e-05, -7.183104753494263e-05, -6.875395774841309e-05, -6.567686796188354e-05, -6.2599778175354e-05, -5.952268838882446e-05, -5.644559860229492e-05, -5.336850881576538e-05, -5.029141902923584e-05, -4.72143292427063e-05, -4.413723945617676e-05, -4.106014966964722e-05, -3.7983059883117676e-05, -3.4905970096588135e-05, -3.1828880310058594e-05, -2.8751790523529053e-05, -2.5674700736999512e-05, -2.259761095046997e-05, -1.952052116394043e-05, -1.644343137741089e-05, -1.3366341590881348e-05, -1.0289251804351807e-05, -7.212162017822266e-06, -4.135072231292725e-06, -1.0579824447631836e-06, 2.0191073417663574e-06, 5.0961971282958984e-06, 8.17328691482544e-06, 1.125037670135498e-05, 1.4327466487884521e-05, 1.7404556274414062e-05, 2.0481646060943604e-05, 2.3558735847473145e-05, 2.6635825634002686e-05, 2.9712915420532227e-05, 3.279000520706177e-05, 3.586709499359131e-05, 3.894418478012085e-05, 4.202127456665039e-05, 4.509836435317993e-05, 4.817545413970947e-05, 5.1252543926239014e-05, 5.4329633712768555e-05, 5.7406723499298096e-05, 6.048381328582764e-05, 6.356090307235718e-05, 6.663799285888672e-05, 6.971508264541626e-05, 7.27921724319458e-05, 7.586926221847534e-05, 7.894635200500488e-05, 8.202344179153442e-05, 8.510053157806396e-05, 8.81776213645935e-05, 9.125471115112305e-05, 9.433180093765259e-05, 9.740889072418213e-05, 0.00010048598051071167, 0.00010356307029724121, 0.00010664016008377075, 0.00010971724987030029, 0.00011279433965682983, 0.00011587142944335938]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 5.0, 10.0, 16.0, 9.0, 27.0, 37.0, 46.0, 80.0, 141.0, 197.0, 256.0, 411.0, 746.0, 1227.0, 2077.0, 3887.0, 7500.0, 15714.0, 37049.0, 99904.0, 276961.0, 364655.0, 143536.0, 52409.0, 20786.0, 9677.0, 4867.0, 2468.0, 1488.0, 886.0, 525.0, 311.0, 203.0, 138.0, 93.0, 62.0, 39.0, 28.0, 20.0, 27.0, 10.0, 10.0, 11.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.6630859375, -0.6436843872070312, -0.6242828369140625, -0.6048812866210938, -0.585479736328125, -0.5660781860351562, -0.5466766357421875, -0.5272750854492188, -0.50787353515625, -0.48847198486328125, -0.4690704345703125, -0.44966888427734375, -0.430267333984375, -0.41086578369140625, -0.3914642333984375, -0.37206268310546875, -0.3526611328125, -0.33325958251953125, -0.3138580322265625, -0.29445648193359375, -0.275054931640625, -0.25565338134765625, -0.2362518310546875, -0.21685028076171875, -0.19744873046875, -0.17804718017578125, -0.1586456298828125, -0.13924407958984375, -0.119842529296875, -0.10044097900390625, -0.0810394287109375, -0.06163787841796875, -0.042236328125, -0.02283477783203125, -0.0034332275390625, 0.01596832275390625, 0.035369873046875, 0.05477142333984375, 0.0741729736328125, 0.09357452392578125, 0.11297607421875, 0.13237762451171875, 0.1517791748046875, 0.17118072509765625, 0.190582275390625, 0.20998382568359375, 0.2293853759765625, 0.24878692626953125, 0.2681884765625, 0.28759002685546875, 0.3069915771484375, 0.32639312744140625, 0.345794677734375, 0.36519622802734375, 0.3845977783203125, 0.40399932861328125, 0.42340087890625, 0.44280242919921875, 0.4622039794921875, 0.48160552978515625, 0.501007080078125, 0.5204086303710938, 0.5398101806640625, 0.5592117309570312, 0.57861328125]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 6.0, 6.0, 6.0, 12.0, 12.0, 27.0, 35.0, 48.0, 66.0, 86.0, 93.0, 82.0, 86.0, 95.0, 85.0, 60.0, 51.0, 37.0, 36.0, 23.0, 11.0, 13.0, 7.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.259765625, -0.25260353088378906, -0.24544143676757812, -0.2382793426513672, -0.23111724853515625, -0.2239551544189453, -0.21679306030273438, -0.20963096618652344, -0.2024688720703125, -0.19530677795410156, -0.18814468383789062, -0.1809825897216797, -0.17382049560546875, -0.1666584014892578, -0.15949630737304688, -0.15233421325683594, -0.145172119140625, -0.13801002502441406, -0.13084793090820312, -0.12368583679199219, -0.11652374267578125, -0.10936164855957031, -0.10219955444335938, -0.09503746032714844, -0.0878753662109375, -0.08071327209472656, -0.07355117797851562, -0.06638908386230469, -0.05922698974609375, -0.05206489562988281, -0.044902801513671875, -0.03774070739746094, -0.03057861328125, -0.023416519165039062, -0.016254425048828125, -0.009092330932617188, -0.00193023681640625, 0.0052318572998046875, 0.012393951416015625, 0.019556045532226562, 0.0267181396484375, 0.03388023376464844, 0.041042327880859375, 0.04820442199707031, 0.05536651611328125, 0.06252861022949219, 0.06969070434570312, 0.07685279846191406, 0.084014892578125, 0.09117698669433594, 0.09833908081054688, 0.10550117492675781, 0.11266326904296875, 0.11982536315917969, 0.12698745727539062, 0.13414955139160156, 0.1413116455078125, 0.14847373962402344, 0.15563583374023438, 0.1627979278564453, 0.16996002197265625, 0.1771221160888672, 0.18428421020507812, 0.19144630432128906, 0.1986083984375]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 6.0, 2.0, 5.0, 13.0, 10.0, 11.0, 7.0, 21.0, 15.0, 17.0, 23.0, 24.0, 39.0, 37.0, 31.0, 36.0, 52.0, 49.0, 56.0, 62.0, 49.0, 70.0, 45.0, 55.0, 55.0, 28.0, 31.0, 23.0, 20.0, 25.0, 15.0, 8.0, 8.0, 15.0, 9.0, 7.0, 6.0, 3.0, 4.0, 6.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.184307098388672, -8.884659767150879, -8.585012435913086, -8.285365104675293, -7.985718250274658, -7.686070919036865, -7.386423587799072, -7.0867767333984375, -6.7871294021606445, -6.487482070922852, -6.187834739685059, -5.888187408447266, -5.588540554046631, -5.288893222808838, -4.989245891571045, -4.68959903717041, -4.389951229095459, -4.090303897857666, -3.790656805038452, -3.491009473800659, -3.1913623809814453, -2.8917150497436523, -2.5920677185058594, -2.2924206256866455, -1.9927732944488525, -1.6931260824203491, -1.3934788703918457, -1.0938315391540527, -0.7941843271255493, -0.4945371150970459, -0.19488978385925293, 0.10475730895996094, 0.4044046401977539, 0.7040518522262573, 1.0036990642547607, 1.3033463954925537, 1.6029936075210571, 1.9026408195495605, 2.2022881507873535, 2.5019352436065674, 2.8015825748443604, 3.1012299060821533, 3.400876998901367, 3.70052433013916, 4.000171661376953, 4.299818992614746, 4.599466323852539, 4.899113178253174, 5.198760509490967, 5.49840784072876, 5.798055171966553, 6.0977020263671875, 6.3973493576049805, 6.696996688842773, 6.996644020080566, 7.296291351318359, 7.595938682556152, 7.895586013793945, 8.195233345031738, 8.494880676269531, 8.794528007507324, 9.094175338745117, 9.393821716308594, 9.693469047546387, 9.99311637878418]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 4.0, 4.0, 3.0, 3.0, 12.0, 8.0, 10.0, 15.0, 12.0, 16.0, 13.0, 24.0, 25.0, 27.0, 31.0, 26.0, 36.0, 35.0, 33.0, 36.0, 44.0, 33.0, 33.0, 47.0, 40.0, 30.0, 50.0, 34.0, 40.0, 40.0, 29.0, 23.0, 28.0, 27.0, 21.0, 20.0, 24.0, 17.0, 15.0, 7.0, 6.0, 6.0, 5.0, 5.0, 6.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-12.266376495361328, -11.908248901367188, -11.550122261047363, -11.191994667053223, -10.833867073059082, -10.475740432739258, -10.117612838745117, -9.759485244750977, -9.401357650756836, -9.043230056762695, -8.685103416442871, -8.32697582244873, -7.96884822845459, -7.610721111297607, -7.252593994140625, -6.894466400146484, -6.53633975982666, -6.178212642669678, -5.820085048675537, -5.461957931518555, -5.103830337524414, -4.745703220367432, -4.387576103210449, -4.029448509216309, -3.671321392059326, -3.3131940364837646, -2.955066680908203, -2.5969395637512207, -2.238812208175659, -1.8806848526000977, -1.5225577354431152, -1.1644303798675537, -0.8063020706176758, -0.44817477464675903, -0.09004747867584229, 0.2680797576904297, 0.6262071132659912, 0.9843344688415527, 1.3424615859985352, 1.7005889415740967, 2.058716297149658, 2.4168436527252197, 2.7749710083007812, 3.1330981254577637, 3.491225481033325, 3.8493528366088867, 4.207479953765869, 4.565607070922852, 4.923734664916992, 5.281861782073975, 5.639989376068115, 5.998116493225098, 6.356244087219238, 6.714371204376221, 7.072498321533203, 7.430625915527344, 7.788753032684326, 8.146880149841309, 8.50500774383545, 8.863134384155273, 9.221261978149414, 9.579389572143555, 9.937517166137695, 10.29564380645752, 10.65377140045166]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 4.0, 3.0, 10.0, 9.0, 14.0, 19.0, 23.0, 56.0, 78.0, 107.0, 161.0, 295.0, 452.0, 676.0, 1148.0, 1906.0, 3193.0, 5230.0, 8749.0, 14468.0, 23880.0, 38344.0, 58821.0, 86071.0, 117021.0, 141437.0, 144569.0, 125833.0, 95798.0, 66330.0, 43411.0, 27597.0, 17141.0, 10201.0, 6140.0, 3665.0, 2203.0, 1351.0, 786.0, 529.0, 323.0, 180.0, 125.0, 66.0, 49.0, 43.0, 22.0, 6.0, 9.0, 4.0, 6.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.234375, -8.9281005859375, -8.621826171875, -8.3155517578125, -8.00927734375, -7.7030029296875, -7.396728515625, -7.0904541015625, -6.7841796875, -6.4779052734375, -6.171630859375, -5.8653564453125, -5.55908203125, -5.2528076171875, -4.946533203125, -4.6402587890625, -4.333984375, -4.0277099609375, -3.721435546875, -3.4151611328125, -3.10888671875, -2.8026123046875, -2.496337890625, -2.1900634765625, -1.8837890625, -1.5775146484375, -1.271240234375, -0.9649658203125, -0.65869140625, -0.3524169921875, -0.046142578125, 0.2601318359375, 0.56640625, 0.8726806640625, 1.178955078125, 1.4852294921875, 1.79150390625, 2.0977783203125, 2.404052734375, 2.7103271484375, 3.0166015625, 3.3228759765625, 3.629150390625, 3.9354248046875, 4.24169921875, 4.5479736328125, 4.854248046875, 5.1605224609375, 5.466796875, 5.7730712890625, 6.079345703125, 6.3856201171875, 6.69189453125, 6.9981689453125, 7.304443359375, 7.6107177734375, 7.9169921875, 8.2232666015625, 8.529541015625, 8.8358154296875, 9.14208984375, 9.4483642578125, 9.754638671875, 10.0609130859375, 10.3671875]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 4.0, 3.0, 4.0, 4.0, 8.0, 5.0, 6.0, 15.0, 16.0, 16.0, 27.0, 26.0, 22.0, 21.0, 29.0, 29.0, 26.0, 33.0, 35.0, 33.0, 51.0, 48.0, 43.0, 42.0, 44.0, 31.0, 36.0, 45.0, 39.0, 34.0, 31.0, 32.0, 23.0, 18.0, 27.0, 21.0, 11.0, 14.0, 20.0, 13.0, 9.0, 1.0, 5.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 5.0, 2.0], "bins": [-12.9140625, -12.5556640625, -12.197265625, -11.8388671875, -11.48046875, -11.1220703125, -10.763671875, -10.4052734375, -10.046875, -9.6884765625, -9.330078125, -8.9716796875, -8.61328125, -8.2548828125, -7.896484375, -7.5380859375, -7.1796875, -6.8212890625, -6.462890625, -6.1044921875, -5.74609375, -5.3876953125, -5.029296875, -4.6708984375, -4.3125, -3.9541015625, -3.595703125, -3.2373046875, -2.87890625, -2.5205078125, -2.162109375, -1.8037109375, -1.4453125, -1.0869140625, -0.728515625, -0.3701171875, -0.01171875, 0.3466796875, 0.705078125, 1.0634765625, 1.421875, 1.7802734375, 2.138671875, 2.4970703125, 2.85546875, 3.2138671875, 3.572265625, 3.9306640625, 4.2890625, 4.6474609375, 5.005859375, 5.3642578125, 5.72265625, 6.0810546875, 6.439453125, 6.7978515625, 7.15625, 7.5146484375, 7.873046875, 8.2314453125, 8.58984375, 8.9482421875, 9.306640625, 9.6650390625, 10.0234375]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 9.0, 10.0, 12.0, 9.0, 26.0, 37.0, 42.0, 99.0, 135.0, 224.0, 368.0, 620.0, 1121.0, 1811.0, 3240.0, 5525.0, 9592.0, 16382.0, 28358.0, 48311.0, 78847.0, 118017.0, 154146.0, 166588.0, 145121.0, 104551.0, 67451.0, 41203.0, 23675.0, 13876.0, 8010.0, 4495.0, 2672.0, 1625.0, 944.0, 580.0, 315.0, 189.0, 116.0, 86.0, 51.0, 30.0, 18.0, 7.0, 11.0, 7.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.46875, -9.1346435546875, -8.800537109375, -8.4664306640625, -8.13232421875, -7.7982177734375, -7.464111328125, -7.1300048828125, -6.7958984375, -6.4617919921875, -6.127685546875, -5.7935791015625, -5.45947265625, -5.1253662109375, -4.791259765625, -4.4571533203125, -4.123046875, -3.7889404296875, -3.454833984375, -3.1207275390625, -2.78662109375, -2.4525146484375, -2.118408203125, -1.7843017578125, -1.4501953125, -1.1160888671875, -0.781982421875, -0.4478759765625, -0.11376953125, 0.2203369140625, 0.554443359375, 0.8885498046875, 1.22265625, 1.5567626953125, 1.890869140625, 2.2249755859375, 2.55908203125, 2.8931884765625, 3.227294921875, 3.5614013671875, 3.8955078125, 4.2296142578125, 4.563720703125, 4.8978271484375, 5.23193359375, 5.5660400390625, 5.900146484375, 6.2342529296875, 6.568359375, 6.9024658203125, 7.236572265625, 7.5706787109375, 7.90478515625, 8.2388916015625, 8.572998046875, 8.9071044921875, 9.2412109375, 9.5753173828125, 9.909423828125, 10.2435302734375, 10.57763671875, 10.9117431640625, 11.245849609375, 11.5799560546875, 11.9140625]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 5.0, 7.0, 4.0, 6.0, 8.0, 5.0, 17.0, 23.0, 13.0, 12.0, 25.0, 22.0, 26.0, 30.0, 28.0, 40.0, 36.0, 51.0, 46.0, 51.0, 51.0, 57.0, 47.0, 59.0, 49.0, 40.0, 29.0, 37.0, 28.0, 30.0, 21.0, 23.0, 21.0, 14.0, 13.0, 8.0, 10.0, 8.0, 5.0, 6.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.21875, -6.960693359375, -6.70263671875, -6.444580078125, -6.1865234375, -5.928466796875, -5.67041015625, -5.412353515625, -5.154296875, -4.896240234375, -4.63818359375, -4.380126953125, -4.1220703125, -3.864013671875, -3.60595703125, -3.347900390625, -3.08984375, -2.831787109375, -2.57373046875, -2.315673828125, -2.0576171875, -1.799560546875, -1.54150390625, -1.283447265625, -1.025390625, -0.767333984375, -0.50927734375, -0.251220703125, 0.0068359375, 0.264892578125, 0.52294921875, 0.781005859375, 1.0390625, 1.297119140625, 1.55517578125, 1.813232421875, 2.0712890625, 2.329345703125, 2.58740234375, 2.845458984375, 3.103515625, 3.361572265625, 3.61962890625, 3.877685546875, 4.1357421875, 4.393798828125, 4.65185546875, 4.909912109375, 5.16796875, 5.426025390625, 5.68408203125, 5.942138671875, 6.2001953125, 6.458251953125, 6.71630859375, 6.974365234375, 7.232421875, 7.490478515625, 7.74853515625, 8.006591796875, 8.2646484375, 8.522705078125, 8.78076171875, 9.038818359375, 9.296875]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 10.0, 19.0, 15.0, 41.0, 65.0, 90.0, 122.0, 198.0, 317.0, 544.0, 828.0, 1379.0, 2255.0, 3784.0, 6683.0, 11427.0, 19931.0, 34756.0, 58798.0, 96599.0, 144462.0, 180435.0, 170379.0, 123915.0, 78845.0, 47176.0, 27580.0, 15709.0, 8994.0, 5359.0, 3116.0, 1821.0, 1075.0, 667.0, 439.0, 240.0, 167.0, 112.0, 65.0, 53.0, 26.0, 27.0, 12.0, 10.0, 9.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.990234375, -3.864715576171875, -3.73919677734375, -3.613677978515625, -3.4881591796875, -3.362640380859375, -3.23712158203125, -3.111602783203125, -2.986083984375, -2.860565185546875, -2.73504638671875, -2.609527587890625, -2.4840087890625, -2.358489990234375, -2.23297119140625, -2.107452392578125, -1.98193359375, -1.856414794921875, -1.73089599609375, -1.605377197265625, -1.4798583984375, -1.354339599609375, -1.22882080078125, -1.103302001953125, -0.977783203125, -0.852264404296875, -0.72674560546875, -0.601226806640625, -0.4757080078125, -0.350189208984375, -0.22467041015625, -0.099151611328125, 0.0263671875, 0.151885986328125, 0.27740478515625, 0.402923583984375, 0.5284423828125, 0.653961181640625, 0.77947998046875, 0.904998779296875, 1.030517578125, 1.156036376953125, 1.28155517578125, 1.407073974609375, 1.5325927734375, 1.658111572265625, 1.78363037109375, 1.909149169921875, 2.03466796875, 2.160186767578125, 2.28570556640625, 2.411224365234375, 2.5367431640625, 2.662261962890625, 2.78778076171875, 2.913299560546875, 3.038818359375, 3.164337158203125, 3.28985595703125, 3.415374755859375, 3.5408935546875, 3.666412353515625, 3.79193115234375, 3.917449951171875, 4.04296875]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 3.0, 4.0, 7.0, 5.0, 14.0, 16.0, 17.0, 17.0, 16.0, 23.0, 26.0, 30.0, 34.0, 50.0, 52.0, 58.0, 49.0, 42.0, 65.0, 55.0, 61.0, 51.0, 48.0, 50.0, 33.0, 35.0, 21.0, 21.0, 10.0, 16.0, 10.0, 9.0, 13.0, 12.0, 4.0, 10.0, 2.0, 2.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002665519714355469, -0.00025672465562820435, -0.0002468973398208618, -0.0002370700240135193, -0.00022724270820617676, -0.00021741539239883423, -0.0002075880765914917, -0.00019776076078414917, -0.00018793344497680664, -0.0001781061291694641, -0.00016827881336212158, -0.00015845149755477905, -0.00014862418174743652, -0.000138796865940094, -0.00012896955013275146, -0.00011914223432540894, -0.0001093149185180664, -9.948760271072388e-05, -8.966028690338135e-05, -7.983297109603882e-05, -7.000565528869629e-05, -6.017833948135376e-05, -5.035102367401123e-05, -4.05237078666687e-05, -3.069639205932617e-05, -2.0869076251983643e-05, -1.1041760444641113e-05, -1.214444637298584e-06, 8.612871170043945e-06, 1.8440186977386475e-05, 2.8267502784729004e-05, 3.809481859207153e-05, 4.792213439941406e-05, 5.774945020675659e-05, 6.757676601409912e-05, 7.740408182144165e-05, 8.723139762878418e-05, 9.705871343612671e-05, 0.00010688602924346924, 0.00011671334505081177, 0.0001265406608581543, 0.00013636797666549683, 0.00014619529247283936, 0.00015602260828018188, 0.00016584992408752441, 0.00017567723989486694, 0.00018550455570220947, 0.000195331871509552, 0.00020515918731689453, 0.00021498650312423706, 0.0002248138189315796, 0.00023464113473892212, 0.00024446845054626465, 0.0002542957663536072, 0.0002641230821609497, 0.00027395039796829224, 0.00028377771377563477, 0.0002936050295829773, 0.0003034323453903198, 0.00031325966119766235, 0.0003230869770050049, 0.0003329142928123474, 0.00034274160861968994, 0.00035256892442703247, 0.000362396240234375]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 6.0, 7.0, 5.0, 8.0, 14.0, 17.0, 19.0, 32.0, 50.0, 47.0, 86.0, 132.0, 195.0, 302.0, 519.0, 846.0, 1330.0, 2263.0, 3870.0, 6804.0, 12116.0, 21960.0, 38948.0, 68416.0, 114754.0, 168351.0, 193505.0, 160925.0, 106671.0, 63802.0, 35815.0, 20140.0, 11163.0, 6541.0, 3486.0, 2048.0, 1192.0, 746.0, 492.0, 299.0, 207.0, 146.0, 86.0, 52.0, 44.0, 32.0, 27.0, 15.0, 10.0, 8.0, 6.0, 7.0, 3.0, 2.0, 0.0, 2.0, 1.0], "bins": [-4.4765625, -4.3426513671875, -4.208740234375, -4.0748291015625, -3.94091796875, -3.8070068359375, -3.673095703125, -3.5391845703125, -3.4052734375, -3.2713623046875, -3.137451171875, -3.0035400390625, -2.86962890625, -2.7357177734375, -2.601806640625, -2.4678955078125, -2.333984375, -2.2000732421875, -2.066162109375, -1.9322509765625, -1.79833984375, -1.6644287109375, -1.530517578125, -1.3966064453125, -1.2626953125, -1.1287841796875, -0.994873046875, -0.8609619140625, -0.72705078125, -0.5931396484375, -0.459228515625, -0.3253173828125, -0.19140625, -0.0574951171875, 0.076416015625, 0.2103271484375, 0.34423828125, 0.4781494140625, 0.612060546875, 0.7459716796875, 0.8798828125, 1.0137939453125, 1.147705078125, 1.2816162109375, 1.41552734375, 1.5494384765625, 1.683349609375, 1.8172607421875, 1.951171875, 2.0850830078125, 2.218994140625, 2.3529052734375, 2.48681640625, 2.6207275390625, 2.754638671875, 2.8885498046875, 3.0224609375, 3.1563720703125, 3.290283203125, 3.4241943359375, 3.55810546875, 3.6920166015625, 3.825927734375, 3.9598388671875, 4.09375]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 2.0, 3.0, 4.0, 9.0, 4.0, 10.0, 11.0, 10.0, 11.0, 9.0, 29.0, 22.0, 30.0, 22.0, 30.0, 30.0, 34.0, 48.0, 48.0, 42.0, 47.0, 62.0, 61.0, 46.0, 42.0, 33.0, 42.0, 38.0, 33.0, 30.0, 31.0, 26.0, 22.0, 22.0, 11.0, 12.0, 7.0, 11.0, 7.0, 2.0, 7.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.72265625, -1.6746826171875, -1.626708984375, -1.5787353515625, -1.53076171875, -1.4827880859375, -1.434814453125, -1.3868408203125, -1.3388671875, -1.2908935546875, -1.242919921875, -1.1949462890625, -1.14697265625, -1.0989990234375, -1.051025390625, -1.0030517578125, -0.955078125, -0.9071044921875, -0.859130859375, -0.8111572265625, -0.76318359375, -0.7152099609375, -0.667236328125, -0.6192626953125, -0.5712890625, -0.5233154296875, -0.475341796875, -0.4273681640625, -0.37939453125, -0.3314208984375, -0.283447265625, -0.2354736328125, -0.1875, -0.1395263671875, -0.091552734375, -0.0435791015625, 0.00439453125, 0.0523681640625, 0.100341796875, 0.1483154296875, 0.1962890625, 0.2442626953125, 0.292236328125, 0.3402099609375, 0.38818359375, 0.4361572265625, 0.484130859375, 0.5321044921875, 0.580078125, 0.6280517578125, 0.676025390625, 0.7239990234375, 0.77197265625, 0.8199462890625, 0.867919921875, 0.9158935546875, 0.9638671875, 1.0118408203125, 1.059814453125, 1.1077880859375, 1.15576171875, 1.2037353515625, 1.251708984375, 1.2996826171875, 1.34765625]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 1.0, 3.0, 4.0, 0.0, 3.0, 2.0, 6.0, 7.0, 10.0, 7.0, 11.0, 8.0, 13.0, 11.0, 17.0, 22.0, 19.0, 23.0, 31.0, 46.0, 41.0, 47.0, 62.0, 41.0, 48.0, 54.0, 55.0, 50.0, 36.0, 41.0, 46.0, 36.0, 32.0, 31.0, 21.0, 25.0, 21.0, 15.0, 12.0, 10.0, 8.0, 9.0, 11.0, 3.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.135467529296875, -7.851094722747803, -7.5667219161987305, -7.282349109649658, -6.997976303100586, -6.713603973388672, -6.4292311668396, -6.144858360290527, -5.860485553741455, -5.576112747192383, -5.2917399406433105, -5.007367134094238, -4.722994804382324, -4.438621520996094, -4.15424919128418, -3.8698763847351074, -3.585503578186035, -3.301130771636963, -3.0167579650878906, -2.7323853969573975, -2.448012590408325, -2.163639783859253, -1.8792670965194702, -1.5948944091796875, -1.3105216026306152, -1.026148796081543, -0.7417761087417603, -0.45740336179733276, -0.17303061485290527, 0.11134219169616699, 0.3957148790359497, 0.6800875663757324, 0.9644603729248047, 1.248833179473877, 1.5332058668136597, 1.8175785541534424, 2.1019513607025146, 2.386324167251587, 2.67069673538208, 2.9550695419311523, 3.2394423484802246, 3.523815155029297, 3.808187961578369, 4.092560768127441, 4.3769330978393555, 4.661306381225586, 4.9456787109375, 5.230051517486572, 5.5144243240356445, 5.798797130584717, 6.083169937133789, 6.367542743682861, 6.651915550231934, 6.936287879943848, 7.22066068649292, 7.505033493041992, 7.7894062995910645, 8.073779106140137, 8.35815143585205, 8.642524719238281, 8.926897048950195, 9.211270332336426, 9.49564266204834, 9.78001594543457, 10.064388275146484]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 3.0, 2.0, 8.0, 11.0, 7.0, 13.0, 16.0, 18.0, 18.0, 16.0, 20.0, 30.0, 24.0, 28.0, 30.0, 26.0, 26.0, 38.0, 43.0, 39.0, 54.0, 36.0, 32.0, 40.0, 49.0, 42.0, 34.0, 26.0, 30.0, 28.0, 30.0, 24.0, 25.0, 15.0, 20.0, 21.0, 24.0, 14.0, 8.0, 7.0, 6.0, 7.0, 3.0, 3.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-11.85439682006836, -11.501228332519531, -11.148059844970703, -10.794891357421875, -10.441723823547363, -10.088555335998535, -9.735386848449707, -9.382218360900879, -9.029050827026367, -8.675882339477539, -8.322713851928711, -7.969545841217041, -7.616377830505371, -7.263209342956543, -6.910040855407715, -6.556872367858887, -6.203703880310059, -5.8505353927612305, -5.4973673820495605, -5.144198894500732, -4.7910308837890625, -4.437862396240234, -4.084693908691406, -3.7315256595611572, -3.378357410430908, -3.025189161300659, -2.67202091217041, -2.318852424621582, -1.965684175491333, -1.612515926361084, -1.2593474388122559, -0.9061791896820068, -0.5530099868774414, -0.1998416781425476, 0.1533266305923462, 0.5064949989318848, 0.8596632480621338, 1.2128314971923828, 1.565999984741211, 1.91916823387146, 2.272336483001709, 2.625504732131958, 2.978672981262207, 3.331841468811035, 3.685009717941284, 4.038177967071533, 4.391346454620361, 4.744514465332031, 5.097682952880859, 5.4508514404296875, 5.804019451141357, 6.1571879386901855, 6.5103559494018555, 6.863524436950684, 7.216692924499512, 7.56986141204834, 7.92302942276001, 8.27619743347168, 8.629365921020508, 8.982534408569336, 9.335702896118164, 9.688871383666992, 10.04203987121582, 10.395207405090332, 10.74837589263916]}, "gradients/decoder.bert.encoder.layer.18.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 8.0, 8.0, 10.0, 9.0, 20.0, 30.0, 47.0, 106.0, 169.0, 231.0, 376.0, 650.0, 1031.0, 1768.0, 2966.0, 5162.0, 9036.0, 16477.0, 29619.0, 53620.0, 98218.0, 182086.0, 333643.0, 576494.0, 821092.0, 809361.0, 554524.0, 316324.0, 171491.0, 93144.0, 51397.0, 28177.0, 15748.0, 8915.0, 5105.0, 2947.0, 1742.0, 1045.0, 582.0, 347.0, 212.0, 144.0, 68.0, 48.0, 32.0, 36.0, 12.0, 9.0, 6.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.7421875, -9.4373779296875, -9.132568359375, -8.8277587890625, -8.52294921875, -8.2181396484375, -7.913330078125, -7.6085205078125, -7.3037109375, -6.9989013671875, -6.694091796875, -6.3892822265625, -6.08447265625, -5.7796630859375, -5.474853515625, -5.1700439453125, -4.865234375, -4.5604248046875, -4.255615234375, -3.9508056640625, -3.64599609375, -3.3411865234375, -3.036376953125, -2.7315673828125, -2.4267578125, -2.1219482421875, -1.817138671875, -1.5123291015625, -1.20751953125, -0.9027099609375, -0.597900390625, -0.2930908203125, 0.01171875, 0.3165283203125, 0.621337890625, 0.9261474609375, 1.23095703125, 1.5357666015625, 1.840576171875, 2.1453857421875, 2.4501953125, 2.7550048828125, 3.059814453125, 3.3646240234375, 3.66943359375, 3.9742431640625, 4.279052734375, 4.5838623046875, 4.888671875, 5.1934814453125, 5.498291015625, 5.8031005859375, 6.10791015625, 6.4127197265625, 6.717529296875, 7.0223388671875, 7.3271484375, 7.6319580078125, 7.936767578125, 8.2415771484375, 8.54638671875, 8.8511962890625, 9.156005859375, 9.4608154296875, 9.765625]}, "gradients/decoder.bert.encoder.layer.18.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 4.0, 3.0, 6.0, 3.0, 5.0, 9.0, 16.0, 16.0, 17.0, 17.0, 18.0, 29.0, 21.0, 22.0, 34.0, 27.0, 28.0, 38.0, 38.0, 44.0, 43.0, 42.0, 42.0, 40.0, 42.0, 44.0, 49.0, 30.0, 35.0, 34.0, 20.0, 25.0, 19.0, 20.0, 24.0, 23.0, 16.0, 13.0, 13.0, 9.0, 7.0, 7.0, 6.0, 2.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.2265625, -7.9808349609375, -7.735107421875, -7.4893798828125, -7.24365234375, -6.9979248046875, -6.752197265625, -6.5064697265625, -6.2607421875, -6.0150146484375, -5.769287109375, -5.5235595703125, -5.27783203125, -5.0321044921875, -4.786376953125, -4.5406494140625, -4.294921875, -4.0491943359375, -3.803466796875, -3.5577392578125, -3.31201171875, -3.0662841796875, -2.820556640625, -2.5748291015625, -2.3291015625, -2.0833740234375, -1.837646484375, -1.5919189453125, -1.34619140625, -1.1004638671875, -0.854736328125, -0.6090087890625, -0.36328125, -0.1175537109375, 0.128173828125, 0.3739013671875, 0.61962890625, 0.8653564453125, 1.111083984375, 1.3568115234375, 1.6025390625, 1.8482666015625, 2.093994140625, 2.3397216796875, 2.58544921875, 2.8311767578125, 3.076904296875, 3.3226318359375, 3.568359375, 3.8140869140625, 4.059814453125, 4.3055419921875, 4.55126953125, 4.7969970703125, 5.042724609375, 5.2884521484375, 5.5341796875, 5.7799072265625, 6.025634765625, 6.2713623046875, 6.51708984375, 6.7628173828125, 7.008544921875, 7.2542724609375, 7.5]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 1.0, 4.0, 6.0, 12.0, 24.0, 31.0, 46.0, 78.0, 116.0, 199.0, 328.0, 492.0, 792.0, 1213.0, 1997.0, 3270.0, 5140.0, 8461.0, 13758.0, 22646.0, 37247.0, 61107.0, 99972.0, 163865.0, 259345.0, 388466.0, 525772.0, 614568.0, 592757.0, 478161.0, 339451.0, 220662.0, 138223.0, 84080.0, 51293.0, 30998.0, 18802.0, 11762.0, 7135.0, 4418.0, 2828.0, 1728.0, 1131.0, 683.0, 455.0, 307.0, 165.0, 121.0, 67.0, 37.0, 30.0, 20.0, 7.0, 6.0, 3.0, 6.0, 2.0, 2.0, 1.0, 1.0], "bins": [-7.01953125, -6.7989501953125, -6.578369140625, -6.3577880859375, -6.13720703125, -5.9166259765625, -5.696044921875, -5.4754638671875, -5.2548828125, -5.0343017578125, -4.813720703125, -4.5931396484375, -4.37255859375, -4.1519775390625, -3.931396484375, -3.7108154296875, -3.490234375, -3.2696533203125, -3.049072265625, -2.8284912109375, -2.60791015625, -2.3873291015625, -2.166748046875, -1.9461669921875, -1.7255859375, -1.5050048828125, -1.284423828125, -1.0638427734375, -0.84326171875, -0.6226806640625, -0.402099609375, -0.1815185546875, 0.0390625, 0.2596435546875, 0.480224609375, 0.7008056640625, 0.92138671875, 1.1419677734375, 1.362548828125, 1.5831298828125, 1.8037109375, 2.0242919921875, 2.244873046875, 2.4654541015625, 2.68603515625, 2.9066162109375, 3.127197265625, 3.3477783203125, 3.568359375, 3.7889404296875, 4.009521484375, 4.2301025390625, 4.45068359375, 4.6712646484375, 4.891845703125, 5.1124267578125, 5.3330078125, 5.5535888671875, 5.774169921875, 5.9947509765625, 6.21533203125, 6.4359130859375, 6.656494140625, 6.8770751953125, 7.09765625]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 7.0, 2.0, 11.0, 5.0, 8.0, 9.0, 22.0, 13.0, 35.0, 27.0, 37.0, 37.0, 60.0, 82.0, 80.0, 82.0, 107.0, 107.0, 154.0, 149.0, 157.0, 160.0, 187.0, 207.0, 176.0, 201.0, 213.0, 188.0, 201.0, 186.0, 140.0, 160.0, 125.0, 104.0, 91.0, 101.0, 76.0, 72.0, 55.0, 49.0, 42.0, 33.0, 26.0, 18.0, 20.0, 17.0, 9.0, 13.0, 9.0, 4.0, 8.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.984375, -2.881256103515625, -2.77813720703125, -2.675018310546875, -2.5718994140625, -2.468780517578125, -2.36566162109375, -2.262542724609375, -2.159423828125, -2.056304931640625, -1.95318603515625, -1.850067138671875, -1.7469482421875, -1.643829345703125, -1.54071044921875, -1.437591552734375, -1.33447265625, -1.231353759765625, -1.12823486328125, -1.025115966796875, -0.9219970703125, -0.818878173828125, -0.71575927734375, -0.612640380859375, -0.509521484375, -0.406402587890625, -0.30328369140625, -0.200164794921875, -0.0970458984375, 0.006072998046875, 0.10919189453125, 0.212310791015625, 0.3154296875, 0.418548583984375, 0.52166748046875, 0.624786376953125, 0.7279052734375, 0.831024169921875, 0.93414306640625, 1.037261962890625, 1.140380859375, 1.243499755859375, 1.34661865234375, 1.449737548828125, 1.5528564453125, 1.655975341796875, 1.75909423828125, 1.862213134765625, 1.96533203125, 2.068450927734375, 2.17156982421875, 2.274688720703125, 2.3778076171875, 2.480926513671875, 2.58404541015625, 2.687164306640625, 2.790283203125, 2.893402099609375, 2.99652099609375, 3.099639892578125, 3.2027587890625, 3.305877685546875, 3.40899658203125, 3.512115478515625, 3.615234375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 2.0, 5.0, 4.0, 2.0, 6.0, 7.0, 9.0, 14.0, 12.0, 12.0, 14.0, 28.0, 21.0, 34.0, 32.0, 41.0, 35.0, 47.0, 58.0, 62.0, 59.0, 46.0, 58.0, 43.0, 41.0, 54.0, 39.0, 30.0, 36.0, 22.0, 25.0, 15.0, 20.0, 12.0, 17.0, 13.0, 7.0, 4.0, 6.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-8.599434852600098, -8.331212043762207, -8.062989234924316, -7.794765949249268, -7.526543140411377, -7.258320331573486, -6.9900970458984375, -6.721874237060547, -6.453651428222656, -6.185428619384766, -5.917205810546875, -5.648982524871826, -5.3807597160339355, -5.112536907196045, -4.844313621520996, -4.5760908126831055, -4.307868003845215, -4.039645195007324, -3.7714221477508545, -3.5031991004943848, -3.234976291656494, -2.9667534828186035, -2.698530435562134, -2.430307388305664, -2.1620845794677734, -1.8938616514205933, -1.625638723373413, -1.357415795326233, -1.0891928672790527, -0.8209699392318726, -0.5527470111846924, -0.2845240831375122, -0.01630115509033203, 0.25192177295684814, 0.5201447010040283, 0.7883676290512085, 1.0565905570983887, 1.3248134851455688, 1.593036413192749, 1.8612593412399292, 2.1294822692871094, 2.397705078125, 2.6659281253814697, 2.9341511726379395, 3.20237398147583, 3.4705967903137207, 3.7388198375701904, 4.00704288482666, 4.275265693664551, 4.543488502502441, 4.811711311340332, 5.079934597015381, 5.3481574058532715, 5.616380214691162, 5.884603500366211, 6.152826309204102, 6.421049118041992, 6.689271926879883, 6.957494735717773, 7.225718021392822, 7.493940830230713, 7.7621636390686035, 8.030386924743652, 8.298609733581543, 8.566832542419434]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 10.0, 3.0, 3.0, 10.0, 10.0, 8.0, 8.0, 15.0, 14.0, 22.0, 16.0, 27.0, 18.0, 24.0, 37.0, 34.0, 32.0, 22.0, 33.0, 36.0, 38.0, 36.0, 40.0, 37.0, 39.0, 45.0, 37.0, 43.0, 38.0, 27.0, 33.0, 41.0, 19.0, 18.0, 23.0, 15.0, 16.0, 10.0, 18.0, 10.0, 9.0, 11.0, 7.0, 5.0, 3.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.347528457641602, -9.035837173461914, -8.72414493560791, -8.412453651428223, -8.100761413574219, -7.789069652557373, -7.477377891540527, -7.16568660736084, -6.853994369506836, -6.54230260848999, -6.2306108474731445, -5.918919086456299, -5.607227325439453, -5.295535564422607, -4.983843803405762, -4.672152519226074, -4.3604607582092285, -4.048768997192383, -3.737077236175537, -3.4253854751586914, -3.1136937141418457, -2.802001953125, -2.4903104305267334, -2.1786186695098877, -1.866926908493042, -1.5552351474761963, -1.2435433864593506, -0.9318517446517944, -0.6201599836349487, -0.308468222618103, 0.003223419189453125, 0.31491518020629883, 0.6266069412231445, 0.9382987022399902, 1.249990463256836, 1.561682105064392, 1.8733738660812378, 2.185065746307373, 2.4967572689056396, 2.8084490299224854, 3.120140790939331, 3.4318325519561768, 3.7435243129730225, 4.055215835571289, 4.366907596588135, 4.6785993576049805, 4.990291118621826, 5.301982879638672, 5.613674640655518, 5.925366401672363, 6.237058162689209, 6.548749923706055, 6.8604416847229, 7.172133445739746, 7.483824729919434, 7.7955169677734375, 8.107208251953125, 8.418899536132812, 8.730591773986816, 9.042283058166504, 9.353975296020508, 9.665666580200195, 9.9773588180542, 10.289050102233887, 10.60074234008789]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 10.0, 9.0, 11.0, 23.0, 41.0, 40.0, 80.0, 115.0, 195.0, 328.0, 466.0, 727.0, 1244.0, 1936.0, 3149.0, 5017.0, 8122.0, 13206.0, 21290.0, 35243.0, 56929.0, 90949.0, 138832.0, 184731.0, 169412.0, 118350.0, 75677.0, 47255.0, 29016.0, 17746.0, 10959.0, 6591.0, 3966.0, 2574.0, 1558.0, 979.0, 671.0, 366.0, 288.0, 159.0, 91.0, 67.0, 50.0, 31.0, 19.0, 16.0, 7.0, 5.0, 3.0, 5.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.84375, -1.7838897705078125, -1.724029541015625, -1.6641693115234375, -1.60430908203125, -1.5444488525390625, -1.484588623046875, -1.4247283935546875, -1.3648681640625, -1.3050079345703125, -1.245147705078125, -1.1852874755859375, -1.12542724609375, -1.0655670166015625, -1.005706787109375, -0.9458465576171875, -0.885986328125, -0.8261260986328125, -0.766265869140625, -0.7064056396484375, -0.64654541015625, -0.5866851806640625, -0.526824951171875, -0.4669647216796875, -0.4071044921875, -0.3472442626953125, -0.287384033203125, -0.2275238037109375, -0.16766357421875, -0.1078033447265625, -0.047943115234375, 0.0119171142578125, 0.07177734375, 0.1316375732421875, 0.191497802734375, 0.2513580322265625, 0.31121826171875, 0.3710784912109375, 0.430938720703125, 0.4907989501953125, 0.5506591796875, 0.6105194091796875, 0.670379638671875, 0.7302398681640625, 0.79010009765625, 0.8499603271484375, 0.909820556640625, 0.9696807861328125, 1.029541015625, 1.0894012451171875, 1.149261474609375, 1.2091217041015625, 1.26898193359375, 1.3288421630859375, 1.388702392578125, 1.4485626220703125, 1.5084228515625, 1.5682830810546875, 1.628143310546875, 1.6880035400390625, 1.74786376953125, 1.8077239990234375, 1.867584228515625, 1.9274444580078125, 1.9873046875]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 7.0, 2.0, 8.0, 9.0, 4.0, 10.0, 13.0, 9.0, 10.0, 21.0, 25.0, 18.0, 26.0, 32.0, 16.0, 31.0, 36.0, 34.0, 42.0, 40.0, 44.0, 34.0, 40.0, 46.0, 32.0, 43.0, 42.0, 43.0, 34.0, 35.0, 30.0, 30.0, 24.0, 21.0, 16.0, 14.0, 15.0, 17.0, 17.0, 9.0, 9.0, 7.0, 4.0, 3.0, 2.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.5234375, -9.192138671875, -8.86083984375, -8.529541015625, -8.1982421875, -7.866943359375, -7.53564453125, -7.204345703125, -6.873046875, -6.541748046875, -6.21044921875, -5.879150390625, -5.5478515625, -5.216552734375, -4.88525390625, -4.553955078125, -4.22265625, -3.891357421875, -3.56005859375, -3.228759765625, -2.8974609375, -2.566162109375, -2.23486328125, -1.903564453125, -1.572265625, -1.240966796875, -0.90966796875, -0.578369140625, -0.2470703125, 0.084228515625, 0.41552734375, 0.746826171875, 1.078125, 1.409423828125, 1.74072265625, 2.072021484375, 2.4033203125, 2.734619140625, 3.06591796875, 3.397216796875, 3.728515625, 4.059814453125, 4.39111328125, 4.722412109375, 5.0537109375, 5.385009765625, 5.71630859375, 6.047607421875, 6.37890625, 6.710205078125, 7.04150390625, 7.372802734375, 7.7041015625, 8.035400390625, 8.36669921875, 8.697998046875, 9.029296875, 9.360595703125, 9.69189453125, 10.023193359375, 10.3544921875, 10.685791015625, 11.01708984375, 11.348388671875, 11.6796875]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 7.0, 4.0, 11.0, 10.0, 10.0, 19.0, 24.0, 40.0, 50.0, 84.0, 140.0, 197.0, 291.0, 464.0, 771.0, 1169.0, 2001.0, 3201.0, 5328.0, 8623.0, 14425.0, 24431.0, 40634.0, 68340.0, 112218.0, 171208.0, 201726.0, 151487.0, 96372.0, 58104.0, 34948.0, 20778.0, 12237.0, 7471.0, 4439.0, 2694.0, 1657.0, 1055.0, 629.0, 425.0, 285.0, 171.0, 137.0, 76.0, 58.0, 32.0, 29.0, 15.0, 14.0, 7.0, 6.0, 3.0, 5.0, 1.0, 3.0, 1.0, 3.0], "bins": [-1.697265625, -1.6463623046875, -1.595458984375, -1.5445556640625, -1.49365234375, -1.4427490234375, -1.391845703125, -1.3409423828125, -1.2900390625, -1.2391357421875, -1.188232421875, -1.1373291015625, -1.08642578125, -1.0355224609375, -0.984619140625, -0.9337158203125, -0.8828125, -0.8319091796875, -0.781005859375, -0.7301025390625, -0.67919921875, -0.6282958984375, -0.577392578125, -0.5264892578125, -0.4755859375, -0.4246826171875, -0.373779296875, -0.3228759765625, -0.27197265625, -0.2210693359375, -0.170166015625, -0.1192626953125, -0.068359375, -0.0174560546875, 0.033447265625, 0.0843505859375, 0.13525390625, 0.1861572265625, 0.237060546875, 0.2879638671875, 0.3388671875, 0.3897705078125, 0.440673828125, 0.4915771484375, 0.54248046875, 0.5933837890625, 0.644287109375, 0.6951904296875, 0.74609375, 0.7969970703125, 0.847900390625, 0.8988037109375, 0.94970703125, 1.0006103515625, 1.051513671875, 1.1024169921875, 1.1533203125, 1.2042236328125, 1.255126953125, 1.3060302734375, 1.35693359375, 1.4078369140625, 1.458740234375, 1.5096435546875, 1.560546875]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 4.0, 5.0, 5.0, 6.0, 8.0, 9.0, 14.0, 16.0, 18.0, 22.0, 18.0, 27.0, 25.0, 30.0, 27.0, 25.0, 45.0, 40.0, 43.0, 43.0, 40.0, 41.0, 32.0, 47.0, 41.0, 36.0, 30.0, 22.0, 42.0, 30.0, 38.0, 17.0, 17.0, 22.0, 16.0, 16.0, 20.0, 6.0, 7.0, 12.0, 8.0, 7.0, 7.0, 5.0, 5.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.69140625, -6.4920654296875, -6.292724609375, -6.0933837890625, -5.89404296875, -5.6947021484375, -5.495361328125, -5.2960205078125, -5.0966796875, -4.8973388671875, -4.697998046875, -4.4986572265625, -4.29931640625, -4.0999755859375, -3.900634765625, -3.7012939453125, -3.501953125, -3.3026123046875, -3.103271484375, -2.9039306640625, -2.70458984375, -2.5052490234375, -2.305908203125, -2.1065673828125, -1.9072265625, -1.7078857421875, -1.508544921875, -1.3092041015625, -1.10986328125, -0.9105224609375, -0.711181640625, -0.5118408203125, -0.3125, -0.1131591796875, 0.086181640625, 0.2855224609375, 0.48486328125, 0.6842041015625, 0.883544921875, 1.0828857421875, 1.2822265625, 1.4815673828125, 1.680908203125, 1.8802490234375, 2.07958984375, 2.2789306640625, 2.478271484375, 2.6776123046875, 2.876953125, 3.0762939453125, 3.275634765625, 3.4749755859375, 3.67431640625, 3.8736572265625, 4.072998046875, 4.2723388671875, 4.4716796875, 4.6710205078125, 4.870361328125, 5.0697021484375, 5.26904296875, 5.4683837890625, 5.667724609375, 5.8670654296875, 6.06640625]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 7.0, 8.0, 7.0, 20.0, 15.0, 12.0, 25.0, 31.0, 54.0, 82.0, 133.0, 204.0, 283.0, 494.0, 835.0, 1541.0, 2979.0, 6429.0, 14211.0, 34080.0, 97588.0, 324571.0, 379464.0, 115882.0, 39409.0, 16001.0, 6976.0, 3265.0, 1556.0, 944.0, 476.0, 349.0, 201.0, 132.0, 79.0, 70.0, 30.0, 21.0, 24.0, 21.0, 12.0, 13.0, 10.0, 5.0, 2.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.386962890625, -0.3752632141113281, -0.36356353759765625, -0.3518638610839844, -0.3401641845703125, -0.3284645080566406, -0.31676483154296875, -0.3050651550292969, -0.293365478515625, -0.2816658020019531, -0.26996612548828125, -0.2582664489746094, -0.2465667724609375, -0.23486709594726562, -0.22316741943359375, -0.21146774291992188, -0.19976806640625, -0.18806838989257812, -0.17636871337890625, -0.16466903686523438, -0.1529693603515625, -0.14126968383789062, -0.12957000732421875, -0.11787033081054688, -0.106170654296875, -0.09447097778320312, -0.08277130126953125, -0.07107162475585938, -0.0593719482421875, -0.047672271728515625, -0.03597259521484375, -0.024272918701171875, -0.0125732421875, -0.000873565673828125, 0.01082611083984375, 0.022525787353515625, 0.0342254638671875, 0.045925140380859375, 0.05762481689453125, 0.06932449340820312, 0.081024169921875, 0.09272384643554688, 0.10442352294921875, 0.11612319946289062, 0.1278228759765625, 0.13952255249023438, 0.15122222900390625, 0.16292190551757812, 0.17462158203125, 0.18632125854492188, 0.19802093505859375, 0.20972061157226562, 0.2214202880859375, 0.23311996459960938, 0.24481964111328125, 0.2565193176269531, 0.268218994140625, 0.2799186706542969, 0.29161834716796875, 0.3033180236816406, 0.3150177001953125, 0.3267173767089844, 0.33841705322265625, 0.3501167297363281, 0.36181640625]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 8.0, 3.0, 5.0, 6.0, 11.0, 11.0, 17.0, 32.0, 34.0, 41.0, 63.0, 84.0, 101.0, 116.0, 100.0, 114.0, 63.0, 47.0, 38.0, 17.0, 16.0, 20.0, 15.0, 10.0, 5.0, 8.0, 4.0, 7.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-6.4849853515625e-05, -6.320886313915253e-05, -6.156787276268005e-05, -5.992688238620758e-05, -5.828589200973511e-05, -5.6644901633262634e-05, -5.500391125679016e-05, -5.336292088031769e-05, -5.1721930503845215e-05, -5.008094012737274e-05, -4.843994975090027e-05, -4.6798959374427795e-05, -4.515796899795532e-05, -4.351697862148285e-05, -4.1875988245010376e-05, -4.02349978685379e-05, -3.859400749206543e-05, -3.6953017115592957e-05, -3.5312026739120483e-05, -3.367103636264801e-05, -3.203004598617554e-05, -3.0389055609703064e-05, -2.874806523323059e-05, -2.7107074856758118e-05, -2.5466084480285645e-05, -2.382509410381317e-05, -2.2184103727340698e-05, -2.0543113350868225e-05, -1.8902122974395752e-05, -1.726113259792328e-05, -1.5620142221450806e-05, -1.3979151844978333e-05, -1.233816146850586e-05, -1.0697171092033386e-05, -9.056180715560913e-06, -7.41519033908844e-06, -5.774199962615967e-06, -4.133209586143494e-06, -2.4922192096710205e-06, -8.512288331985474e-07, 7.897615432739258e-07, 2.430751919746399e-06, 4.071742296218872e-06, 5.712732672691345e-06, 7.353723049163818e-06, 8.994713425636292e-06, 1.0635703802108765e-05, 1.2276694178581238e-05, 1.3917684555053711e-05, 1.5558674931526184e-05, 1.7199665307998657e-05, 1.884065568447113e-05, 2.0481646060943604e-05, 2.2122636437416077e-05, 2.376362681388855e-05, 2.5404617190361023e-05, 2.7045607566833496e-05, 2.868659794330597e-05, 3.0327588319778442e-05, 3.1968578696250916e-05, 3.360956907272339e-05, 3.525055944919586e-05, 3.6891549825668335e-05, 3.853254020214081e-05, 4.017353057861328e-05]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 1.0, 5.0, 5.0, 11.0, 9.0, 16.0, 24.0, 37.0, 49.0, 87.0, 122.0, 197.0, 334.0, 502.0, 838.0, 1351.0, 2253.0, 4041.0, 7280.0, 13713.0, 26597.0, 56291.0, 128222.0, 308167.0, 280293.0, 114509.0, 50589.0, 24397.0, 12460.0, 6806.0, 3805.0, 2200.0, 1294.0, 786.0, 459.0, 267.0, 182.0, 129.0, 87.0, 42.0, 37.0, 29.0, 18.0, 9.0, 7.0, 5.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4208984375, -0.4077186584472656, -0.39453887939453125, -0.3813591003417969, -0.3681793212890625, -0.3549995422363281, -0.34181976318359375, -0.3286399841308594, -0.315460205078125, -0.3022804260253906, -0.28910064697265625, -0.2759208679199219, -0.2627410888671875, -0.24956130981445312, -0.23638153076171875, -0.22320175170898438, -0.21002197265625, -0.19684219360351562, -0.18366241455078125, -0.17048263549804688, -0.1573028564453125, -0.14412307739257812, -0.13094329833984375, -0.11776351928710938, -0.104583740234375, -0.09140396118164062, -0.07822418212890625, -0.06504440307617188, -0.0518646240234375, -0.038684844970703125, -0.02550506591796875, -0.012325286865234375, 0.0008544921875, 0.014034271240234375, 0.02721405029296875, 0.040393829345703125, 0.0535736083984375, 0.06675338745117188, 0.07993316650390625, 0.09311294555664062, 0.106292724609375, 0.11947250366210938, 0.13265228271484375, 0.14583206176757812, 0.1590118408203125, 0.17219161987304688, 0.18537139892578125, 0.19855117797851562, 0.21173095703125, 0.22491073608398438, 0.23809051513671875, 0.2512702941894531, 0.2644500732421875, 0.2776298522949219, 0.29080963134765625, 0.3039894104003906, 0.317169189453125, 0.3303489685058594, 0.34352874755859375, 0.3567085266113281, 0.3698883056640625, 0.3830680847167969, 0.39624786376953125, 0.4094276428222656, 0.422607421875]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 3.0, 4.0, 6.0, 6.0, 3.0, 9.0, 13.0, 16.0, 29.0, 29.0, 54.0, 64.0, 90.0, 89.0, 97.0, 95.0, 74.0, 82.0, 66.0, 44.0, 36.0, 20.0, 19.0, 10.0, 10.0, 6.0, 10.0, 1.0, 3.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.166748046875, -0.16234207153320312, -0.15793609619140625, -0.15353012084960938, -0.1491241455078125, -0.14471817016601562, -0.14031219482421875, -0.13590621948242188, -0.131500244140625, -0.12709426879882812, -0.12268829345703125, -0.11828231811523438, -0.1138763427734375, -0.10947036743164062, -0.10506439208984375, -0.10065841674804688, -0.09625244140625, -0.09184646606445312, -0.08744049072265625, -0.08303451538085938, -0.0786285400390625, -0.07422256469726562, -0.06981658935546875, -0.06541061401367188, -0.061004638671875, -0.056598663330078125, -0.05219268798828125, -0.047786712646484375, -0.0433807373046875, -0.038974761962890625, -0.03456878662109375, -0.030162811279296875, -0.0257568359375, -0.021350860595703125, -0.01694488525390625, -0.012538909912109375, -0.0081329345703125, -0.003726959228515625, 0.00067901611328125, 0.005084991455078125, 0.009490966796875, 0.013896942138671875, 0.01830291748046875, 0.022708892822265625, 0.0271148681640625, 0.031520843505859375, 0.03592681884765625, 0.040332794189453125, 0.04473876953125, 0.049144744873046875, 0.05355072021484375, 0.057956695556640625, 0.0623626708984375, 0.06676864624023438, 0.07117462158203125, 0.07558059692382812, 0.079986572265625, 0.08439254760742188, 0.08879852294921875, 0.09320449829101562, 0.0976104736328125, 0.10201644897460938, 0.10642242431640625, 0.11082839965820312, 0.115234375]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 6.0, 2.0, 0.0, 2.0, 3.0, 7.0, 2.0, 6.0, 8.0, 8.0, 6.0, 17.0, 14.0, 19.0, 21.0, 21.0, 35.0, 34.0, 36.0, 37.0, 47.0, 53.0, 66.0, 63.0, 53.0, 53.0, 45.0, 47.0, 45.0, 42.0, 39.0, 28.0, 22.0, 23.0, 18.0, 15.0, 17.0, 12.0, 11.0, 12.0, 4.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-8.68140983581543, -8.410303115844727, -8.139195442199707, -7.868088722229004, -7.596982002258301, -7.3258748054504395, -7.054767608642578, -6.783660888671875, -6.512553691864014, -6.241446495056152, -5.970339775085449, -5.699232578277588, -5.428125381469727, -5.157018661499023, -4.885911464691162, -4.614804267883301, -4.343697547912598, -4.072590351104736, -3.801483631134033, -3.530376434326172, -3.2592694759368896, -2.9881625175476074, -2.717055320739746, -2.445948362350464, -2.1748414039611816, -1.9037344455718994, -1.6326273679733276, -1.3615202903747559, -1.0904133319854736, -0.8193063735961914, -0.5481992959976196, -0.27709221839904785, -0.005984306335449219, 0.2651227116584778, 0.5362297296524048, 0.8073367476463318, 1.0784437656402588, 1.349550724029541, 1.6206578016281128, 1.8917648792266846, 2.162871837615967, 2.433978796005249, 2.7050857543945312, 2.9761929512023926, 3.247299909591675, 3.518406867980957, 3.7895140647888184, 4.06062126159668, 4.331727981567383, 4.602835178375244, 4.873941898345947, 5.145049095153809, 5.416155815124512, 5.687263011932373, 5.958370208740234, 6.2294769287109375, 6.500584125518799, 6.77169132232666, 7.042798042297363, 7.313905239105225, 7.585012435913086, 7.856119155883789, 8.127225875854492, 8.398333549499512, 8.669440269470215]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 6.0, 7.0, 2.0, 5.0, 10.0, 10.0, 8.0, 8.0, 13.0, 17.0, 21.0, 18.0, 27.0, 19.0, 24.0, 36.0, 33.0, 33.0, 22.0, 36.0, 33.0, 40.0, 36.0, 41.0, 39.0, 36.0, 47.0, 31.0, 46.0, 37.0, 27.0, 32.0, 42.0, 18.0, 18.0, 21.0, 17.0, 14.0, 10.0, 19.0, 8.0, 9.0, 11.0, 7.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.179637908935547, -8.87120246887207, -8.562767028808594, -8.254332542419434, -7.945897102355957, -7.6374616622924805, -7.329026699066162, -7.020591735839844, -6.712156295776367, -6.403720855712891, -6.095285892486572, -5.786850929260254, -5.478415489196777, -5.169980049133301, -4.861545085906982, -4.553110122680664, -4.2446746826171875, -3.93623948097229, -3.6278042793273926, -3.319369077682495, -3.0109338760375977, -2.7024986743927, -2.3940634727478027, -2.0856282711029053, -1.7771930694580078, -1.4687578678131104, -1.160322666168213, -0.8518874645233154, -0.543452262878418, -0.2350170612335205, 0.07341814041137695, 0.3818533420562744, 0.6902875900268555, 0.9987227916717529, 1.3071579933166504, 1.6155931949615479, 1.9240283966064453, 2.2324635982513428, 2.5408987998962402, 2.8493340015411377, 3.157769203186035, 3.4662044048309326, 3.77463960647583, 4.083074569702148, 4.391510009765625, 4.699945449829102, 5.00838041305542, 5.316815376281738, 5.625250816345215, 5.933686256408691, 6.24212121963501, 6.550556182861328, 6.858991622924805, 7.167427062988281, 7.4758620262146, 7.784296989440918, 8.092732429504395, 8.401167869567871, 8.709602355957031, 9.018037796020508, 9.326473236083984, 9.634908676147461, 9.943344116210938, 10.251778602600098, 10.560214042663574]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 7.0, 4.0, 10.0, 18.0, 40.0, 48.0, 86.0, 169.0, 205.0, 371.0, 638.0, 918.0, 1480.0, 2359.0, 3676.0, 5650.0, 9181.0, 14779.0, 23596.0, 36459.0, 56423.0, 82126.0, 112294.0, 135122.0, 140816.0, 126210.0, 98014.0, 70267.0, 46293.0, 30131.0, 19100.0, 11816.0, 7394.0, 4756.0, 3022.0, 1901.0, 1215.0, 783.0, 451.0, 279.0, 170.0, 93.0, 72.0, 49.0, 19.0, 27.0, 11.0, 6.0, 7.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.421875, -8.1761474609375, -7.930419921875, -7.6846923828125, -7.43896484375, -7.1932373046875, -6.947509765625, -6.7017822265625, -6.4560546875, -6.2103271484375, -5.964599609375, -5.7188720703125, -5.47314453125, -5.2274169921875, -4.981689453125, -4.7359619140625, -4.490234375, -4.2445068359375, -3.998779296875, -3.7530517578125, -3.50732421875, -3.2615966796875, -3.015869140625, -2.7701416015625, -2.5244140625, -2.2786865234375, -2.032958984375, -1.7872314453125, -1.54150390625, -1.2957763671875, -1.050048828125, -0.8043212890625, -0.55859375, -0.3128662109375, -0.067138671875, 0.1785888671875, 0.42431640625, 0.6700439453125, 0.915771484375, 1.1614990234375, 1.4072265625, 1.6529541015625, 1.898681640625, 2.1444091796875, 2.39013671875, 2.6358642578125, 2.881591796875, 3.1273193359375, 3.373046875, 3.6187744140625, 3.864501953125, 4.1102294921875, 4.35595703125, 4.6016845703125, 4.847412109375, 5.0931396484375, 5.3388671875, 5.5845947265625, 5.830322265625, 6.0760498046875, 6.32177734375, 6.5675048828125, 6.813232421875, 7.0589599609375, 7.3046875]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 6.0, 1.0, 8.0, 7.0, 12.0, 6.0, 1.0, 9.0, 12.0, 19.0, 15.0, 28.0, 28.0, 24.0, 34.0, 34.0, 36.0, 20.0, 22.0, 40.0, 37.0, 37.0, 37.0, 44.0, 29.0, 42.0, 28.0, 44.0, 40.0, 43.0, 38.0, 28.0, 30.0, 26.0, 18.0, 21.0, 17.0, 17.0, 7.0, 11.0, 14.0, 9.0, 8.0, 5.0, 4.0, 3.0, 5.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.859375, -8.5595703125, -8.259765625, -7.9599609375, -7.66015625, -7.3603515625, -7.060546875, -6.7607421875, -6.4609375, -6.1611328125, -5.861328125, -5.5615234375, -5.26171875, -4.9619140625, -4.662109375, -4.3623046875, -4.0625, -3.7626953125, -3.462890625, -3.1630859375, -2.86328125, -2.5634765625, -2.263671875, -1.9638671875, -1.6640625, -1.3642578125, -1.064453125, -0.7646484375, -0.46484375, -0.1650390625, 0.134765625, 0.4345703125, 0.734375, 1.0341796875, 1.333984375, 1.6337890625, 1.93359375, 2.2333984375, 2.533203125, 2.8330078125, 3.1328125, 3.4326171875, 3.732421875, 4.0322265625, 4.33203125, 4.6318359375, 4.931640625, 5.2314453125, 5.53125, 5.8310546875, 6.130859375, 6.4306640625, 6.73046875, 7.0302734375, 7.330078125, 7.6298828125, 7.9296875, 8.2294921875, 8.529296875, 8.8291015625, 9.12890625, 9.4287109375, 9.728515625, 10.0283203125, 10.328125]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 5.0, 6.0, 8.0, 10.0, 21.0, 15.0, 26.0, 38.0, 79.0, 105.0, 185.0, 321.0, 486.0, 777.0, 1384.0, 2349.0, 4173.0, 7307.0, 12930.0, 23180.0, 41060.0, 71104.0, 113688.0, 159367.0, 178590.0, 157069.0, 112044.0, 69558.0, 40426.0, 22584.0, 12626.0, 7066.0, 4167.0, 2309.0, 1356.0, 834.0, 481.0, 296.0, 215.0, 115.0, 78.0, 36.0, 31.0, 29.0, 14.0, 3.0, 5.0, 2.0, 1.0, 2.0, 3.0, 3.0, 0.0, 1.0], "bins": [-10.640625, -10.33203125, -10.0234375, -9.71484375, -9.40625, -9.09765625, -8.7890625, -8.48046875, -8.171875, -7.86328125, -7.5546875, -7.24609375, -6.9375, -6.62890625, -6.3203125, -6.01171875, -5.703125, -5.39453125, -5.0859375, -4.77734375, -4.46875, -4.16015625, -3.8515625, -3.54296875, -3.234375, -2.92578125, -2.6171875, -2.30859375, -2.0, -1.69140625, -1.3828125, -1.07421875, -0.765625, -0.45703125, -0.1484375, 0.16015625, 0.46875, 0.77734375, 1.0859375, 1.39453125, 1.703125, 2.01171875, 2.3203125, 2.62890625, 2.9375, 3.24609375, 3.5546875, 3.86328125, 4.171875, 4.48046875, 4.7890625, 5.09765625, 5.40625, 5.71484375, 6.0234375, 6.33203125, 6.640625, 6.94921875, 7.2578125, 7.56640625, 7.875, 8.18359375, 8.4921875, 8.80078125, 9.109375]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 4.0, 1.0, 8.0, 5.0, 7.0, 9.0, 13.0, 10.0, 13.0, 21.0, 18.0, 16.0, 39.0, 28.0, 40.0, 46.0, 37.0, 39.0, 51.0, 37.0, 54.0, 43.0, 46.0, 46.0, 39.0, 41.0, 28.0, 38.0, 34.0, 35.0, 20.0, 23.0, 23.0, 23.0, 15.0, 12.0, 11.0, 10.0, 8.0, 4.0, 4.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0], "bins": [-8.2890625, -8.06622314453125, -7.8433837890625, -7.62054443359375, -7.397705078125, -7.17486572265625, -6.9520263671875, -6.72918701171875, -6.50634765625, -6.28350830078125, -6.0606689453125, -5.83782958984375, -5.614990234375, -5.39215087890625, -5.1693115234375, -4.94647216796875, -4.7236328125, -4.50079345703125, -4.2779541015625, -4.05511474609375, -3.832275390625, -3.60943603515625, -3.3865966796875, -3.16375732421875, -2.94091796875, -2.71807861328125, -2.4952392578125, -2.27239990234375, -2.049560546875, -1.82672119140625, -1.6038818359375, -1.38104248046875, -1.158203125, -0.93536376953125, -0.7125244140625, -0.48968505859375, -0.266845703125, -0.04400634765625, 0.1788330078125, 0.40167236328125, 0.62451171875, 0.84735107421875, 1.0701904296875, 1.29302978515625, 1.515869140625, 1.73870849609375, 1.9615478515625, 2.18438720703125, 2.4072265625, 2.63006591796875, 2.8529052734375, 3.07574462890625, 3.298583984375, 3.52142333984375, 3.7442626953125, 3.96710205078125, 4.18994140625, 4.41278076171875, 4.6356201171875, 4.85845947265625, 5.081298828125, 5.30413818359375, 5.5269775390625, 5.74981689453125, 5.97265625]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 2.0, 8.0, 10.0, 8.0, 16.0, 24.0, 36.0, 41.0, 71.0, 102.0, 148.0, 241.0, 324.0, 457.0, 718.0, 1048.0, 1705.0, 2437.0, 3922.0, 6152.0, 9880.0, 15514.0, 24588.0, 39365.0, 61798.0, 94589.0, 133430.0, 161112.0, 152358.0, 118034.0, 79559.0, 51887.0, 32744.0, 20761.0, 12809.0, 8109.0, 5129.0, 3245.0, 2066.0, 1367.0, 906.0, 571.0, 406.0, 270.0, 196.0, 116.0, 113.0, 56.0, 42.0, 22.0, 22.0, 6.0, 13.0, 6.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.927734375, -2.832672119140625, -2.73760986328125, -2.642547607421875, -2.5474853515625, -2.452423095703125, -2.35736083984375, -2.262298583984375, -2.167236328125, -2.072174072265625, -1.97711181640625, -1.882049560546875, -1.7869873046875, -1.691925048828125, -1.59686279296875, -1.501800537109375, -1.40673828125, -1.311676025390625, -1.21661376953125, -1.121551513671875, -1.0264892578125, -0.931427001953125, -0.83636474609375, -0.741302490234375, -0.646240234375, -0.551177978515625, -0.45611572265625, -0.361053466796875, -0.2659912109375, -0.170928955078125, -0.07586669921875, 0.019195556640625, 0.1142578125, 0.209320068359375, 0.30438232421875, 0.399444580078125, 0.4945068359375, 0.589569091796875, 0.68463134765625, 0.779693603515625, 0.874755859375, 0.969818115234375, 1.06488037109375, 1.159942626953125, 1.2550048828125, 1.350067138671875, 1.44512939453125, 1.540191650390625, 1.63525390625, 1.730316162109375, 1.82537841796875, 1.920440673828125, 2.0155029296875, 2.110565185546875, 2.20562744140625, 2.300689697265625, 2.395751953125, 2.490814208984375, 2.58587646484375, 2.680938720703125, 2.7760009765625, 2.871063232421875, 2.96612548828125, 3.061187744140625, 3.15625]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 4.0, 6.0, 8.0, 7.0, 14.0, 11.0, 15.0, 17.0, 24.0, 11.0, 38.0, 37.0, 44.0, 52.0, 52.0, 48.0, 59.0, 71.0, 65.0, 66.0, 61.0, 50.0, 41.0, 38.0, 36.0, 34.0, 22.0, 13.0, 15.0, 13.0, 9.0, 6.0, 6.0, 7.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00031495094299316406, -0.00030553340911865234, -0.0002961158752441406, -0.0002866983413696289, -0.0002772808074951172, -0.00026786327362060547, -0.00025844573974609375, -0.00024902820587158203, -0.0002396106719970703, -0.0002301931381225586, -0.00022077560424804688, -0.00021135807037353516, -0.00020194053649902344, -0.00019252300262451172, -0.00018310546875, -0.00017368793487548828, -0.00016427040100097656, -0.00015485286712646484, -0.00014543533325195312, -0.0001360177993774414, -0.0001266002655029297, -0.00011718273162841797, -0.00010776519775390625, -9.834766387939453e-05, -8.893013000488281e-05, -7.95125961303711e-05, -7.009506225585938e-05, -6.0677528381347656e-05, -5.125999450683594e-05, -4.184246063232422e-05, -3.24249267578125e-05, -2.300739288330078e-05, -1.3589859008789062e-05, -4.172325134277344e-06, 5.245208740234375e-06, 1.4662742614746094e-05, 2.4080276489257812e-05, 3.349781036376953e-05, 4.291534423828125e-05, 5.233287811279297e-05, 6.175041198730469e-05, 7.11679458618164e-05, 8.058547973632812e-05, 9.000301361083984e-05, 9.942054748535156e-05, 0.00010883808135986328, 0.000118255615234375, 0.00012767314910888672, 0.00013709068298339844, 0.00014650821685791016, 0.00015592575073242188, 0.0001653432846069336, 0.0001747608184814453, 0.00018417835235595703, 0.00019359588623046875, 0.00020301342010498047, 0.0002124309539794922, 0.0002218484878540039, 0.00023126602172851562, 0.00024068355560302734, 0.00025010108947753906, 0.0002595186233520508, 0.0002689361572265625, 0.0002783536911010742, 0.00028777122497558594]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 4.0, 4.0, 4.0, 4.0, 8.0, 12.0, 11.0, 22.0, 36.0, 32.0, 62.0, 118.0, 140.0, 201.0, 347.0, 498.0, 795.0, 1154.0, 1830.0, 2689.0, 4214.0, 6746.0, 10815.0, 17926.0, 29160.0, 48252.0, 79377.0, 121783.0, 165146.0, 173478.0, 139259.0, 93962.0, 58180.0, 35581.0, 21304.0, 12959.0, 7960.0, 5090.0, 3302.0, 2125.0, 1368.0, 839.0, 564.0, 414.0, 241.0, 179.0, 120.0, 87.0, 54.0, 42.0, 35.0, 10.0, 11.0, 7.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-3.380859375, -3.27581787109375, -3.1707763671875, -3.06573486328125, -2.960693359375, -2.85565185546875, -2.7506103515625, -2.64556884765625, -2.54052734375, -2.43548583984375, -2.3304443359375, -2.22540283203125, -2.120361328125, -2.01531982421875, -1.9102783203125, -1.80523681640625, -1.7001953125, -1.59515380859375, -1.4901123046875, -1.38507080078125, -1.280029296875, -1.17498779296875, -1.0699462890625, -0.96490478515625, -0.85986328125, -0.75482177734375, -0.6497802734375, -0.54473876953125, -0.439697265625, -0.33465576171875, -0.2296142578125, -0.12457275390625, -0.01953125, 0.08551025390625, 0.1905517578125, 0.29559326171875, 0.400634765625, 0.50567626953125, 0.6107177734375, 0.71575927734375, 0.82080078125, 0.92584228515625, 1.0308837890625, 1.13592529296875, 1.240966796875, 1.34600830078125, 1.4510498046875, 1.55609130859375, 1.6611328125, 1.76617431640625, 1.8712158203125, 1.97625732421875, 2.081298828125, 2.18634033203125, 2.2913818359375, 2.39642333984375, 2.50146484375, 2.60650634765625, 2.7115478515625, 2.81658935546875, 2.921630859375, 3.02667236328125, 3.1317138671875, 3.23675537109375, 3.341796875]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 6.0, 2.0, 2.0, 4.0, 2.0, 2.0, 4.0, 8.0, 7.0, 10.0, 7.0, 13.0, 13.0, 16.0, 22.0, 36.0, 33.0, 51.0, 55.0, 40.0, 63.0, 48.0, 62.0, 69.0, 58.0, 62.0, 46.0, 48.0, 44.0, 36.0, 21.0, 19.0, 17.0, 14.0, 9.0, 13.0, 12.0, 6.0, 8.0, 6.0, 8.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.193359375, -1.15032958984375, -1.1072998046875, -1.06427001953125, -1.021240234375, -0.97821044921875, -0.9351806640625, -0.89215087890625, -0.84912109375, -0.80609130859375, -0.7630615234375, -0.72003173828125, -0.677001953125, -0.63397216796875, -0.5909423828125, -0.54791259765625, -0.5048828125, -0.46185302734375, -0.4188232421875, -0.37579345703125, -0.332763671875, -0.28973388671875, -0.2467041015625, -0.20367431640625, -0.16064453125, -0.11761474609375, -0.0745849609375, -0.03155517578125, 0.011474609375, 0.05450439453125, 0.0975341796875, 0.14056396484375, 0.18359375, 0.22662353515625, 0.2696533203125, 0.31268310546875, 0.355712890625, 0.39874267578125, 0.4417724609375, 0.48480224609375, 0.52783203125, 0.57086181640625, 0.6138916015625, 0.65692138671875, 0.699951171875, 0.74298095703125, 0.7860107421875, 0.82904052734375, 0.8720703125, 0.91510009765625, 0.9581298828125, 1.00115966796875, 1.044189453125, 1.08721923828125, 1.1302490234375, 1.17327880859375, 1.21630859375, 1.25933837890625, 1.3023681640625, 1.34539794921875, 1.388427734375, 1.43145751953125, 1.4744873046875, 1.51751708984375, 1.560546875]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 6.0, 5.0, 3.0, 8.0, 13.0, 11.0, 15.0, 18.0, 31.0, 41.0, 36.0, 43.0, 45.0, 53.0, 61.0, 70.0, 73.0, 56.0, 53.0, 58.0, 49.0, 42.0, 44.0, 32.0, 27.0, 23.0, 13.0, 14.0, 13.0, 11.0, 9.0, 2.0, 6.0, 4.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.805140495300293, -10.509845733642578, -10.214550018310547, -9.919255256652832, -9.623960494995117, -9.328664779663086, -9.033370018005371, -8.738075256347656, -8.442779541015625, -8.14748477935791, -7.852189064025879, -7.556894302368164, -7.261599063873291, -6.966303825378418, -6.671009063720703, -6.37571382522583, -6.080418586730957, -5.785123348236084, -5.489828109741211, -5.194533348083496, -4.899238109588623, -4.60394287109375, -4.308648109436035, -4.013352870941162, -3.718057632446289, -3.422762393951416, -3.127467393875122, -2.832172393798828, -2.536877155303955, -2.241581916809082, -1.946286916732788, -1.6509919166564941, -1.3556957244873047, -1.0604006052017212, -0.7651054859161377, -0.4698103666305542, -0.1745152473449707, 0.12077987194061279, 0.4160749912261963, 0.7113699913024902, 1.0066652297973633, 1.3019603490829468, 1.5972554683685303, 1.8925505876541138, 2.1878457069396973, 2.4831409454345703, 2.7784359455108643, 3.073730945587158, 3.3690261840820312, 3.6643214225769043, 3.9596164226531982, 4.254911422729492, 4.550206661224365, 4.845501899719238, 5.140796661376953, 5.436091899871826, 5.731387138366699, 6.026682376861572, 6.321977615356445, 6.61727237701416, 6.912567615509033, 7.207862854003906, 7.503157615661621, 7.798452854156494, 8.093748092651367]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 2.0, 6.0, 8.0, 13.0, 10.0, 9.0, 16.0, 8.0, 25.0, 18.0, 19.0, 20.0, 26.0, 25.0, 24.0, 37.0, 37.0, 32.0, 32.0, 42.0, 49.0, 52.0, 34.0, 44.0, 39.0, 47.0, 25.0, 22.0, 34.0, 33.0, 30.0, 26.0, 29.0, 22.0, 17.0, 11.0, 15.0, 11.0, 11.0, 12.0, 3.0, 6.0, 8.0, 3.0, 4.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-10.377065658569336, -10.06190013885498, -9.746734619140625, -9.431568145751953, -9.116402626037598, -8.801237106323242, -8.486071586608887, -8.170906066894531, -7.855739593505859, -7.540574073791504, -7.22540807723999, -6.910242557525635, -6.595076560974121, -6.279911041259766, -5.96474552154541, -5.6495795249938965, -5.334414005279541, -5.0192484855651855, -4.704082489013672, -4.388916969299316, -4.073750972747803, -3.7585854530334473, -3.4434196949005127, -3.128253936767578, -2.8130881786346436, -2.497922420501709, -2.1827566623687744, -1.8675910234451294, -1.5524252653121948, -1.2372595071792603, -0.9220938682556152, -0.6069281101226807, -0.2917623519897461, 0.02340337634086609, 0.33856910467147827, 0.6537348031997681, 0.9689005613327026, 1.2840663194656372, 1.5992319583892822, 1.9143977165222168, 2.2295634746551514, 2.544729232788086, 2.8598949909210205, 3.175060749053955, 3.4902262687683105, 3.805392265319824, 4.12055778503418, 4.435723304748535, 4.750889301300049, 5.066054821014404, 5.381220817565918, 5.696386337280273, 6.011552333831787, 6.326717853546143, 6.641883850097656, 6.957049369812012, 7.272214889526367, 7.587380409240723, 7.902546405792236, 8.21771240234375, 8.532877922058105, 8.848043441772461, 9.163208961486816, 9.478374481201172, 9.793540954589844]}, "gradients/decoder.bert.encoder.layer.17.output.dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 7.0, 10.0, 11.0, 23.0, 34.0, 58.0, 88.0, 149.0, 218.0, 363.0, 540.0, 931.0, 1450.0, 2411.0, 3813.0, 6216.0, 10334.0, 17531.0, 29059.0, 49611.0, 85329.0, 146680.0, 254453.0, 430671.0, 657698.0, 787348.0, 665296.0, 433115.0, 253285.0, 146607.0, 84765.0, 49659.0, 29585.0, 17830.0, 10850.0, 6775.0, 4304.0, 2562.0, 1589.0, 1061.0, 687.0, 435.0, 328.0, 195.0, 123.0, 82.0, 35.0, 31.0, 19.0, 21.0, 9.0, 6.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.66015625, -6.41802978515625, -6.1759033203125, -5.93377685546875, -5.691650390625, -5.44952392578125, -5.2073974609375, -4.96527099609375, -4.72314453125, -4.48101806640625, -4.2388916015625, -3.99676513671875, -3.754638671875, -3.51251220703125, -3.2703857421875, -3.02825927734375, -2.7861328125, -2.54400634765625, -2.3018798828125, -2.05975341796875, -1.817626953125, -1.57550048828125, -1.3333740234375, -1.09124755859375, -0.84912109375, -0.60699462890625, -0.3648681640625, -0.12274169921875, 0.119384765625, 0.36151123046875, 0.6036376953125, 0.84576416015625, 1.087890625, 1.33001708984375, 1.5721435546875, 1.81427001953125, 2.056396484375, 2.29852294921875, 2.5406494140625, 2.78277587890625, 3.02490234375, 3.26702880859375, 3.5091552734375, 3.75128173828125, 3.993408203125, 4.23553466796875, 4.4776611328125, 4.71978759765625, 4.9619140625, 5.20404052734375, 5.4461669921875, 5.68829345703125, 5.930419921875, 6.17254638671875, 6.4146728515625, 6.65679931640625, 6.89892578125, 7.14105224609375, 7.3831787109375, 7.62530517578125, 7.867431640625, 8.10955810546875, 8.3516845703125, 8.59381103515625, 8.8359375]}, "gradients/decoder.bert.encoder.layer.17.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 2.0, 5.0, 3.0, 7.0, 11.0, 6.0, 11.0, 16.0, 14.0, 19.0, 21.0, 21.0, 21.0, 28.0, 27.0, 34.0, 33.0, 59.0, 22.0, 39.0, 48.0, 48.0, 46.0, 49.0, 43.0, 34.0, 36.0, 33.0, 37.0, 32.0, 27.0, 29.0, 21.0, 21.0, 19.0, 14.0, 16.0, 13.0, 7.0, 10.0, 4.0, 6.0, 5.0, 2.0, 2.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.4609375, -7.2364501953125, -7.011962890625, -6.7874755859375, -6.56298828125, -6.3385009765625, -6.114013671875, -5.8895263671875, -5.6650390625, -5.4405517578125, -5.216064453125, -4.9915771484375, -4.76708984375, -4.5426025390625, -4.318115234375, -4.0936279296875, -3.869140625, -3.6446533203125, -3.420166015625, -3.1956787109375, -2.97119140625, -2.7467041015625, -2.522216796875, -2.2977294921875, -2.0732421875, -1.8487548828125, -1.624267578125, -1.3997802734375, -1.17529296875, -0.9508056640625, -0.726318359375, -0.5018310546875, -0.27734375, -0.0528564453125, 0.171630859375, 0.3961181640625, 0.62060546875, 0.8450927734375, 1.069580078125, 1.2940673828125, 1.5185546875, 1.7430419921875, 1.967529296875, 2.1920166015625, 2.41650390625, 2.6409912109375, 2.865478515625, 3.0899658203125, 3.314453125, 3.5389404296875, 3.763427734375, 3.9879150390625, 4.21240234375, 4.4368896484375, 4.661376953125, 4.8858642578125, 5.1103515625, 5.3348388671875, 5.559326171875, 5.7838134765625, 6.00830078125, 6.2327880859375, 6.457275390625, 6.6817626953125, 6.90625]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 5.0, 9.0, 14.0, 28.0, 36.0, 62.0, 108.0, 134.0, 248.0, 411.0, 603.0, 959.0, 1459.0, 2325.0, 3830.0, 6100.0, 9773.0, 16266.0, 26614.0, 43914.0, 72314.0, 118787.0, 192869.0, 302755.0, 447645.0, 583119.0, 634840.0, 564947.0, 421986.0, 282485.0, 178267.0, 110023.0, 66877.0, 40159.0, 24750.0, 15137.0, 9214.0, 5696.0, 3542.0, 2223.0, 1373.0, 846.0, 561.0, 332.0, 234.0, 134.0, 106.0, 65.0, 35.0, 32.0, 20.0, 6.0, 9.0, 3.0, 0.0, 1.0, 3.0, 1.0], "bins": [-6.48046875, -6.28057861328125, -6.0806884765625, -5.88079833984375, -5.680908203125, -5.48101806640625, -5.2811279296875, -5.08123779296875, -4.88134765625, -4.68145751953125, -4.4815673828125, -4.28167724609375, -4.081787109375, -3.88189697265625, -3.6820068359375, -3.48211669921875, -3.2822265625, -3.08233642578125, -2.8824462890625, -2.68255615234375, -2.482666015625, -2.28277587890625, -2.0828857421875, -1.88299560546875, -1.68310546875, -1.48321533203125, -1.2833251953125, -1.08343505859375, -0.883544921875, -0.68365478515625, -0.4837646484375, -0.28387451171875, -0.083984375, 0.11590576171875, 0.3157958984375, 0.51568603515625, 0.715576171875, 0.91546630859375, 1.1153564453125, 1.31524658203125, 1.51513671875, 1.71502685546875, 1.9149169921875, 2.11480712890625, 2.314697265625, 2.51458740234375, 2.7144775390625, 2.91436767578125, 3.1142578125, 3.31414794921875, 3.5140380859375, 3.71392822265625, 3.913818359375, 4.11370849609375, 4.3135986328125, 4.51348876953125, 4.71337890625, 4.91326904296875, 5.1131591796875, 5.31304931640625, 5.512939453125, 5.71282958984375, 5.9127197265625, 6.11260986328125, 6.3125]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 10.0, 6.0, 7.0, 21.0, 14.0, 14.0, 32.0, 19.0, 36.0, 33.0, 47.0, 70.0, 74.0, 94.0, 122.0, 110.0, 140.0, 124.0, 146.0, 156.0, 172.0, 197.0, 218.0, 189.0, 173.0, 203.0, 171.0, 165.0, 167.0, 160.0, 151.0, 112.0, 122.0, 101.0, 77.0, 74.0, 65.0, 42.0, 54.0, 42.0, 36.0, 23.0, 13.0, 25.0, 7.0, 6.0, 14.0, 6.0, 2.0, 8.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-2.90234375, -2.80908203125, -2.7158203125, -2.62255859375, -2.529296875, -2.43603515625, -2.3427734375, -2.24951171875, -2.15625, -2.06298828125, -1.9697265625, -1.87646484375, -1.783203125, -1.68994140625, -1.5966796875, -1.50341796875, -1.41015625, -1.31689453125, -1.2236328125, -1.13037109375, -1.037109375, -0.94384765625, -0.8505859375, -0.75732421875, -0.6640625, -0.57080078125, -0.4775390625, -0.38427734375, -0.291015625, -0.19775390625, -0.1044921875, -0.01123046875, 0.08203125, 0.17529296875, 0.2685546875, 0.36181640625, 0.455078125, 0.54833984375, 0.6416015625, 0.73486328125, 0.828125, 0.92138671875, 1.0146484375, 1.10791015625, 1.201171875, 1.29443359375, 1.3876953125, 1.48095703125, 1.57421875, 1.66748046875, 1.7607421875, 1.85400390625, 1.947265625, 2.04052734375, 2.1337890625, 2.22705078125, 2.3203125, 2.41357421875, 2.5068359375, 2.60009765625, 2.693359375, 2.78662109375, 2.8798828125, 2.97314453125, 3.06640625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 6.0, 5.0, 9.0, 7.0, 6.0, 6.0, 2.0, 12.0, 6.0, 14.0, 17.0, 23.0, 24.0, 31.0, 36.0, 50.0, 41.0, 41.0, 46.0, 60.0, 70.0, 53.0, 50.0, 50.0, 55.0, 38.0, 39.0, 39.0, 20.0, 28.0, 16.0, 22.0, 8.0, 19.0, 9.0, 13.0, 3.0, 6.0, 7.0, 4.0, 2.0, 5.0, 6.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-7.85355806350708, -7.615810871124268, -7.378064155578613, -7.140316963195801, -6.902569770812988, -6.664822578430176, -6.4270758628845215, -6.189328670501709, -5.9515814781188965, -5.713834285736084, -5.47608757019043, -5.238340377807617, -5.000593185424805, -4.762845993041992, -4.525099277496338, -4.287352085113525, -4.049605369567871, -3.8118584156036377, -3.574111223220825, -3.336364269256592, -3.0986170768737793, -2.860870122909546, -2.6231231689453125, -2.3853759765625, -2.1476287841796875, -1.9098817110061646, -1.6721346378326416, -1.4343876838684082, -1.1966404914855957, -0.9588935375213623, -0.7211464643478394, -0.4833993911743164, -0.2456521987915039, -0.007905140519142151, 0.2298419177532196, 0.46758896112442017, 0.7053360342979431, 0.9430830478668213, 1.1808301210403442, 1.4185771942138672, 1.6563242673873901, 1.894071340560913, 2.1318182945251465, 2.369565486907959, 2.6073124408721924, 2.845059394836426, 3.0828065872192383, 3.320553779602051, 3.558300733566284, 3.7960476875305176, 4.03379487991333, 4.271542072296143, 4.509288787841797, 4.747035980224609, 4.984783172607422, 5.222530364990234, 5.460277080535889, 5.698024272918701, 5.9357709884643555, 6.173518180847168, 6.4112653732299805, 6.649012565612793, 6.886759281158447, 7.12450647354126, 7.362253665924072]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 8.0, 6.0, 7.0, 13.0, 16.0, 17.0, 14.0, 19.0, 17.0, 12.0, 35.0, 38.0, 35.0, 32.0, 41.0, 40.0, 52.0, 43.0, 40.0, 46.0, 36.0, 33.0, 42.0, 35.0, 43.0, 30.0, 38.0, 31.0, 32.0, 26.0, 29.0, 18.0, 14.0, 13.0, 8.0, 7.0, 6.0, 15.0, 5.0, 5.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-10.265344619750977, -9.948668479919434, -9.63199234008789, -9.315315246582031, -8.998639106750488, -8.681962966918945, -8.365285873413086, -8.048609733581543, -7.73193359375, -7.415257453918457, -7.098580837249756, -6.781904220581055, -6.465228080749512, -6.148551940917969, -5.831875324249268, -5.515198707580566, -5.198522567749023, -4.8818464279174805, -4.565169811248779, -4.248493194580078, -3.931817054748535, -3.615140676498413, -3.298464298248291, -2.981787919998169, -2.665111541748047, -2.348435163497925, -2.0317587852478027, -1.7150824069976807, -1.3984060287475586, -1.0817296504974365, -0.7650532722473145, -0.4483768939971924, -0.13170146942138672, 0.18497490882873535, 0.5016512870788574, 0.8183276653289795, 1.1350040435791016, 1.4516804218292236, 1.7683568000793457, 2.0850331783294678, 2.40170955657959, 2.718385934829712, 3.035062313079834, 3.351738691329956, 3.668415069580078, 3.9850914478302, 4.301767826080322, 4.618444442749023, 4.935120582580566, 5.251796722412109, 5.5684733390808105, 5.885149955749512, 6.201826095581055, 6.518502235412598, 6.835178852081299, 7.15185546875, 7.468531608581543, 7.785207748413086, 8.101884841918945, 8.418560981750488, 8.735237121582031, 9.051913261413574, 9.368589401245117, 9.685266494750977, 10.00194263458252]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 0.0, 4.0, 4.0, 5.0, 15.0, 16.0, 18.0, 23.0, 34.0, 59.0, 82.0, 119.0, 170.0, 297.0, 401.0, 594.0, 999.0, 1445.0, 2358.0, 3560.0, 5741.0, 9152.0, 14301.0, 22710.0, 36078.0, 57601.0, 90945.0, 137770.0, 182262.0, 165792.0, 115078.0, 74117.0, 46740.0, 29428.0, 18422.0, 11659.0, 7391.0, 4653.0, 2978.0, 1875.0, 1222.0, 832.0, 525.0, 369.0, 231.0, 149.0, 116.0, 65.0, 43.0, 44.0, 23.0, 16.0, 8.0, 9.0, 7.0, 3.0, 6.0, 2.0, 0.0, 3.0, 1.0], "bins": [-1.46484375, -1.4187469482421875, -1.372650146484375, -1.3265533447265625, -1.28045654296875, -1.2343597412109375, -1.188262939453125, -1.1421661376953125, -1.0960693359375, -1.0499725341796875, -1.003875732421875, -0.9577789306640625, -0.91168212890625, -0.8655853271484375, -0.819488525390625, -0.7733917236328125, -0.727294921875, -0.6811981201171875, -0.635101318359375, -0.5890045166015625, -0.54290771484375, -0.4968109130859375, -0.450714111328125, -0.4046173095703125, -0.3585205078125, -0.3124237060546875, -0.266326904296875, -0.2202301025390625, -0.17413330078125, -0.1280364990234375, -0.081939697265625, -0.0358428955078125, 0.01025390625, 0.0563507080078125, 0.102447509765625, 0.1485443115234375, 0.19464111328125, 0.2407379150390625, 0.286834716796875, 0.3329315185546875, 0.3790283203125, 0.4251251220703125, 0.471221923828125, 0.5173187255859375, 0.56341552734375, 0.6095123291015625, 0.655609130859375, 0.7017059326171875, 0.747802734375, 0.7938995361328125, 0.839996337890625, 0.8860931396484375, 0.93218994140625, 0.9782867431640625, 1.024383544921875, 1.0704803466796875, 1.1165771484375, 1.1626739501953125, 1.208770751953125, 1.2548675537109375, 1.30096435546875, 1.3470611572265625, 1.393157958984375, 1.4392547607421875, 1.4853515625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 1.0, 5.0, 8.0, 4.0, 10.0, 10.0, 14.0, 10.0, 21.0, 17.0, 18.0, 13.0, 29.0, 25.0, 26.0, 43.0, 40.0, 31.0, 47.0, 48.0, 46.0, 41.0, 37.0, 32.0, 39.0, 41.0, 31.0, 32.0, 31.0, 36.0, 26.0, 27.0, 27.0, 30.0, 16.0, 23.0, 12.0, 11.0, 10.0, 7.0, 10.0, 7.0, 2.0, 2.0, 5.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.828125, -8.5274658203125, -8.226806640625, -7.9261474609375, -7.62548828125, -7.3248291015625, -7.024169921875, -6.7235107421875, -6.4228515625, -6.1221923828125, -5.821533203125, -5.5208740234375, -5.22021484375, -4.9195556640625, -4.618896484375, -4.3182373046875, -4.017578125, -3.7169189453125, -3.416259765625, -3.1156005859375, -2.81494140625, -2.5142822265625, -2.213623046875, -1.9129638671875, -1.6123046875, -1.3116455078125, -1.010986328125, -0.7103271484375, -0.40966796875, -0.1090087890625, 0.191650390625, 0.4923095703125, 0.79296875, 1.0936279296875, 1.394287109375, 1.6949462890625, 1.99560546875, 2.2962646484375, 2.596923828125, 2.8975830078125, 3.1982421875, 3.4989013671875, 3.799560546875, 4.1002197265625, 4.40087890625, 4.7015380859375, 5.002197265625, 5.3028564453125, 5.603515625, 5.9041748046875, 6.204833984375, 6.5054931640625, 6.80615234375, 7.1068115234375, 7.407470703125, 7.7081298828125, 8.0087890625, 8.3094482421875, 8.610107421875, 8.9107666015625, 9.21142578125, 9.5120849609375, 9.812744140625, 10.1134033203125, 10.4140625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 7.0, 8.0, 7.0, 16.0, 22.0, 42.0, 47.0, 67.0, 119.0, 177.0, 242.0, 367.0, 509.0, 709.0, 1183.0, 1685.0, 2540.0, 3747.0, 5656.0, 8642.0, 13063.0, 20199.0, 30587.0, 47040.0, 71080.0, 104798.0, 148674.0, 169565.0, 137214.0, 94689.0, 63877.0, 42038.0, 27558.0, 18112.0, 11571.0, 7522.0, 4922.0, 3272.0, 2231.0, 1558.0, 1061.0, 685.0, 489.0, 296.0, 208.0, 158.0, 95.0, 75.0, 38.0, 31.0, 34.0, 12.0, 13.0, 6.0, 1.0, 4.0], "bins": [-1.2998046875, -1.2630615234375, -1.226318359375, -1.1895751953125, -1.15283203125, -1.1160888671875, -1.079345703125, -1.0426025390625, -1.005859375, -0.9691162109375, -0.932373046875, -0.8956298828125, -0.85888671875, -0.8221435546875, -0.785400390625, -0.7486572265625, -0.7119140625, -0.6751708984375, -0.638427734375, -0.6016845703125, -0.56494140625, -0.5281982421875, -0.491455078125, -0.4547119140625, -0.41796875, -0.3812255859375, -0.344482421875, -0.3077392578125, -0.27099609375, -0.2342529296875, -0.197509765625, -0.1607666015625, -0.1240234375, -0.0872802734375, -0.050537109375, -0.0137939453125, 0.02294921875, 0.0596923828125, 0.096435546875, 0.1331787109375, 0.169921875, 0.2066650390625, 0.243408203125, 0.2801513671875, 0.31689453125, 0.3536376953125, 0.390380859375, 0.4271240234375, 0.4638671875, 0.5006103515625, 0.537353515625, 0.5740966796875, 0.61083984375, 0.6475830078125, 0.684326171875, 0.7210693359375, 0.7578125, 0.7945556640625, 0.831298828125, 0.8680419921875, 0.90478515625, 0.9415283203125, 0.978271484375, 1.0150146484375, 1.0517578125]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 2.0, 7.0, 6.0, 9.0, 7.0, 8.0, 10.0, 17.0, 15.0, 21.0, 19.0, 23.0, 42.0, 35.0, 33.0, 32.0, 35.0, 50.0, 46.0, 52.0, 42.0, 55.0, 41.0, 39.0, 35.0, 41.0, 38.0, 30.0, 39.0, 25.0, 21.0, 32.0, 20.0, 16.0, 6.0, 6.0, 4.0, 8.0, 6.0, 6.0, 6.0, 6.0, 7.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.53125, -6.3302001953125, -6.129150390625, -5.9281005859375, -5.72705078125, -5.5260009765625, -5.324951171875, -5.1239013671875, -4.9228515625, -4.7218017578125, -4.520751953125, -4.3197021484375, -4.11865234375, -3.9176025390625, -3.716552734375, -3.5155029296875, -3.314453125, -3.1134033203125, -2.912353515625, -2.7113037109375, -2.51025390625, -2.3092041015625, -2.108154296875, -1.9071044921875, -1.7060546875, -1.5050048828125, -1.303955078125, -1.1029052734375, -0.90185546875, -0.7008056640625, -0.499755859375, -0.2987060546875, -0.09765625, 0.1033935546875, 0.304443359375, 0.5054931640625, 0.70654296875, 0.9075927734375, 1.108642578125, 1.3096923828125, 1.5107421875, 1.7117919921875, 1.912841796875, 2.1138916015625, 2.31494140625, 2.5159912109375, 2.717041015625, 2.9180908203125, 3.119140625, 3.3201904296875, 3.521240234375, 3.7222900390625, 3.92333984375, 4.1243896484375, 4.325439453125, 4.5264892578125, 4.7275390625, 4.9285888671875, 5.129638671875, 5.3306884765625, 5.53173828125, 5.7327880859375, 5.933837890625, 6.1348876953125, 6.3359375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 6.0, 9.0, 12.0, 6.0, 20.0, 31.0, 35.0, 47.0, 72.0, 89.0, 141.0, 180.0, 300.0, 459.0, 723.0, 1156.0, 2096.0, 3721.0, 7240.0, 14996.0, 32835.0, 74326.0, 170079.0, 332033.0, 225301.0, 98958.0, 43428.0, 19590.0, 9297.0, 4778.0, 2698.0, 1474.0, 857.0, 492.0, 306.0, 236.0, 158.0, 113.0, 76.0, 58.0, 37.0, 27.0, 20.0, 10.0, 13.0, 6.0, 6.0, 4.0, 4.0, 3.0, 2.0, 0.0, 3.0], "bins": [-0.1851806640625, -0.179840087890625, -0.17449951171875, -0.169158935546875, -0.163818359375, -0.158477783203125, -0.15313720703125, -0.147796630859375, -0.1424560546875, -0.137115478515625, -0.13177490234375, -0.126434326171875, -0.12109375, -0.115753173828125, -0.11041259765625, -0.105072021484375, -0.0997314453125, -0.094390869140625, -0.08905029296875, -0.083709716796875, -0.078369140625, -0.073028564453125, -0.06768798828125, -0.062347412109375, -0.0570068359375, -0.051666259765625, -0.04632568359375, -0.040985107421875, -0.03564453125, -0.030303955078125, -0.02496337890625, -0.019622802734375, -0.0142822265625, -0.008941650390625, -0.00360107421875, 0.001739501953125, 0.007080078125, 0.012420654296875, 0.01776123046875, 0.023101806640625, 0.0284423828125, 0.033782958984375, 0.03912353515625, 0.044464111328125, 0.0498046875, 0.055145263671875, 0.06048583984375, 0.065826416015625, 0.0711669921875, 0.076507568359375, 0.08184814453125, 0.087188720703125, 0.092529296875, 0.097869873046875, 0.10321044921875, 0.108551025390625, 0.1138916015625, 0.119232177734375, 0.12457275390625, 0.129913330078125, 0.13525390625, 0.140594482421875, 0.14593505859375, 0.151275634765625, 0.1566162109375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 2.0, 4.0, 9.0, 10.0, 8.0, 16.0, 10.0, 19.0, 19.0, 9.0, 34.0, 24.0, 41.0, 36.0, 37.0, 39.0, 52.0, 58.0, 57.0, 60.0, 49.0, 59.0, 47.0, 47.0, 29.0, 34.0, 34.0, 20.0, 16.0, 21.0, 10.0, 19.0, 11.0, 12.0, 9.0, 7.0, 12.0, 9.0, 7.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.71661376953125e-05, -1.6658566892147064e-05, -1.615099608898163e-05, -1.5643425285816193e-05, -1.5135854482650757e-05, -1.4628283679485321e-05, -1.4120712876319885e-05, -1.361314207315445e-05, -1.3105571269989014e-05, -1.2598000466823578e-05, -1.2090429663658142e-05, -1.1582858860492706e-05, -1.107528805732727e-05, -1.0567717254161835e-05, -1.0060146450996399e-05, -9.552575647830963e-06, -9.045004844665527e-06, -8.537434041500092e-06, -8.029863238334656e-06, -7.52229243516922e-06, -7.014721632003784e-06, -6.507150828838348e-06, -5.999580025672913e-06, -5.492009222507477e-06, -4.984438419342041e-06, -4.476867616176605e-06, -3.9692968130111694e-06, -3.4617260098457336e-06, -2.954155206680298e-06, -2.446584403514862e-06, -1.9390136003494263e-06, -1.4314427971839905e-06, -9.238719940185547e-07, -4.163011908531189e-07, 9.12696123123169e-08, 5.988404154777527e-07, 1.1064112186431885e-06, 1.6139820218086243e-06, 2.12155282497406e-06, 2.629123628139496e-06, 3.1366944313049316e-06, 3.6442652344703674e-06, 4.151836037635803e-06, 4.659406840801239e-06, 5.166977643966675e-06, 5.674548447132111e-06, 6.182119250297546e-06, 6.689690053462982e-06, 7.197260856628418e-06, 7.704831659793854e-06, 8.21240246295929e-06, 8.719973266124725e-06, 9.227544069290161e-06, 9.735114872455597e-06, 1.0242685675621033e-05, 1.0750256478786469e-05, 1.1257827281951904e-05, 1.176539808511734e-05, 1.2272968888282776e-05, 1.2780539691448212e-05, 1.3288110494613647e-05, 1.3795681297779083e-05, 1.4303252100944519e-05, 1.4810822904109955e-05, 1.531839370727539e-05]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 5.0, 3.0, 8.0, 5.0, 9.0, 12.0, 12.0, 12.0, 21.0, 36.0, 46.0, 62.0, 110.0, 147.0, 209.0, 328.0, 497.0, 778.0, 1242.0, 2301.0, 3990.0, 7417.0, 13650.0, 26770.0, 53516.0, 110147.0, 229806.0, 291237.0, 154229.0, 74057.0, 36858.0, 18657.0, 9760.0, 5216.0, 2921.0, 1610.0, 1040.0, 623.0, 396.0, 244.0, 173.0, 125.0, 97.0, 44.0, 36.0, 33.0, 20.0, 11.0, 8.0, 11.0, 9.0, 6.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2073974609375, -0.20053672790527344, -0.19367599487304688, -0.1868152618408203, -0.17995452880859375, -0.1730937957763672, -0.16623306274414062, -0.15937232971191406, -0.1525115966796875, -0.14565086364746094, -0.13879013061523438, -0.1319293975830078, -0.12506866455078125, -0.11820793151855469, -0.11134719848632812, -0.10448646545410156, -0.097625732421875, -0.09076499938964844, -0.08390426635742188, -0.07704353332519531, -0.07018280029296875, -0.06332206726074219, -0.056461334228515625, -0.04960060119628906, -0.0427398681640625, -0.03587913513183594, -0.029018402099609375, -0.022157669067382812, -0.01529693603515625, -0.008436203002929688, -0.001575469970703125, 0.0052852630615234375, 0.01214599609375, 0.019006729125976562, 0.025867462158203125, 0.03272819519042969, 0.03958892822265625, 0.04644966125488281, 0.053310394287109375, 0.06017112731933594, 0.0670318603515625, 0.07389259338378906, 0.08075332641601562, 0.08761405944824219, 0.09447479248046875, 0.10133552551269531, 0.10819625854492188, 0.11505699157714844, 0.121917724609375, 0.12877845764160156, 0.13563919067382812, 0.1424999237060547, 0.14936065673828125, 0.1562213897705078, 0.16308212280273438, 0.16994285583496094, 0.1768035888671875, 0.18366432189941406, 0.19052505493164062, 0.1973857879638672, 0.20424652099609375, 0.2111072540283203, 0.21796798706054688, 0.22482872009277344, 0.231689453125]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 5.0, 4.0, 7.0, 5.0, 9.0, 12.0, 13.0, 23.0, 16.0, 19.0, 31.0, 33.0, 47.0, 55.0, 66.0, 73.0, 69.0, 91.0, 75.0, 55.0, 49.0, 40.0, 37.0, 35.0, 25.0, 19.0, 19.0, 11.0, 19.0, 8.0, 8.0, 5.0, 4.0, 2.0, 4.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.073974609375, -0.07149696350097656, -0.06901931762695312, -0.06654167175292969, -0.06406402587890625, -0.06158638000488281, -0.059108734130859375, -0.05663108825683594, -0.0541534423828125, -0.05167579650878906, -0.049198150634765625, -0.04672050476074219, -0.04424285888671875, -0.04176521301269531, -0.039287567138671875, -0.03680992126464844, -0.034332275390625, -0.03185462951660156, -0.029376983642578125, -0.026899337768554688, -0.02442169189453125, -0.021944046020507812, -0.019466400146484375, -0.016988754272460938, -0.0145111083984375, -0.012033462524414062, -0.009555816650390625, -0.0070781707763671875, -0.00460052490234375, -0.0021228790283203125, 0.000354766845703125, 0.0028324127197265625, 0.00531005859375, 0.0077877044677734375, 0.010265350341796875, 0.012742996215820312, 0.01522064208984375, 0.017698287963867188, 0.020175933837890625, 0.022653579711914062, 0.0251312255859375, 0.027608871459960938, 0.030086517333984375, 0.03256416320800781, 0.03504180908203125, 0.03751945495605469, 0.039997100830078125, 0.04247474670410156, 0.044952392578125, 0.04743003845214844, 0.049907684326171875, 0.05238533020019531, 0.05486297607421875, 0.05734062194824219, 0.059818267822265625, 0.06229591369628906, 0.0647735595703125, 0.06725120544433594, 0.06972885131835938, 0.07220649719238281, 0.07468414306640625, 0.07716178894042969, 0.07963943481445312, 0.08211708068847656, 0.0845947265625]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 3.0, 8.0, 10.0, 5.0, 5.0, 7.0, 8.0, 7.0, 12.0, 17.0, 26.0, 22.0, 21.0, 40.0, 48.0, 40.0, 47.0, 49.0, 52.0, 64.0, 64.0, 40.0, 58.0, 61.0, 32.0, 42.0, 35.0, 23.0, 22.0, 27.0, 20.0, 11.0, 16.0, 9.0, 9.0, 11.0, 5.0, 7.0, 3.0, 2.0, 6.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-7.868477821350098, -7.631544589996338, -7.394611358642578, -7.15767765045166, -6.9207444190979, -6.683811187744141, -6.446877956390381, -6.209944725036621, -5.973011493682861, -5.736078262329102, -5.499145030975342, -5.262211799621582, -5.025278091430664, -4.788344860076904, -4.5514116287231445, -4.314478397369385, -4.077545166015625, -3.8406119346618652, -3.6036784648895264, -3.3667452335357666, -3.129812002182007, -2.892878532409668, -2.655945301055908, -2.4190120697021484, -2.1820783615112305, -1.9451450109481812, -1.7082117795944214, -1.471278429031372, -1.2343451976776123, -0.997411847114563, -0.7604784965515137, -0.5235452651977539, -0.28661203384399414, -0.049678727984428406, 0.18725457787513733, 0.42418789863586426, 0.6611211895942688, 0.8980544805526733, 1.1349878311157227, 1.3719210624694824, 1.6088544130325317, 1.845787763595581, 2.082720994949341, 2.3196544647216797, 2.5565876960754395, 2.793520927429199, 3.030454158782959, 3.2673873901367188, 3.5043208599090576, 3.7412540912628174, 3.9781875610351562, 4.215120792388916, 4.452054023742676, 4.6889872550964355, 4.925920486450195, 5.162854194641113, 5.399787425994873, 5.636720657348633, 5.873653888702393, 6.110587120056152, 6.34752082824707, 6.58445405960083, 6.82138729095459, 7.05832052230835, 7.295253753662109]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 8.0, 4.0, 8.0, 13.0, 14.0, 18.0, 16.0, 18.0, 14.0, 15.0, 36.0, 36.0, 36.0, 32.0, 40.0, 40.0, 53.0, 42.0, 41.0, 46.0, 33.0, 36.0, 41.0, 36.0, 44.0, 29.0, 38.0, 30.0, 35.0, 25.0, 29.0, 17.0, 16.0, 12.0, 9.0, 7.0, 5.0, 15.0, 5.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-10.29301929473877, -9.97712516784668, -9.661231994628906, -9.345337867736816, -9.029444694519043, -8.713550567626953, -8.39765739440918, -8.08176326751709, -7.765870094299316, -7.449976444244385, -7.134082794189453, -6.8181891441345215, -6.50229549407959, -6.186401844024658, -5.870508193969727, -5.554614067077637, -5.238720417022705, -4.922826766967773, -4.606933116912842, -4.29103946685791, -3.9751458168029785, -3.659252166748047, -3.343358278274536, -3.0274646282196045, -2.711570978164673, -2.395677328109741, -2.0797836780548096, -1.7638899087905884, -1.4479962587356567, -1.132102608680725, -0.8162088394165039, -0.5003151893615723, -0.18442153930664062, 0.1314721405506134, 0.44736582040786743, 0.7632595300674438, 1.0791531801223755, 1.3950468301773071, 1.7109405994415283, 2.02683424949646, 2.3427278995513916, 2.6586215496063232, 2.974515199661255, 3.2904090881347656, 3.6063027381896973, 3.922196388244629, 4.2380900382995605, 4.553983688354492, 4.869877338409424, 5.1857709884643555, 5.501664638519287, 5.817558288574219, 6.13345193862915, 6.449345588684082, 6.765239715576172, 7.081132888793945, 7.397027015686035, 7.712920665740967, 8.028814315795898, 8.344708442687988, 8.660601615905762, 8.976495742797852, 9.292388916015625, 9.608283042907715, 9.924176216125488]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 8.0, 11.0, 12.0, 26.0, 42.0, 51.0, 105.0, 165.0, 254.0, 359.0, 617.0, 971.0, 1636.0, 2612.0, 4154.0, 6989.0, 11540.0, 19868.0, 32740.0, 53843.0, 84561.0, 122029.0, 153659.0, 160091.0, 134530.0, 97014.0, 62976.0, 38665.0, 23290.0, 14260.0, 8402.0, 5114.0, 2953.0, 1867.0, 1135.0, 750.0, 454.0, 287.0, 179.0, 142.0, 75.0, 40.0, 23.0, 24.0, 16.0, 9.0, 5.0, 7.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.7890625, -7.5391845703125, -7.289306640625, -7.0394287109375, -6.78955078125, -6.5396728515625, -6.289794921875, -6.0399169921875, -5.7900390625, -5.5401611328125, -5.290283203125, -5.0404052734375, -4.79052734375, -4.5406494140625, -4.290771484375, -4.0408935546875, -3.791015625, -3.5411376953125, -3.291259765625, -3.0413818359375, -2.79150390625, -2.5416259765625, -2.291748046875, -2.0418701171875, -1.7919921875, -1.5421142578125, -1.292236328125, -1.0423583984375, -0.79248046875, -0.5426025390625, -0.292724609375, -0.0428466796875, 0.20703125, 0.4569091796875, 0.706787109375, 0.9566650390625, 1.20654296875, 1.4564208984375, 1.706298828125, 1.9561767578125, 2.2060546875, 2.4559326171875, 2.705810546875, 2.9556884765625, 3.20556640625, 3.4554443359375, 3.705322265625, 3.9552001953125, 4.205078125, 4.4549560546875, 4.704833984375, 4.9547119140625, 5.20458984375, 5.4544677734375, 5.704345703125, 5.9542236328125, 6.2041015625, 6.4539794921875, 6.703857421875, 6.9537353515625, 7.20361328125, 7.4534912109375, 7.703369140625, 7.9532470703125, 8.203125]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 5.0, 4.0, 7.0, 8.0, 12.0, 12.0, 16.0, 15.0, 21.0, 10.0, 19.0, 36.0, 30.0, 20.0, 49.0, 31.0, 40.0, 35.0, 50.0, 34.0, 43.0, 42.0, 39.0, 34.0, 30.0, 47.0, 27.0, 35.0, 29.0, 35.0, 28.0, 29.0, 20.0, 21.0, 17.0, 11.0, 10.0, 7.0, 7.0, 12.0, 13.0, 4.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0], "bins": [-9.625, -9.334716796875, -9.04443359375, -8.754150390625, -8.4638671875, -8.173583984375, -7.88330078125, -7.593017578125, -7.302734375, -7.012451171875, -6.72216796875, -6.431884765625, -6.1416015625, -5.851318359375, -5.56103515625, -5.270751953125, -4.98046875, -4.690185546875, -4.39990234375, -4.109619140625, -3.8193359375, -3.529052734375, -3.23876953125, -2.948486328125, -2.658203125, -2.367919921875, -2.07763671875, -1.787353515625, -1.4970703125, -1.206787109375, -0.91650390625, -0.626220703125, -0.3359375, -0.045654296875, 0.24462890625, 0.534912109375, 0.8251953125, 1.115478515625, 1.40576171875, 1.696044921875, 1.986328125, 2.276611328125, 2.56689453125, 2.857177734375, 3.1474609375, 3.437744140625, 3.72802734375, 4.018310546875, 4.30859375, 4.598876953125, 4.88916015625, 5.179443359375, 5.4697265625, 5.760009765625, 6.05029296875, 6.340576171875, 6.630859375, 6.921142578125, 7.21142578125, 7.501708984375, 7.7919921875, 8.082275390625, 8.37255859375, 8.662841796875, 8.953125]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 15.0, 22.0, 23.0, 45.0, 43.0, 65.0, 111.0, 168.0, 254.0, 370.0, 525.0, 818.0, 1177.0, 1934.0, 2846.0, 4442.0, 6798.0, 10765.0, 16887.0, 26095.0, 40996.0, 61428.0, 89412.0, 121772.0, 143834.0, 142937.0, 118734.0, 86996.0, 59189.0, 38940.0, 25248.0, 16005.0, 10369.0, 6859.0, 4323.0, 2754.0, 1853.0, 1122.0, 817.0, 498.0, 338.0, 250.0, 146.0, 120.0, 69.0, 42.0, 37.0, 30.0, 8.0, 14.0, 5.0, 7.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-7.0859375, -6.86419677734375, -6.6424560546875, -6.42071533203125, -6.198974609375, -5.97723388671875, -5.7554931640625, -5.53375244140625, -5.31201171875, -5.09027099609375, -4.8685302734375, -4.64678955078125, -4.425048828125, -4.20330810546875, -3.9815673828125, -3.75982666015625, -3.5380859375, -3.31634521484375, -3.0946044921875, -2.87286376953125, -2.651123046875, -2.42938232421875, -2.2076416015625, -1.98590087890625, -1.76416015625, -1.54241943359375, -1.3206787109375, -1.09893798828125, -0.877197265625, -0.65545654296875, -0.4337158203125, -0.21197509765625, 0.009765625, 0.23150634765625, 0.4532470703125, 0.67498779296875, 0.896728515625, 1.11846923828125, 1.3402099609375, 1.56195068359375, 1.78369140625, 2.00543212890625, 2.2271728515625, 2.44891357421875, 2.670654296875, 2.89239501953125, 3.1141357421875, 3.33587646484375, 3.5576171875, 3.77935791015625, 4.0010986328125, 4.22283935546875, 4.444580078125, 4.66632080078125, 4.8880615234375, 5.10980224609375, 5.33154296875, 5.55328369140625, 5.7750244140625, 5.99676513671875, 6.218505859375, 6.44024658203125, 6.6619873046875, 6.88372802734375, 7.10546875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 2.0, 5.0, 10.0, 12.0, 9.0, 10.0, 12.0, 18.0, 13.0, 19.0, 21.0, 25.0, 31.0, 25.0, 37.0, 32.0, 42.0, 32.0, 38.0, 51.0, 32.0, 47.0, 44.0, 35.0, 39.0, 44.0, 34.0, 31.0, 30.0, 28.0, 26.0, 36.0, 21.0, 22.0, 19.0, 19.0, 12.0, 5.0, 11.0, 9.0, 7.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.30078125, -5.12152099609375, -4.9422607421875, -4.76300048828125, -4.583740234375, -4.40447998046875, -4.2252197265625, -4.04595947265625, -3.86669921875, -3.68743896484375, -3.5081787109375, -3.32891845703125, -3.149658203125, -2.97039794921875, -2.7911376953125, -2.61187744140625, -2.4326171875, -2.25335693359375, -2.0740966796875, -1.89483642578125, -1.715576171875, -1.53631591796875, -1.3570556640625, -1.17779541015625, -0.99853515625, -0.81927490234375, -0.6400146484375, -0.46075439453125, -0.281494140625, -0.10223388671875, 0.0770263671875, 0.25628662109375, 0.435546875, 0.61480712890625, 0.7940673828125, 0.97332763671875, 1.152587890625, 1.33184814453125, 1.5111083984375, 1.69036865234375, 1.86962890625, 2.04888916015625, 2.2281494140625, 2.40740966796875, 2.586669921875, 2.76593017578125, 2.9451904296875, 3.12445068359375, 3.3037109375, 3.48297119140625, 3.6622314453125, 3.84149169921875, 4.020751953125, 4.20001220703125, 4.3792724609375, 4.55853271484375, 4.73779296875, 4.91705322265625, 5.0963134765625, 5.27557373046875, 5.454833984375, 5.63409423828125, 5.8133544921875, 5.99261474609375, 6.171875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 7.0, 4.0, 7.0, 11.0, 16.0, 35.0, 36.0, 51.0, 99.0, 111.0, 167.0, 253.0, 378.0, 571.0, 899.0, 1389.0, 2273.0, 4181.0, 8142.0, 17489.0, 41145.0, 105664.0, 250939.0, 323653.0, 171402.0, 66672.0, 26920.0, 11990.0, 5895.0, 3123.0, 1756.0, 1125.0, 730.0, 478.0, 300.0, 190.0, 141.0, 101.0, 73.0, 43.0, 34.0, 32.0, 7.0, 7.0, 9.0, 6.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.56640625, -5.3990478515625, -5.231689453125, -5.0643310546875, -4.89697265625, -4.7296142578125, -4.562255859375, -4.3948974609375, -4.2275390625, -4.0601806640625, -3.892822265625, -3.7254638671875, -3.55810546875, -3.3907470703125, -3.223388671875, -3.0560302734375, -2.888671875, -2.7213134765625, -2.553955078125, -2.3865966796875, -2.21923828125, -2.0518798828125, -1.884521484375, -1.7171630859375, -1.5498046875, -1.3824462890625, -1.215087890625, -1.0477294921875, -0.88037109375, -0.7130126953125, -0.545654296875, -0.3782958984375, -0.2109375, -0.0435791015625, 0.123779296875, 0.2911376953125, 0.45849609375, 0.6258544921875, 0.793212890625, 0.9605712890625, 1.1279296875, 1.2952880859375, 1.462646484375, 1.6300048828125, 1.79736328125, 1.9647216796875, 2.132080078125, 2.2994384765625, 2.466796875, 2.6341552734375, 2.801513671875, 2.9688720703125, 3.13623046875, 3.3035888671875, 3.470947265625, 3.6383056640625, 3.8056640625, 3.9730224609375, 4.140380859375, 4.3077392578125, 4.47509765625, 4.6424560546875, 4.809814453125, 4.9771728515625, 5.14453125]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 0.0, 4.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 6.0, 6.0, 6.0, 10.0, 11.0, 21.0, 21.0, 27.0, 30.0, 41.0, 56.0, 61.0, 54.0, 66.0, 81.0, 73.0, 76.0, 75.0, 56.0, 46.0, 37.0, 31.0, 19.0, 19.0, 15.0, 5.0, 8.0, 4.0, 5.0, 4.0, 8.0, 1.0, 4.0, 0.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0003478527069091797, -0.0003383718430995941, -0.00032889097929000854, -0.000319410115480423, -0.0003099292516708374, -0.00030044838786125183, -0.00029096752405166626, -0.0002814866602420807, -0.0002720057964324951, -0.00026252493262290955, -0.000253044068813324, -0.0002435632050037384, -0.00023408234119415283, -0.00022460147738456726, -0.0002151206135749817, -0.00020563974976539612, -0.00019615888595581055, -0.00018667802214622498, -0.0001771971583366394, -0.00016771629452705383, -0.00015823543071746826, -0.0001487545669078827, -0.00013927370309829712, -0.00012979283928871155, -0.00012031197547912598, -0.0001108311116695404, -0.00010135024785995483, -9.186938405036926e-05, -8.238852024078369e-05, -7.290765643119812e-05, -6.342679262161255e-05, -5.394592881202698e-05, -4.4465065002441406e-05, -3.4984201192855835e-05, -2.5503337383270264e-05, -1.6022473573684692e-05, -6.541609764099121e-06, 2.93925404548645e-06, 1.2420117855072021e-05, 2.1900981664657593e-05, 3.1381845474243164e-05, 4.0862709283828735e-05, 5.034357309341431e-05, 5.982443690299988e-05, 6.930530071258545e-05, 7.878616452217102e-05, 8.826702833175659e-05, 9.774789214134216e-05, 0.00010722875595092773, 0.0001167096197605133, 0.00012619048357009888, 0.00013567134737968445, 0.00014515221118927002, 0.0001546330749988556, 0.00016411393880844116, 0.00017359480261802673, 0.0001830756664276123, 0.00019255653023719788, 0.00020203739404678345, 0.00021151825785636902, 0.0002209991216659546, 0.00023047998547554016, 0.00023996084928512573, 0.0002494417130947113, 0.0002589225769042969]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 3.0, 11.0, 14.0, 25.0, 43.0, 38.0, 60.0, 98.0, 121.0, 189.0, 256.0, 402.0, 627.0, 1004.0, 1518.0, 2332.0, 3860.0, 6441.0, 10913.0, 19241.0, 35319.0, 64753.0, 117038.0, 185943.0, 214173.0, 163992.0, 98072.0, 53538.0, 28728.0, 16085.0, 9142.0, 5488.0, 3222.0, 2103.0, 1342.0, 822.0, 506.0, 346.0, 251.0, 149.0, 125.0, 67.0, 46.0, 35.0, 28.0, 11.0, 21.0, 7.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 5.0], "bins": [-3.548828125, -3.4423828125, -3.3359375, -3.2294921875, -3.123046875, -3.0166015625, -2.91015625, -2.8037109375, -2.697265625, -2.5908203125, -2.484375, -2.3779296875, -2.271484375, -2.1650390625, -2.05859375, -1.9521484375, -1.845703125, -1.7392578125, -1.6328125, -1.5263671875, -1.419921875, -1.3134765625, -1.20703125, -1.1005859375, -0.994140625, -0.8876953125, -0.78125, -0.6748046875, -0.568359375, -0.4619140625, -0.35546875, -0.2490234375, -0.142578125, -0.0361328125, 0.0703125, 0.1767578125, 0.283203125, 0.3896484375, 0.49609375, 0.6025390625, 0.708984375, 0.8154296875, 0.921875, 1.0283203125, 1.134765625, 1.2412109375, 1.34765625, 1.4541015625, 1.560546875, 1.6669921875, 1.7734375, 1.8798828125, 1.986328125, 2.0927734375, 2.19921875, 2.3056640625, 2.412109375, 2.5185546875, 2.625, 2.7314453125, 2.837890625, 2.9443359375, 3.05078125, 3.1572265625, 3.263671875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 5.0, 7.0, 6.0, 6.0, 7.0, 8.0, 14.0, 22.0, 25.0, 20.0, 17.0, 36.0, 37.0, 36.0, 55.0, 56.0, 67.0, 61.0, 61.0, 80.0, 61.0, 42.0, 45.0, 38.0, 29.0, 41.0, 19.0, 18.0, 19.0, 14.0, 11.0, 10.0, 6.0, 2.0, 3.0, 4.0, 5.0, 2.0, 0.0, 3.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0], "bins": [-1.431640625, -1.390533447265625, -1.34942626953125, -1.308319091796875, -1.2672119140625, -1.226104736328125, -1.18499755859375, -1.143890380859375, -1.102783203125, -1.061676025390625, -1.02056884765625, -0.979461669921875, -0.9383544921875, -0.897247314453125, -0.85614013671875, -0.815032958984375, -0.77392578125, -0.732818603515625, -0.69171142578125, -0.650604248046875, -0.6094970703125, -0.568389892578125, -0.52728271484375, -0.486175537109375, -0.445068359375, -0.403961181640625, -0.36285400390625, -0.321746826171875, -0.2806396484375, -0.239532470703125, -0.19842529296875, -0.157318115234375, -0.1162109375, -0.075103759765625, -0.03399658203125, 0.007110595703125, 0.0482177734375, 0.089324951171875, 0.13043212890625, 0.171539306640625, 0.212646484375, 0.253753662109375, 0.29486083984375, 0.335968017578125, 0.3770751953125, 0.418182373046875, 0.45928955078125, 0.500396728515625, 0.54150390625, 0.582611083984375, 0.62371826171875, 0.664825439453125, 0.7059326171875, 0.747039794921875, 0.78814697265625, 0.829254150390625, 0.870361328125, 0.911468505859375, 0.95257568359375, 0.993682861328125, 1.0347900390625, 1.075897216796875, 1.11700439453125, 1.158111572265625, 1.19921875]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 1.0, 6.0, 9.0, 6.0, 8.0, 2.0, 5.0, 8.0, 6.0, 12.0, 15.0, 14.0, 18.0, 23.0, 21.0, 20.0, 33.0, 43.0, 51.0, 41.0, 52.0, 60.0, 44.0, 46.0, 53.0, 51.0, 40.0, 35.0, 41.0, 34.0, 47.0, 17.0, 27.0, 21.0, 16.0, 10.0, 9.0, 9.0, 7.0, 7.0, 9.0, 5.0, 8.0, 2.0, 8.0, 0.0, 6.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.44700813293457, -6.234295845031738, -6.021583080291748, -5.808870792388916, -5.596158027648926, -5.383445739746094, -5.170733451843262, -4.95802116394043, -4.7453083992004395, -4.532596111297607, -4.319883346557617, -4.107171058654785, -3.894458532333374, -3.681746006011963, -3.469033718109131, -3.2563211917877197, -3.0436086654663086, -2.8308961391448975, -2.6181836128234863, -2.4054713249206543, -2.192758798599243, -1.980046272277832, -1.7673338651657104, -1.5546214580535889, -1.3419089317321777, -1.1291964054107666, -0.916483998298645, -0.7037715315818787, -0.4910590648651123, -0.27834653854370117, -0.06563413143157959, 0.147078275680542, 0.35979127883911133, 0.5725037455558777, 0.785216212272644, 0.9979286789894104, 1.2106411457061768, 1.423353672027588, 1.6360660791397095, 1.848778486251831, 2.061491012573242, 2.2742035388946533, 2.4869160652160645, 2.6996283531188965, 2.9123408794403076, 3.1250534057617188, 3.337765693664551, 3.550478219985962, 3.763190746307373, 3.975903272628784, 4.188615798950195, 4.401328086853027, 4.614040374755859, 4.82675313949585, 5.039465427398682, 5.252178192138672, 5.464890480041504, 5.677602767944336, 5.890315532684326, 6.103027820587158, 6.315740585327148, 6.5284528732299805, 6.7411651611328125, 6.9538774490356445, 7.166590213775635]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 5.0, 3.0, 8.0, 7.0, 4.0, 10.0, 15.0, 13.0, 18.0, 9.0, 13.0, 21.0, 32.0, 31.0, 29.0, 22.0, 44.0, 25.0, 33.0, 39.0, 30.0, 42.0, 31.0, 37.0, 47.0, 37.0, 27.0, 36.0, 31.0, 34.0, 27.0, 29.0, 25.0, 30.0, 20.0, 18.0, 23.0, 15.0, 14.0, 10.0, 16.0, 11.0, 5.0, 7.0, 4.0, 3.0, 2.0, 6.0, 1.0, 3.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-8.585413932800293, -8.30331039428711, -8.02120590209961, -7.739102363586426, -7.456998825073242, -7.1748948097229, -6.892790794372559, -6.610687255859375, -6.328583240509033, -6.046479225158691, -5.764375686645508, -5.482271671295166, -5.200167655944824, -4.918064117431641, -4.635960102081299, -4.353856086730957, -4.071752548217773, -3.7896487712860107, -3.507544994354248, -3.2254409790039062, -2.9433372020721436, -2.661233425140381, -2.379129409790039, -2.0970256328582764, -1.8149218559265137, -1.532818078994751, -1.2507141828536987, -0.9686103463172913, -0.6865065097808838, -0.4044027328491211, -0.12229883670806885, 0.1598050594329834, 0.4419088363647461, 0.7240126729011536, 1.006116509437561, 1.2882204055786133, 1.570324182510376, 1.8524279594421387, 2.1345319747924805, 2.416635751724243, 2.698739528656006, 2.9808433055877686, 3.2629470825195312, 3.545051097869873, 3.8271548748016357, 4.109258651733398, 4.39136266708374, 4.673466682434082, 4.955570220947266, 5.237674236297607, 5.519777774810791, 5.801881790161133, 6.083985328674316, 6.366089344024658, 6.648193359375, 6.930296897888184, 7.212400913238525, 7.494504928588867, 7.776608467102051, 8.058712005615234, 8.340816497802734, 8.622920036315918, 8.905023574829102, 9.187128067016602, 9.469231605529785]}, "gradients/decoder.bert.encoder.layer.16.output.dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 5.0, 6.0, 11.0, 13.0, 11.0, 33.0, 35.0, 49.0, 70.0, 113.0, 175.0, 241.0, 424.0, 607.0, 898.0, 1421.0, 2268.0, 3370.0, 5679.0, 9105.0, 14963.0, 24988.0, 42294.0, 72689.0, 127780.0, 225626.0, 394327.0, 634970.0, 808917.0, 710793.0, 468100.0, 272971.0, 154201.0, 88550.0, 51053.0, 30015.0, 17730.0, 10971.0, 6733.0, 4316.0, 2748.0, 1713.0, 1133.0, 693.0, 499.0, 340.0, 241.0, 150.0, 92.0, 55.0, 40.0, 29.0, 14.0, 12.0, 4.0, 3.0, 3.0, 5.0, 1.0, 1.0, 1.0], "bins": [-7.1953125, -6.968017578125, -6.74072265625, -6.513427734375, -6.2861328125, -6.058837890625, -5.83154296875, -5.604248046875, -5.376953125, -5.149658203125, -4.92236328125, -4.695068359375, -4.4677734375, -4.240478515625, -4.01318359375, -3.785888671875, -3.55859375, -3.331298828125, -3.10400390625, -2.876708984375, -2.6494140625, -2.422119140625, -2.19482421875, -1.967529296875, -1.740234375, -1.512939453125, -1.28564453125, -1.058349609375, -0.8310546875, -0.603759765625, -0.37646484375, -0.149169921875, 0.078125, 0.305419921875, 0.53271484375, 0.760009765625, 0.9873046875, 1.214599609375, 1.44189453125, 1.669189453125, 1.896484375, 2.123779296875, 2.35107421875, 2.578369140625, 2.8056640625, 3.032958984375, 3.26025390625, 3.487548828125, 3.71484375, 3.942138671875, 4.16943359375, 4.396728515625, 4.6240234375, 4.851318359375, 5.07861328125, 5.305908203125, 5.533203125, 5.760498046875, 5.98779296875, 6.215087890625, 6.4423828125, 6.669677734375, 6.89697265625, 7.124267578125, 7.3515625]}, "gradients/decoder.bert.encoder.layer.16.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 6.0, 4.0, 4.0, 11.0, 15.0, 9.0, 17.0, 16.0, 5.0, 15.0, 16.0, 22.0, 25.0, 26.0, 34.0, 39.0, 27.0, 26.0, 33.0, 37.0, 38.0, 43.0, 37.0, 41.0, 32.0, 32.0, 32.0, 38.0, 32.0, 26.0, 31.0, 31.0, 29.0, 16.0, 22.0, 20.0, 21.0, 19.0, 11.0, 12.0, 10.0, 12.0, 10.0, 3.0, 5.0, 5.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.59765625, -5.41033935546875, -5.2230224609375, -5.03570556640625, -4.848388671875, -4.66107177734375, -4.4737548828125, -4.28643798828125, -4.09912109375, -3.91180419921875, -3.7244873046875, -3.53717041015625, -3.349853515625, -3.16253662109375, -2.9752197265625, -2.78790283203125, -2.6005859375, -2.41326904296875, -2.2259521484375, -2.03863525390625, -1.851318359375, -1.66400146484375, -1.4766845703125, -1.28936767578125, -1.10205078125, -0.91473388671875, -0.7274169921875, -0.54010009765625, -0.352783203125, -0.16546630859375, 0.0218505859375, 0.20916748046875, 0.396484375, 0.58380126953125, 0.7711181640625, 0.95843505859375, 1.145751953125, 1.33306884765625, 1.5203857421875, 1.70770263671875, 1.89501953125, 2.08233642578125, 2.2696533203125, 2.45697021484375, 2.644287109375, 2.83160400390625, 3.0189208984375, 3.20623779296875, 3.3935546875, 3.58087158203125, 3.7681884765625, 3.95550537109375, 4.142822265625, 4.33013916015625, 4.5174560546875, 4.70477294921875, 4.89208984375, 5.07940673828125, 5.2667236328125, 5.45404052734375, 5.641357421875, 5.82867431640625, 6.0159912109375, 6.20330810546875, 6.390625]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 5.0, 9.0, 11.0, 22.0, 26.0, 48.0, 93.0, 136.0, 149.0, 297.0, 520.0, 808.0, 1417.0, 2519.0, 4263.0, 7452.0, 13732.0, 25737.0, 48079.0, 91635.0, 173263.0, 321996.0, 551148.0, 785446.0, 807327.0, 593267.0, 353708.0, 192535.0, 101574.0, 53511.0, 28420.0, 15458.0, 8458.0, 4722.0, 2657.0, 1531.0, 910.0, 524.0, 315.0, 209.0, 117.0, 87.0, 61.0, 38.0, 17.0, 11.0, 12.0, 5.0, 2.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.19921875, -6.95989990234375, -6.7205810546875, -6.48126220703125, -6.241943359375, -6.00262451171875, -5.7633056640625, -5.52398681640625, -5.28466796875, -5.04534912109375, -4.8060302734375, -4.56671142578125, -4.327392578125, -4.08807373046875, -3.8487548828125, -3.60943603515625, -3.3701171875, -3.13079833984375, -2.8914794921875, -2.65216064453125, -2.412841796875, -2.17352294921875, -1.9342041015625, -1.69488525390625, -1.45556640625, -1.21624755859375, -0.9769287109375, -0.73760986328125, -0.498291015625, -0.25897216796875, -0.0196533203125, 0.21966552734375, 0.458984375, 0.69830322265625, 0.9376220703125, 1.17694091796875, 1.416259765625, 1.65557861328125, 1.8948974609375, 2.13421630859375, 2.37353515625, 2.61285400390625, 2.8521728515625, 3.09149169921875, 3.330810546875, 3.57012939453125, 3.8094482421875, 4.04876708984375, 4.2880859375, 4.52740478515625, 4.7667236328125, 5.00604248046875, 5.245361328125, 5.48468017578125, 5.7239990234375, 5.96331787109375, 6.20263671875, 6.44195556640625, 6.6812744140625, 6.92059326171875, 7.159912109375, 7.39923095703125, 7.6385498046875, 7.87786865234375, 8.1171875]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 5.0, 4.0, 8.0, 7.0, 10.0, 17.0, 19.0, 25.0, 32.0, 34.0, 51.0, 60.0, 83.0, 85.0, 94.0, 106.0, 124.0, 142.0, 148.0, 181.0, 183.0, 187.0, 196.0, 177.0, 233.0, 200.0, 196.0, 197.0, 167.0, 175.0, 138.0, 119.0, 111.0, 90.0, 81.0, 62.0, 76.0, 55.0, 30.0, 36.0, 27.0, 22.0, 14.0, 17.0, 14.0, 5.0, 7.0, 8.0, 3.0, 7.0, 1.0, 3.0, 1.0, 1.0, 5.0, 3.0], "bins": [-2.94140625, -2.850921630859375, -2.76043701171875, -2.669952392578125, -2.5794677734375, -2.488983154296875, -2.39849853515625, -2.308013916015625, -2.217529296875, -2.127044677734375, -2.03656005859375, -1.946075439453125, -1.8555908203125, -1.765106201171875, -1.67462158203125, -1.584136962890625, -1.49365234375, -1.403167724609375, -1.31268310546875, -1.222198486328125, -1.1317138671875, -1.041229248046875, -0.95074462890625, -0.860260009765625, -0.769775390625, -0.679290771484375, -0.58880615234375, -0.498321533203125, -0.4078369140625, -0.317352294921875, -0.22686767578125, -0.136383056640625, -0.0458984375, 0.044586181640625, 0.13507080078125, 0.225555419921875, 0.3160400390625, 0.406524658203125, 0.49700927734375, 0.587493896484375, 0.677978515625, 0.768463134765625, 0.85894775390625, 0.949432373046875, 1.0399169921875, 1.130401611328125, 1.22088623046875, 1.311370849609375, 1.40185546875, 1.492340087890625, 1.58282470703125, 1.673309326171875, 1.7637939453125, 1.854278564453125, 1.94476318359375, 2.035247802734375, 2.125732421875, 2.216217041015625, 2.30670166015625, 2.397186279296875, 2.4876708984375, 2.578155517578125, 2.66864013671875, 2.759124755859375, 2.849609375]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 4.0, 2.0, 3.0, 3.0, 6.0, 5.0, 7.0, 10.0, 17.0, 19.0, 16.0, 23.0, 17.0, 32.0, 31.0, 45.0, 48.0, 60.0, 59.0, 55.0, 58.0, 64.0, 57.0, 61.0, 47.0, 44.0, 40.0, 28.0, 23.0, 28.0, 18.0, 17.0, 15.0, 4.0, 7.0, 10.0, 3.0, 4.0, 6.0, 4.0, 1.0, 4.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.232551097869873, -6.989795207977295, -6.747038841247559, -6.5042829513549805, -6.261527061462402, -6.018771171569824, -5.776014804840088, -5.53325891494751, -5.290502548217773, -5.047746658325195, -4.804990291595459, -4.562234401702881, -4.319478511810303, -4.076722145080566, -3.8339662551879883, -3.59121036529541, -3.348454475402832, -3.105698347091675, -2.8629424571990967, -2.6201863288879395, -2.3774304389953613, -2.134674310684204, -1.8919181823730469, -1.6491621732711792, -1.4064061641693115, -1.1636501550674438, -0.9208940863609314, -0.678138017654419, -0.43538200855255127, -0.1926259994506836, 0.05013012886047363, 0.2928861379623413, 0.5356426239013672, 0.7783986330032349, 1.0211546421051025, 1.2639107704162598, 1.5066667795181274, 1.7494227886199951, 1.9921789169311523, 2.2349348068237305, 2.4776909351348877, 2.720447063446045, 2.963202953338623, 3.2059590816497803, 3.4487152099609375, 3.6914710998535156, 3.934227228164673, 4.17698335647583, 4.419739246368408, 4.662495136260986, 4.905251502990723, 5.148007392883301, 5.390763282775879, 5.633519172668457, 5.876275539398193, 6.1190314292907715, 6.361787796020508, 6.604543685913086, 6.847300052642822, 7.0900559425354, 7.3328118324279785, 7.575568199157715, 7.818324089050293, 8.061079978942871, 8.30383586883545]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 8.0, 6.0, 7.0, 6.0, 10.0, 18.0, 10.0, 12.0, 15.0, 23.0, 22.0, 25.0, 31.0, 23.0, 35.0, 41.0, 34.0, 41.0, 37.0, 32.0, 34.0, 44.0, 38.0, 38.0, 50.0, 43.0, 20.0, 42.0, 30.0, 28.0, 34.0, 21.0, 21.0, 19.0, 15.0, 12.0, 14.0, 12.0, 9.0, 9.0, 11.0, 8.0, 6.0, 3.0, 2.0, 3.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0], "bins": [-9.19920539855957, -8.926764488220215, -8.654324531555176, -8.38188362121582, -8.109442710876465, -7.837002277374268, -7.56456184387207, -7.292120933532715, -7.019680500030518, -6.74724006652832, -6.474799156188965, -6.202358722686768, -5.92991828918457, -5.657477378845215, -5.385036945343018, -5.11259651184082, -4.840155601501465, -4.567715167999268, -4.295274257659912, -4.022833824157715, -3.7503931522369385, -3.477952480316162, -3.205512046813965, -2.9330713748931885, -2.660630702972412, -2.3881900310516357, -2.1157493591308594, -1.843308925628662, -1.5708682537078857, -1.2984275817871094, -1.0259870290756226, -0.7535464763641357, -0.48110485076904297, -0.20866423845291138, 0.06377637386322021, 0.3362169861793518, 0.6086575984954834, 0.8810982704162598, 1.1535388231277466, 1.4259793758392334, 1.6984200477600098, 1.9708607196807861, 2.2433013916015625, 2.5157418251037598, 2.788182497024536, 3.0606231689453125, 3.3330636024475098, 3.605504274368286, 3.8779449462890625, 4.15038537979126, 4.422826290130615, 4.6952667236328125, 4.967707633972168, 5.240148067474365, 5.5125885009765625, 5.785029411315918, 6.057469844818115, 6.3299102783203125, 6.602351188659668, 6.874791622161865, 7.1472320556640625, 7.419672966003418, 7.692113399505615, 7.9645538330078125, 8.236994743347168]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 7.0, 10.0, 20.0, 20.0, 34.0, 57.0, 99.0, 133.0, 207.0, 326.0, 507.0, 828.0, 1216.0, 1965.0, 3035.0, 4713.0, 7560.0, 11689.0, 18494.0, 28989.0, 45255.0, 69988.0, 107377.0, 154441.0, 178217.0, 141886.0, 96589.0, 62620.0, 40528.0, 25856.0, 16818.0, 10506.0, 6881.0, 4221.0, 2709.0, 1771.0, 1045.0, 671.0, 470.0, 300.0, 172.0, 122.0, 79.0, 41.0, 33.0, 24.0, 16.0, 8.0, 5.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-1.3056640625, -1.2653350830078125, -1.225006103515625, -1.1846771240234375, -1.14434814453125, -1.1040191650390625, -1.063690185546875, -1.0233612060546875, -0.9830322265625, -0.9427032470703125, -0.902374267578125, -0.8620452880859375, -0.82171630859375, -0.7813873291015625, -0.741058349609375, -0.7007293701171875, -0.660400390625, -0.6200714111328125, -0.579742431640625, -0.5394134521484375, -0.49908447265625, -0.4587554931640625, -0.418426513671875, -0.3780975341796875, -0.3377685546875, -0.2974395751953125, -0.257110595703125, -0.2167816162109375, -0.17645263671875, -0.1361236572265625, -0.095794677734375, -0.0554656982421875, -0.01513671875, 0.0251922607421875, 0.065521240234375, 0.1058502197265625, 0.14617919921875, 0.1865081787109375, 0.226837158203125, 0.2671661376953125, 0.3074951171875, 0.3478240966796875, 0.388153076171875, 0.4284820556640625, 0.46881103515625, 0.5091400146484375, 0.549468994140625, 0.5897979736328125, 0.630126953125, 0.6704559326171875, 0.710784912109375, 0.7511138916015625, 0.79144287109375, 0.8317718505859375, 0.872100830078125, 0.9124298095703125, 0.9527587890625, 0.9930877685546875, 1.033416748046875, 1.0737457275390625, 1.11407470703125, 1.1544036865234375, 1.194732666015625, 1.2350616455078125, 1.275390625]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 2.0, 7.0, 6.0, 9.0, 10.0, 13.0, 14.0, 18.0, 15.0, 16.0, 21.0, 32.0, 35.0, 34.0, 34.0, 32.0, 42.0, 41.0, 43.0, 35.0, 50.0, 36.0, 50.0, 35.0, 36.0, 46.0, 37.0, 28.0, 26.0, 33.0, 25.0, 20.0, 22.0, 17.0, 17.0, 10.0, 14.0, 11.0, 4.0, 6.0, 10.0, 5.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.3046875, -9.0135498046875, -8.722412109375, -8.4312744140625, -8.14013671875, -7.8489990234375, -7.557861328125, -7.2667236328125, -6.9755859375, -6.6844482421875, -6.393310546875, -6.1021728515625, -5.81103515625, -5.5198974609375, -5.228759765625, -4.9376220703125, -4.646484375, -4.3553466796875, -4.064208984375, -3.7730712890625, -3.48193359375, -3.1907958984375, -2.899658203125, -2.6085205078125, -2.3173828125, -2.0262451171875, -1.735107421875, -1.4439697265625, -1.15283203125, -0.8616943359375, -0.570556640625, -0.2794189453125, 0.01171875, 0.3028564453125, 0.593994140625, 0.8851318359375, 1.17626953125, 1.4674072265625, 1.758544921875, 2.0496826171875, 2.3408203125, 2.6319580078125, 2.923095703125, 3.2142333984375, 3.50537109375, 3.7965087890625, 4.087646484375, 4.3787841796875, 4.669921875, 4.9610595703125, 5.252197265625, 5.5433349609375, 5.83447265625, 6.1256103515625, 6.416748046875, 6.7078857421875, 6.9990234375, 7.2901611328125, 7.581298828125, 7.8724365234375, 8.16357421875, 8.4547119140625, 8.745849609375, 9.0369873046875, 9.328125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 6.0, 6.0, 12.0, 15.0, 29.0, 40.0, 48.0, 87.0, 112.0, 162.0, 237.0, 336.0, 497.0, 783.0, 1028.0, 1653.0, 2446.0, 3646.0, 5443.0, 8333.0, 12670.0, 19686.0, 29970.0, 45407.0, 67407.0, 98868.0, 137883.0, 165264.0, 140445.0, 101045.0, 69526.0, 46034.0, 30742.0, 20298.0, 13037.0, 8664.0, 5439.0, 3792.0, 2415.0, 1590.0, 1141.0, 706.0, 505.0, 352.0, 219.0, 179.0, 118.0, 86.0, 47.0, 45.0, 29.0, 15.0, 8.0, 9.0, 4.0, 3.0, 2.0, 1.0, 1.0], "bins": [-1.0751953125, -1.042144775390625, -1.00909423828125, -0.976043701171875, -0.9429931640625, -0.909942626953125, -0.87689208984375, -0.843841552734375, -0.810791015625, -0.777740478515625, -0.74468994140625, -0.711639404296875, -0.6785888671875, -0.645538330078125, -0.61248779296875, -0.579437255859375, -0.54638671875, -0.513336181640625, -0.48028564453125, -0.447235107421875, -0.4141845703125, -0.381134033203125, -0.34808349609375, -0.315032958984375, -0.281982421875, -0.248931884765625, -0.21588134765625, -0.182830810546875, -0.1497802734375, -0.116729736328125, -0.08367919921875, -0.050628662109375, -0.017578125, 0.015472412109375, 0.04852294921875, 0.081573486328125, 0.1146240234375, 0.147674560546875, 0.18072509765625, 0.213775634765625, 0.246826171875, 0.279876708984375, 0.31292724609375, 0.345977783203125, 0.3790283203125, 0.412078857421875, 0.44512939453125, 0.478179931640625, 0.51123046875, 0.544281005859375, 0.57733154296875, 0.610382080078125, 0.6434326171875, 0.676483154296875, 0.70953369140625, 0.742584228515625, 0.775634765625, 0.808685302734375, 0.84173583984375, 0.874786376953125, 0.9078369140625, 0.940887451171875, 0.97393798828125, 1.006988525390625, 1.0400390625]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 2.0, 3.0, 4.0, 7.0, 8.0, 5.0, 11.0, 17.0, 14.0, 17.0, 15.0, 19.0, 22.0, 22.0, 23.0, 33.0, 28.0, 30.0, 32.0, 34.0, 31.0, 59.0, 31.0, 36.0, 38.0, 42.0, 46.0, 25.0, 35.0, 41.0, 36.0, 35.0, 19.0, 32.0, 31.0, 23.0, 15.0, 19.0, 11.0, 7.0, 11.0, 6.0, 5.0, 11.0, 1.0, 4.0, 4.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.109375, -4.94671630859375, -4.7840576171875, -4.62139892578125, -4.458740234375, -4.29608154296875, -4.1334228515625, -3.97076416015625, -3.80810546875, -3.64544677734375, -3.4827880859375, -3.32012939453125, -3.157470703125, -2.99481201171875, -2.8321533203125, -2.66949462890625, -2.5068359375, -2.34417724609375, -2.1815185546875, -2.01885986328125, -1.856201171875, -1.69354248046875, -1.5308837890625, -1.36822509765625, -1.20556640625, -1.04290771484375, -0.8802490234375, -0.71759033203125, -0.554931640625, -0.39227294921875, -0.2296142578125, -0.06695556640625, 0.095703125, 0.25836181640625, 0.4210205078125, 0.58367919921875, 0.746337890625, 0.90899658203125, 1.0716552734375, 1.23431396484375, 1.39697265625, 1.55963134765625, 1.7222900390625, 1.88494873046875, 2.047607421875, 2.21026611328125, 2.3729248046875, 2.53558349609375, 2.6982421875, 2.86090087890625, 3.0235595703125, 3.18621826171875, 3.348876953125, 3.51153564453125, 3.6741943359375, 3.83685302734375, 3.99951171875, 4.16217041015625, 4.3248291015625, 4.48748779296875, 4.650146484375, 4.81280517578125, 4.9754638671875, 5.13812255859375, 5.30078125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 6.0, 11.0, 13.0, 11.0, 23.0, 32.0, 41.0, 86.0, 99.0, 138.0, 208.0, 307.0, 489.0, 713.0, 1206.0, 1886.0, 3055.0, 5266.0, 9291.0, 16330.0, 30001.0, 58448.0, 114029.0, 225931.0, 274457.0, 146417.0, 74036.0, 38188.0, 20337.0, 11200.0, 6330.0, 3770.0, 2276.0, 1409.0, 877.0, 503.0, 379.0, 229.0, 178.0, 111.0, 92.0, 48.0, 41.0, 17.0, 19.0, 10.0, 2.0, 1.0, 2.0, 2.0, 7.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.1087646484375, -0.10538482666015625, -0.1020050048828125, -0.09862518310546875, -0.095245361328125, -0.09186553955078125, -0.0884857177734375, -0.08510589599609375, -0.08172607421875, -0.07834625244140625, -0.0749664306640625, -0.07158660888671875, -0.068206787109375, -0.06482696533203125, -0.0614471435546875, -0.05806732177734375, -0.0546875, -0.05130767822265625, -0.0479278564453125, -0.04454803466796875, -0.041168212890625, -0.03778839111328125, -0.0344085693359375, -0.03102874755859375, -0.02764892578125, -0.02426910400390625, -0.0208892822265625, -0.01750946044921875, -0.014129638671875, -0.01074981689453125, -0.0073699951171875, -0.00399017333984375, -0.0006103515625, 0.00276947021484375, 0.0061492919921875, 0.00952911376953125, 0.012908935546875, 0.01628875732421875, 0.0196685791015625, 0.02304840087890625, 0.02642822265625, 0.02980804443359375, 0.0331878662109375, 0.03656768798828125, 0.039947509765625, 0.04332733154296875, 0.0467071533203125, 0.05008697509765625, 0.053466796875, 0.05684661865234375, 0.0602264404296875, 0.06360626220703125, 0.066986083984375, 0.07036590576171875, 0.0737457275390625, 0.07712554931640625, 0.08050537109375, 0.08388519287109375, 0.0872650146484375, 0.09064483642578125, 0.094024658203125, 0.09740447998046875, 0.1007843017578125, 0.10416412353515625, 0.1075439453125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 2.0, 9.0, 5.0, 7.0, 7.0, 10.0, 19.0, 15.0, 16.0, 25.0, 19.0, 30.0, 46.0, 37.0, 34.0, 36.0, 50.0, 54.0, 45.0, 48.0, 61.0, 46.0, 45.0, 37.0, 40.0, 55.0, 23.0, 33.0, 31.0, 11.0, 21.0, 15.0, 8.0, 16.0, 13.0, 8.0, 10.0, 6.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-1.6033649444580078e-05, -1.5579164028167725e-05, -1.5124678611755371e-05, -1.4670193195343018e-05, -1.4215707778930664e-05, -1.376122236251831e-05, -1.3306736946105957e-05, -1.2852251529693604e-05, -1.239776611328125e-05, -1.1943280696868896e-05, -1.1488795280456543e-05, -1.103430986404419e-05, -1.0579824447631836e-05, -1.0125339031219482e-05, -9.670853614807129e-06, -9.216368198394775e-06, -8.761882781982422e-06, -8.307397365570068e-06, -7.852911949157715e-06, -7.398426532745361e-06, -6.943941116333008e-06, -6.489455699920654e-06, -6.034970283508301e-06, -5.580484867095947e-06, -5.125999450683594e-06, -4.67151403427124e-06, -4.217028617858887e-06, -3.762543201446533e-06, -3.3080577850341797e-06, -2.853572368621826e-06, -2.3990869522094727e-06, -1.944601535797119e-06, -1.4901161193847656e-06, -1.0356307029724121e-06, -5.811452865600586e-07, -1.2665987014770508e-07, 3.2782554626464844e-07, 7.82310962677002e-07, 1.2367963790893555e-06, 1.691281795501709e-06, 2.1457672119140625e-06, 2.600252628326416e-06, 3.0547380447387695e-06, 3.509223461151123e-06, 3.9637088775634766e-06, 4.41819429397583e-06, 4.872679710388184e-06, 5.327165126800537e-06, 5.781650543212891e-06, 6.236135959625244e-06, 6.690621376037598e-06, 7.145106792449951e-06, 7.599592208862305e-06, 8.054077625274658e-06, 8.508563041687012e-06, 8.963048458099365e-06, 9.417533874511719e-06, 9.872019290924072e-06, 1.0326504707336426e-05, 1.078099012374878e-05, 1.1235475540161133e-05, 1.1689960956573486e-05, 1.214444637298584e-05, 1.2598931789398193e-05, 1.3053417205810547e-05]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 4.0, 8.0, 8.0, 13.0, 20.0, 28.0, 37.0, 49.0, 75.0, 106.0, 168.0, 292.0, 448.0, 739.0, 1380.0, 2272.0, 4353.0, 8321.0, 16776.0, 36028.0, 84235.0, 224687.0, 386960.0, 161885.0, 63269.0, 28010.0, 13247.0, 6748.0, 3642.0, 1933.0, 1073.0, 637.0, 379.0, 265.0, 138.0, 113.0, 75.0, 44.0, 27.0, 22.0, 17.0, 8.0, 8.0, 3.0, 6.0, 5.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.2408447265625, -0.23402976989746094, -0.22721481323242188, -0.2203998565673828, -0.21358489990234375, -0.2067699432373047, -0.19995498657226562, -0.19314002990722656, -0.1863250732421875, -0.17951011657714844, -0.17269515991210938, -0.1658802032470703, -0.15906524658203125, -0.1522502899169922, -0.14543533325195312, -0.13862037658691406, -0.131805419921875, -0.12499046325683594, -0.11817550659179688, -0.11136054992675781, -0.10454559326171875, -0.09773063659667969, -0.09091567993164062, -0.08410072326660156, -0.0772857666015625, -0.07047080993652344, -0.06365585327148438, -0.05684089660644531, -0.05002593994140625, -0.04321098327636719, -0.036396026611328125, -0.029581069946289062, -0.02276611328125, -0.015951156616210938, -0.009136199951171875, -0.0023212432861328125, 0.00449371337890625, 0.011308670043945312, 0.018123626708984375, 0.024938583374023438, 0.0317535400390625, 0.03856849670410156, 0.045383453369140625, 0.05219841003417969, 0.05901336669921875, 0.06582832336425781, 0.07264328002929688, 0.07945823669433594, 0.086273193359375, 0.09308815002441406, 0.09990310668945312, 0.10671806335449219, 0.11353302001953125, 0.12034797668457031, 0.12716293334960938, 0.13397789001464844, 0.1407928466796875, 0.14760780334472656, 0.15442276000976562, 0.1612377166748047, 0.16805267333984375, 0.1748676300048828, 0.18168258666992188, 0.18849754333496094, 0.1953125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 6.0, 1.0, 3.0, 0.0, 6.0, 8.0, 6.0, 7.0, 9.0, 8.0, 12.0, 21.0, 20.0, 27.0, 31.0, 35.0, 31.0, 46.0, 57.0, 67.0, 84.0, 82.0, 86.0, 61.0, 49.0, 43.0, 27.0, 31.0, 22.0, 27.0, 11.0, 17.0, 15.0, 13.0, 6.0, 5.0, 2.0, 5.0, 5.0, 2.0, 5.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0546875, -0.05302906036376953, -0.05137062072753906, -0.049712181091308594, -0.048053741455078125, -0.046395301818847656, -0.04473686218261719, -0.04307842254638672, -0.04141998291015625, -0.03976154327392578, -0.03810310363769531, -0.036444664001464844, -0.034786224365234375, -0.033127784729003906, -0.03146934509277344, -0.02981090545654297, -0.0281524658203125, -0.02649402618408203, -0.024835586547851562, -0.023177146911621094, -0.021518707275390625, -0.019860267639160156, -0.018201828002929688, -0.01654338836669922, -0.01488494873046875, -0.013226509094238281, -0.011568069458007812, -0.009909629821777344, -0.008251190185546875, -0.006592750549316406, -0.0049343109130859375, -0.0032758712768554688, -0.001617431640625, 4.100799560546875e-05, 0.0016994476318359375, 0.0033578872680664062, 0.005016326904296875, 0.006674766540527344, 0.008333206176757812, 0.009991645812988281, 0.01165008544921875, 0.013308525085449219, 0.014966964721679688, 0.016625404357910156, 0.018283843994140625, 0.019942283630371094, 0.021600723266601562, 0.02325916290283203, 0.0249176025390625, 0.02657604217529297, 0.028234481811523438, 0.029892921447753906, 0.031551361083984375, 0.033209800720214844, 0.03486824035644531, 0.03652667999267578, 0.03818511962890625, 0.03984355926513672, 0.04150199890136719, 0.043160438537597656, 0.044818878173828125, 0.046477317810058594, 0.04813575744628906, 0.04979419708251953, 0.05145263671875]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 5.0, 3.0, 3.0, 5.0, 7.0, 6.0, 10.0, 16.0, 17.0, 21.0, 17.0, 26.0, 32.0, 41.0, 34.0, 54.0, 58.0, 70.0, 55.0, 63.0, 55.0, 62.0, 59.0, 56.0, 33.0, 39.0, 24.0, 23.0, 25.0, 21.0, 15.0, 9.0, 5.0, 6.0, 8.0, 4.0, 4.0, 6.0, 4.0, 1.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.538696765899658, -7.291049480438232, -7.043401718139648, -6.795754432678223, -6.548107147216797, -6.300459861755371, -6.052812099456787, -5.805164813995361, -5.557517051696777, -5.309869766235352, -5.062222003936768, -4.814574718475342, -4.566927433013916, -4.319279670715332, -4.071632385253906, -3.8239850997924805, -3.5763378143310547, -3.32869029045105, -3.081043004989624, -2.833395481109619, -2.5857481956481934, -2.3381006717681885, -2.0904531478881836, -1.8428057432174683, -1.595158338546753, -1.3475109338760376, -1.0998635292053223, -0.8522160053253174, -0.604568600654602, -0.3569211959838867, -0.10927367210388184, 0.1383737325668335, 0.38602161407470703, 0.6336690187454224, 0.8813164830207825, 1.1289639472961426, 1.376611351966858, 1.6242587566375732, 1.8719062805175781, 2.119553565979004, 2.367201089859009, 2.6148486137390137, 2.8624958992004395, 3.1101434230804443, 3.357790946960449, 3.605438232421875, 3.85308575630188, 4.100733280181885, 4.3483805656433105, 4.596027851104736, 4.84367561340332, 5.091322898864746, 5.338970184326172, 5.586617469787598, 5.834265232086182, 6.081912517547607, 6.329560279846191, 6.577207565307617, 6.824855327606201, 7.072502613067627, 7.320149898529053, 7.567797660827637, 7.8154449462890625, 8.063092231750488, 8.310739517211914]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 8.0, 6.0, 7.0, 6.0, 10.0, 17.0, 11.0, 12.0, 13.0, 21.0, 24.0, 24.0, 32.0, 25.0, 34.0, 38.0, 34.0, 44.0, 35.0, 32.0, 35.0, 46.0, 33.0, 41.0, 47.0, 47.0, 21.0, 37.0, 33.0, 29.0, 31.0, 24.0, 22.0, 18.0, 15.0, 13.0, 12.0, 14.0, 8.0, 9.0, 11.0, 9.0, 5.0, 3.0, 3.0, 3.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0], "bins": [-9.169685363769531, -8.897924423217773, -8.626164436340332, -8.354403495788574, -8.082643508911133, -7.810882568359375, -7.539122104644775, -7.267361640930176, -6.995601177215576, -6.723840713500977, -6.452080249786377, -6.180319786071777, -5.9085588455200195, -5.636798858642578, -5.36503791809082, -5.093277454376221, -4.821516990661621, -4.5497565269470215, -4.277996063232422, -4.006235599517822, -3.7344748973846436, -3.462714433670044, -3.1909537315368652, -2.9191932678222656, -2.647432804107666, -2.3756723403930664, -2.103911876678467, -1.832151174545288, -1.5603907108306885, -1.2886302471160889, -1.0168696641921997, -0.7451090812683105, -0.47334766387939453, -0.20158714056015015, 0.07017338275909424, 0.3419339060783386, 0.613694429397583, 0.8854548931121826, 1.1572154760360718, 1.428976058959961, 1.7007365226745605, 1.9724969863891602, 2.2442574501037598, 2.5160181522369385, 2.787778615951538, 3.0595390796661377, 3.3312997817993164, 3.603060245513916, 3.8748207092285156, 4.146581172943115, 4.418341636657715, 4.6901021003723145, 4.961862564086914, 5.233623504638672, 5.5053839683532715, 5.777144432067871, 6.048904895782471, 6.32066535949707, 6.59242582321167, 6.8641862869262695, 7.135947227478027, 7.407707214355469, 7.679468154907227, 7.951228618621826, 8.222989082336426]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.weight": {"_type": "histogram", "values": [4.0, 3.0, 2.0, 7.0, 8.0, 9.0, 19.0, 28.0, 29.0, 45.0, 76.0, 91.0, 179.0, 195.0, 340.0, 495.0, 812.0, 1158.0, 1950.0, 2754.0, 4423.0, 6807.0, 10379.0, 16262.0, 25696.0, 38495.0, 58079.0, 82656.0, 109925.0, 132185.0, 136296.0, 121464.0, 95475.0, 67957.0, 46815.0, 30677.0, 20067.0, 12915.0, 8263.0, 5352.0, 3553.0, 2292.0, 1509.0, 1004.0, 632.0, 399.0, 289.0, 170.0, 106.0, 77.0, 51.0, 28.0, 24.0, 27.0, 8.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.734375, -5.544677734375, -5.35498046875, -5.165283203125, -4.9755859375, -4.785888671875, -4.59619140625, -4.406494140625, -4.216796875, -4.027099609375, -3.83740234375, -3.647705078125, -3.4580078125, -3.268310546875, -3.07861328125, -2.888916015625, -2.69921875, -2.509521484375, -2.31982421875, -2.130126953125, -1.9404296875, -1.750732421875, -1.56103515625, -1.371337890625, -1.181640625, -0.991943359375, -0.80224609375, -0.612548828125, -0.4228515625, -0.233154296875, -0.04345703125, 0.146240234375, 0.3359375, 0.525634765625, 0.71533203125, 0.905029296875, 1.0947265625, 1.284423828125, 1.47412109375, 1.663818359375, 1.853515625, 2.043212890625, 2.23291015625, 2.422607421875, 2.6123046875, 2.802001953125, 2.99169921875, 3.181396484375, 3.37109375, 3.560791015625, 3.75048828125, 3.940185546875, 4.1298828125, 4.319580078125, 4.50927734375, 4.698974609375, 4.888671875, 5.078369140625, 5.26806640625, 5.457763671875, 5.6474609375, 5.837158203125, 6.02685546875, 6.216552734375, 6.40625]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 7.0, 9.0, 5.0, 6.0, 12.0, 15.0, 16.0, 14.0, 13.0, 18.0, 18.0, 29.0, 36.0, 35.0, 36.0, 42.0, 36.0, 32.0, 32.0, 40.0, 46.0, 42.0, 43.0, 35.0, 43.0, 35.0, 33.0, 34.0, 27.0, 28.0, 21.0, 25.0, 21.0, 24.0, 12.0, 14.0, 12.0, 10.0, 13.0, 11.0, 5.0, 7.0, 4.0, 3.0, 3.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0], "bins": [-9.265625, -8.9957275390625, -8.725830078125, -8.4559326171875, -8.18603515625, -7.9161376953125, -7.646240234375, -7.3763427734375, -7.1064453125, -6.8365478515625, -6.566650390625, -6.2967529296875, -6.02685546875, -5.7569580078125, -5.487060546875, -5.2171630859375, -4.947265625, -4.6773681640625, -4.407470703125, -4.1375732421875, -3.86767578125, -3.5977783203125, -3.327880859375, -3.0579833984375, -2.7880859375, -2.5181884765625, -2.248291015625, -1.9783935546875, -1.70849609375, -1.4385986328125, -1.168701171875, -0.8988037109375, -0.62890625, -0.3590087890625, -0.089111328125, 0.1807861328125, 0.45068359375, 0.7205810546875, 0.990478515625, 1.2603759765625, 1.5302734375, 1.8001708984375, 2.070068359375, 2.3399658203125, 2.60986328125, 2.8797607421875, 3.149658203125, 3.4195556640625, 3.689453125, 3.9593505859375, 4.229248046875, 4.4991455078125, 4.76904296875, 5.0389404296875, 5.308837890625, 5.5787353515625, 5.8486328125, 6.1185302734375, 6.388427734375, 6.6583251953125, 6.92822265625, 7.1981201171875, 7.468017578125, 7.7379150390625, 8.0078125]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 4.0, 12.0, 18.0, 21.0, 33.0, 53.0, 74.0, 113.0, 167.0, 257.0, 382.0, 582.0, 951.0, 1485.0, 2280.0, 3669.0, 5761.0, 9096.0, 14288.0, 22907.0, 36015.0, 55158.0, 80714.0, 111718.0, 137653.0, 143874.0, 127569.0, 98261.0, 69003.0, 45916.0, 29469.0, 18784.0, 11758.0, 7469.0, 4625.0, 3061.0, 1933.0, 1208.0, 758.0, 508.0, 323.0, 210.0, 142.0, 94.0, 59.0, 44.0, 27.0, 18.0, 12.0, 12.0, 4.0, 7.0, 1.0, 2.0, 1.0, 3.0, 1.0], "bins": [-6.453125, -6.25323486328125, -6.0533447265625, -5.85345458984375, -5.653564453125, -5.45367431640625, -5.2537841796875, -5.05389404296875, -4.85400390625, -4.65411376953125, -4.4542236328125, -4.25433349609375, -4.054443359375, -3.85455322265625, -3.6546630859375, -3.45477294921875, -3.2548828125, -3.05499267578125, -2.8551025390625, -2.65521240234375, -2.455322265625, -2.25543212890625, -2.0555419921875, -1.85565185546875, -1.65576171875, -1.45587158203125, -1.2559814453125, -1.05609130859375, -0.856201171875, -0.65631103515625, -0.4564208984375, -0.25653076171875, -0.056640625, 0.14324951171875, 0.3431396484375, 0.54302978515625, 0.742919921875, 0.94281005859375, 1.1427001953125, 1.34259033203125, 1.54248046875, 1.74237060546875, 1.9422607421875, 2.14215087890625, 2.342041015625, 2.54193115234375, 2.7418212890625, 2.94171142578125, 3.1416015625, 3.34149169921875, 3.5413818359375, 3.74127197265625, 3.941162109375, 4.14105224609375, 4.3409423828125, 4.54083251953125, 4.74072265625, 4.94061279296875, 5.1405029296875, 5.34039306640625, 5.540283203125, 5.74017333984375, 5.9400634765625, 6.13995361328125, 6.33984375]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 3.0, 4.0, 13.0, 7.0, 4.0, 11.0, 13.0, 11.0, 19.0, 23.0, 21.0, 31.0, 24.0, 31.0, 27.0, 37.0, 48.0, 43.0, 44.0, 40.0, 34.0, 50.0, 48.0, 41.0, 37.0, 40.0, 38.0, 34.0, 28.0, 22.0, 31.0, 24.0, 21.0, 16.0, 18.0, 12.0, 10.0, 7.0, 9.0, 7.0, 5.0, 7.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-5.17578125, -5.01025390625, -4.8447265625, -4.67919921875, -4.513671875, -4.34814453125, -4.1826171875, -4.01708984375, -3.8515625, -3.68603515625, -3.5205078125, -3.35498046875, -3.189453125, -3.02392578125, -2.8583984375, -2.69287109375, -2.52734375, -2.36181640625, -2.1962890625, -2.03076171875, -1.865234375, -1.69970703125, -1.5341796875, -1.36865234375, -1.203125, -1.03759765625, -0.8720703125, -0.70654296875, -0.541015625, -0.37548828125, -0.2099609375, -0.04443359375, 0.12109375, 0.28662109375, 0.4521484375, 0.61767578125, 0.783203125, 0.94873046875, 1.1142578125, 1.27978515625, 1.4453125, 1.61083984375, 1.7763671875, 1.94189453125, 2.107421875, 2.27294921875, 2.4384765625, 2.60400390625, 2.76953125, 2.93505859375, 3.1005859375, 3.26611328125, 3.431640625, 3.59716796875, 3.7626953125, 3.92822265625, 4.09375, 4.25927734375, 4.4248046875, 4.59033203125, 4.755859375, 4.92138671875, 5.0869140625, 5.25244140625, 5.41796875]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 1.0, 6.0, 5.0, 9.0, 9.0, 21.0, 22.0, 43.0, 56.0, 67.0, 115.0, 138.0, 246.0, 369.0, 547.0, 867.0, 1290.0, 2119.0, 3431.0, 5593.0, 9440.0, 16092.0, 28292.0, 49108.0, 85924.0, 143421.0, 201036.0, 191015.0, 129050.0, 76209.0, 43295.0, 24685.0, 14155.0, 8399.0, 5002.0, 3018.0, 1906.0, 1225.0, 803.0, 481.0, 311.0, 235.0, 172.0, 95.0, 77.0, 44.0, 44.0, 21.0, 13.0, 8.0, 7.0, 16.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0], "bins": [-3.00390625, -2.912567138671875, -2.82122802734375, -2.729888916015625, -2.6385498046875, -2.547210693359375, -2.45587158203125, -2.364532470703125, -2.273193359375, -2.181854248046875, -2.09051513671875, -1.999176025390625, -1.9078369140625, -1.816497802734375, -1.72515869140625, -1.633819580078125, -1.54248046875, -1.451141357421875, -1.35980224609375, -1.268463134765625, -1.1771240234375, -1.085784912109375, -0.99444580078125, -0.903106689453125, -0.811767578125, -0.720428466796875, -0.62908935546875, -0.537750244140625, -0.4464111328125, -0.355072021484375, -0.26373291015625, -0.172393798828125, -0.0810546875, 0.010284423828125, 0.10162353515625, 0.192962646484375, 0.2843017578125, 0.375640869140625, 0.46697998046875, 0.558319091796875, 0.649658203125, 0.740997314453125, 0.83233642578125, 0.923675537109375, 1.0150146484375, 1.106353759765625, 1.19769287109375, 1.289031982421875, 1.38037109375, 1.471710205078125, 1.56304931640625, 1.654388427734375, 1.7457275390625, 1.837066650390625, 1.92840576171875, 2.019744873046875, 2.111083984375, 2.202423095703125, 2.29376220703125, 2.385101318359375, 2.4764404296875, 2.567779541015625, 2.65911865234375, 2.750457763671875, 2.841796875]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 4.0, 0.0, 1.0, 6.0, 15.0, 12.0, 18.0, 20.0, 25.0, 35.0, 35.0, 51.0, 45.0, 58.0, 70.0, 70.0, 75.0, 70.0, 73.0, 58.0, 53.0, 39.0, 43.0, 33.0, 33.0, 16.0, 15.0, 10.0, 7.0, 9.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.000293731689453125, -0.0002860892564058304, -0.00027844682335853577, -0.00027080439031124115, -0.00026316195726394653, -0.0002555195242166519, -0.0002478770911693573, -0.00024023465812206268, -0.00023259222507476807, -0.00022494979202747345, -0.00021730735898017883, -0.00020966492593288422, -0.0002020224928855896, -0.00019438005983829498, -0.00018673762679100037, -0.00017909519374370575, -0.00017145276069641113, -0.00016381032764911652, -0.0001561678946018219, -0.00014852546155452728, -0.00014088302850723267, -0.00013324059545993805, -0.00012559816241264343, -0.00011795572936534882, -0.0001103132963180542, -0.00010267086327075958, -9.502843022346497e-05, -8.738599717617035e-05, -7.974356412887573e-05, -7.210113108158112e-05, -6.44586980342865e-05, -5.681626498699188e-05, -4.9173831939697266e-05, -4.153139889240265e-05, -3.388896584510803e-05, -2.6246532797813416e-05, -1.86040997505188e-05, -1.0961666703224182e-05, -3.3192336559295654e-06, 4.323199391365051e-06, 1.1965632438659668e-05, 1.9608065485954285e-05, 2.72504985332489e-05, 3.489293158054352e-05, 4.2535364627838135e-05, 5.017779767513275e-05, 5.782023072242737e-05, 6.546266376972198e-05, 7.31050968170166e-05, 8.074752986431122e-05, 8.838996291160583e-05, 9.603239595890045e-05, 0.00010367482900619507, 0.00011131726205348969, 0.0001189596951007843, 0.00012660212814807892, 0.00013424456119537354, 0.00014188699424266815, 0.00014952942728996277, 0.00015717186033725739, 0.000164814293384552, 0.00017245672643184662, 0.00018009915947914124, 0.00018774159252643585, 0.00019538402557373047]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 10.0, 12.0, 14.0, 19.0, 31.0, 58.0, 61.0, 151.0, 187.0, 278.0, 493.0, 721.0, 1140.0, 1780.0, 2930.0, 4783.0, 8050.0, 13537.0, 23437.0, 41049.0, 71831.0, 121132.0, 179347.0, 198767.0, 152432.0, 95129.0, 55106.0, 31328.0, 18018.0, 10543.0, 6198.0, 3696.0, 2320.0, 1425.0, 904.0, 594.0, 359.0, 242.0, 149.0, 113.0, 71.0, 39.0, 21.0, 14.0, 21.0, 13.0, 2.0, 4.0, 4.0, 3.0, 0.0, 1.0], "bins": [-3.126953125, -3.03826904296875, -2.9495849609375, -2.86090087890625, -2.772216796875, -2.68353271484375, -2.5948486328125, -2.50616455078125, -2.41748046875, -2.32879638671875, -2.2401123046875, -2.15142822265625, -2.062744140625, -1.97406005859375, -1.8853759765625, -1.79669189453125, -1.7080078125, -1.61932373046875, -1.5306396484375, -1.44195556640625, -1.353271484375, -1.26458740234375, -1.1759033203125, -1.08721923828125, -0.99853515625, -0.90985107421875, -0.8211669921875, -0.73248291015625, -0.643798828125, -0.55511474609375, -0.4664306640625, -0.37774658203125, -0.2890625, -0.20037841796875, -0.1116943359375, -0.02301025390625, 0.065673828125, 0.15435791015625, 0.2430419921875, 0.33172607421875, 0.42041015625, 0.50909423828125, 0.5977783203125, 0.68646240234375, 0.775146484375, 0.86383056640625, 0.9525146484375, 1.04119873046875, 1.1298828125, 1.21856689453125, 1.3072509765625, 1.39593505859375, 1.484619140625, 1.57330322265625, 1.6619873046875, 1.75067138671875, 1.83935546875, 1.92803955078125, 2.0167236328125, 2.10540771484375, 2.194091796875, 2.28277587890625, 2.3714599609375, 2.46014404296875, 2.548828125]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 4.0, 2.0, 4.0, 8.0, 4.0, 6.0, 5.0, 12.0, 14.0, 12.0, 16.0, 21.0, 20.0, 30.0, 43.0, 38.0, 56.0, 38.0, 64.0, 58.0, 67.0, 55.0, 67.0, 60.0, 37.0, 51.0, 37.0, 34.0, 21.0, 19.0, 18.0, 16.0, 15.0, 8.0, 10.0, 5.0, 11.0, 2.0, 4.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1240234375, -1.0908889770507812, -1.0577545166015625, -1.0246200561523438, -0.991485595703125, -0.9583511352539062, -0.9252166748046875, -0.8920822143554688, -0.85894775390625, -0.8258132934570312, -0.7926788330078125, -0.7595443725585938, -0.726409912109375, -0.6932754516601562, -0.6601409912109375, -0.6270065307617188, -0.5938720703125, -0.5607376098632812, -0.5276031494140625, -0.49446868896484375, -0.461334228515625, -0.42819976806640625, -0.3950653076171875, -0.36193084716796875, -0.32879638671875, -0.29566192626953125, -0.2625274658203125, -0.22939300537109375, -0.196258544921875, -0.16312408447265625, -0.1299896240234375, -0.09685516357421875, -0.063720703125, -0.03058624267578125, 0.0025482177734375, 0.03568267822265625, 0.068817138671875, 0.10195159912109375, 0.1350860595703125, 0.16822052001953125, 0.20135498046875, 0.23448944091796875, 0.2676239013671875, 0.30075836181640625, 0.333892822265625, 0.36702728271484375, 0.4001617431640625, 0.43329620361328125, 0.4664306640625, 0.49956512451171875, 0.5326995849609375, 0.5658340454101562, 0.598968505859375, 0.6321029663085938, 0.6652374267578125, 0.6983718872070312, 0.73150634765625, 0.7646408081054688, 0.7977752685546875, 0.8309097290039062, 0.864044189453125, 0.8971786499023438, 0.9303131103515625, 0.9634475708007812, 0.99658203125]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 4.0, 1.0, 5.0, 5.0, 10.0, 8.0, 9.0, 12.0, 8.0, 9.0, 19.0, 30.0, 23.0, 33.0, 32.0, 38.0, 55.0, 69.0, 62.0, 54.0, 65.0, 62.0, 63.0, 50.0, 54.0, 38.0, 34.0, 23.0, 26.0, 16.0, 21.0, 18.0, 12.0, 6.0, 9.0, 4.0, 4.0, 6.0, 3.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.793361186981201, -7.545561790466309, -7.297762393951416, -7.049962997436523, -6.802163124084473, -6.554364204406738, -6.3065643310546875, -6.058764934539795, -5.810965538024902, -5.56316614151001, -5.315366744995117, -5.067567348480225, -4.819767951965332, -4.571968078613281, -4.324168682098389, -4.076369285583496, -3.8285698890686035, -3.580770492553711, -3.3329710960388184, -3.0851714611053467, -2.837372064590454, -2.5895726680755615, -2.34177303314209, -2.0939736366271973, -1.8461742401123047, -1.598374843597412, -1.35057532787323, -1.1027758121490479, -0.8549764156341553, -0.6071770191192627, -0.35937750339508057, -0.11157798767089844, 0.13622188568115234, 0.3840213418006897, 0.631820797920227, 0.8796202540397644, 1.1274197101593018, 1.3752191066741943, 1.6230186223983765, 1.8708181381225586, 2.118617534637451, 2.3664169311523438, 2.6142163276672363, 2.862015962600708, 3.1098153591156006, 3.357614755630493, 3.605414390563965, 3.8532137870788574, 4.10101318359375, 4.348812580108643, 4.596611976623535, 4.844411373138428, 5.09221076965332, 5.340010643005371, 5.587810039520264, 5.835609436035156, 6.083408832550049, 6.331208229064941, 6.579007625579834, 6.826807022094727, 7.074606895446777, 7.322405815124512, 7.5702056884765625, 7.818005084991455, 8.065804481506348]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 4.0, 2.0, 6.0, 5.0, 7.0, 15.0, 10.0, 14.0, 11.0, 14.0, 18.0, 25.0, 25.0, 20.0, 22.0, 27.0, 40.0, 38.0, 44.0, 33.0, 29.0, 36.0, 32.0, 41.0, 42.0, 37.0, 47.0, 32.0, 41.0, 34.0, 22.0, 30.0, 28.0, 20.0, 23.0, 16.0, 20.0, 14.0, 14.0, 12.0, 7.0, 13.0, 8.0, 9.0, 5.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0], "bins": [-8.209084510803223, -7.949554920196533, -7.690025329589844, -7.430495738983154, -7.170966148376465, -6.911437034606934, -6.651907444000244, -6.392377853393555, -6.132848262786865, -5.873318672180176, -5.613789081573486, -5.354259490966797, -5.094730377197266, -4.835200309753418, -4.575671195983887, -4.316141605377197, -4.056612014770508, -3.7970824241638184, -3.537552833557129, -3.2780234813690186, -3.018493890762329, -2.7589643001556396, -2.4994349479675293, -2.23990535736084, -1.9803757667541504, -1.720846176147461, -1.461316704750061, -1.2017872333526611, -0.9422576427459717, -0.6827280521392822, -0.4231985807418823, -0.16366910934448242, 0.09586048126220703, 0.3553900122642517, 0.6149195432662964, 0.8744490742683411, 1.1339786052703857, 1.3935081958770752, 1.653037667274475, 1.912567138671875, 2.1720967292785645, 2.431626319885254, 2.6911559104919434, 2.9506852626800537, 3.210214853286743, 3.4697444438934326, 3.729273796081543, 3.9888033866882324, 4.248332977294922, 4.507862567901611, 4.767392158508301, 5.02692174911499, 5.28645133972168, 5.545980453491211, 5.8055100440979, 6.06503963470459, 6.324569225311279, 6.584098815917969, 6.843628406524658, 7.103157997131348, 7.362687110900879, 7.622217178344727, 7.881746292114258, 8.141275405883789, 8.400805473327637]}, "gradients/decoder.bert.encoder.layer.15.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 7.0, 5.0, 6.0, 10.0, 8.0, 28.0, 31.0, 61.0, 79.0, 110.0, 220.0, 331.0, 551.0, 893.0, 1421.0, 2400.0, 4055.0, 6962.0, 12081.0, 21336.0, 37609.0, 70452.0, 134045.0, 262278.0, 515435.0, 874580.0, 950915.0, 621971.0, 324121.0, 163162.0, 84390.0, 45682.0, 25130.0, 14014.0, 8110.0, 4760.0, 2890.0, 1674.0, 959.0, 625.0, 354.0, 201.0, 127.0, 86.0, 46.0, 32.0, 18.0, 13.0, 11.0, 6.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-8.5078125, -8.2586669921875, -8.009521484375, -7.7603759765625, -7.51123046875, -7.2620849609375, -7.012939453125, -6.7637939453125, -6.5146484375, -6.2655029296875, -6.016357421875, -5.7672119140625, -5.51806640625, -5.2689208984375, -5.019775390625, -4.7706298828125, -4.521484375, -4.2723388671875, -4.023193359375, -3.7740478515625, -3.52490234375, -3.2757568359375, -3.026611328125, -2.7774658203125, -2.5283203125, -2.2791748046875, -2.030029296875, -1.7808837890625, -1.53173828125, -1.2825927734375, -1.033447265625, -0.7843017578125, -0.53515625, -0.2860107421875, -0.036865234375, 0.2122802734375, 0.46142578125, 0.7105712890625, 0.959716796875, 1.2088623046875, 1.4580078125, 1.7071533203125, 1.956298828125, 2.2054443359375, 2.45458984375, 2.7037353515625, 2.952880859375, 3.2020263671875, 3.451171875, 3.7003173828125, 3.949462890625, 4.1986083984375, 4.44775390625, 4.6968994140625, 4.946044921875, 5.1951904296875, 5.4443359375, 5.6934814453125, 5.942626953125, 6.1917724609375, 6.44091796875, 6.6900634765625, 6.939208984375, 7.1883544921875, 7.4375]}, "gradients/decoder.bert.encoder.layer.15.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 6.0, 4.0, 4.0, 4.0, 1.0, 10.0, 15.0, 4.0, 8.0, 14.0, 17.0, 7.0, 22.0, 16.0, 21.0, 21.0, 27.0, 31.0, 34.0, 37.0, 27.0, 38.0, 35.0, 35.0, 39.0, 38.0, 41.0, 40.0, 37.0, 42.0, 36.0, 36.0, 27.0, 27.0, 25.0, 22.0, 19.0, 16.0, 14.0, 19.0, 15.0, 12.0, 12.0, 16.0, 4.0, 7.0, 8.0, 8.0, 3.0, 3.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 3.0], "bins": [-5.296875, -5.13018798828125, -4.9635009765625, -4.79681396484375, -4.630126953125, -4.46343994140625, -4.2967529296875, -4.13006591796875, -3.96337890625, -3.79669189453125, -3.6300048828125, -3.46331787109375, -3.296630859375, -3.12994384765625, -2.9632568359375, -2.79656982421875, -2.6298828125, -2.46319580078125, -2.2965087890625, -2.12982177734375, -1.963134765625, -1.79644775390625, -1.6297607421875, -1.46307373046875, -1.29638671875, -1.12969970703125, -0.9630126953125, -0.79632568359375, -0.629638671875, -0.46295166015625, -0.2962646484375, -0.12957763671875, 0.037109375, 0.20379638671875, 0.3704833984375, 0.53717041015625, 0.703857421875, 0.87054443359375, 1.0372314453125, 1.20391845703125, 1.37060546875, 1.53729248046875, 1.7039794921875, 1.87066650390625, 2.037353515625, 2.20404052734375, 2.3707275390625, 2.53741455078125, 2.7041015625, 2.87078857421875, 3.0374755859375, 3.20416259765625, 3.370849609375, 3.53753662109375, 3.7042236328125, 3.87091064453125, 4.03759765625, 4.20428466796875, 4.3709716796875, 4.53765869140625, 4.704345703125, 4.87103271484375, 5.0377197265625, 5.20440673828125, 5.37109375]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 13.0, 13.0, 23.0, 28.0, 52.0, 89.0, 132.0, 196.0, 355.0, 607.0, 941.0, 1579.0, 2730.0, 4685.0, 8248.0, 14880.0, 26522.0, 48142.0, 90659.0, 169653.0, 315651.0, 546917.0, 791581.0, 816680.0, 592380.0, 349266.0, 189111.0, 101130.0, 54000.0, 29637.0, 16472.0, 9387.0, 5061.0, 3024.0, 1757.0, 1077.0, 622.0, 386.0, 238.0, 146.0, 86.0, 59.0, 36.0, 21.0, 8.0, 6.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.3125, -7.09149169921875, -6.8704833984375, -6.64947509765625, -6.428466796875, -6.20745849609375, -5.9864501953125, -5.76544189453125, -5.54443359375, -5.32342529296875, -5.1024169921875, -4.88140869140625, -4.660400390625, -4.43939208984375, -4.2183837890625, -3.99737548828125, -3.7763671875, -3.55535888671875, -3.3343505859375, -3.11334228515625, -2.892333984375, -2.67132568359375, -2.4503173828125, -2.22930908203125, -2.00830078125, -1.78729248046875, -1.5662841796875, -1.34527587890625, -1.124267578125, -0.90325927734375, -0.6822509765625, -0.46124267578125, -0.240234375, -0.01922607421875, 0.2017822265625, 0.42279052734375, 0.643798828125, 0.86480712890625, 1.0858154296875, 1.30682373046875, 1.52783203125, 1.74884033203125, 1.9698486328125, 2.19085693359375, 2.411865234375, 2.63287353515625, 2.8538818359375, 3.07489013671875, 3.2958984375, 3.51690673828125, 3.7379150390625, 3.95892333984375, 4.179931640625, 4.40093994140625, 4.6219482421875, 4.84295654296875, 5.06396484375, 5.28497314453125, 5.5059814453125, 5.72698974609375, 5.947998046875, 6.16900634765625, 6.3900146484375, 6.61102294921875, 6.83203125]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 5.0, 5.0, 2.0, 5.0, 8.0, 8.0, 15.0, 19.0, 23.0, 31.0, 31.0, 56.0, 71.0, 50.0, 89.0, 93.0, 91.0, 126.0, 141.0, 137.0, 163.0, 195.0, 184.0, 192.0, 216.0, 197.0, 206.0, 209.0, 195.0, 157.0, 141.0, 135.0, 137.0, 108.0, 100.0, 80.0, 95.0, 49.0, 63.0, 54.0, 36.0, 29.0, 27.0, 15.0, 12.0, 11.0, 13.0, 16.0, 10.0, 5.0, 6.0, 4.0, 3.0, 4.0, 4.0, 3.0, 4.0, 3.0, 1.0, 1.0], "bins": [-2.37109375, -2.29156494140625, -2.2120361328125, -2.13250732421875, -2.052978515625, -1.97344970703125, -1.8939208984375, -1.81439208984375, -1.73486328125, -1.65533447265625, -1.5758056640625, -1.49627685546875, -1.416748046875, -1.33721923828125, -1.2576904296875, -1.17816162109375, -1.0986328125, -1.01910400390625, -0.9395751953125, -0.86004638671875, -0.780517578125, -0.70098876953125, -0.6214599609375, -0.54193115234375, -0.46240234375, -0.38287353515625, -0.3033447265625, -0.22381591796875, -0.144287109375, -0.06475830078125, 0.0147705078125, 0.09429931640625, 0.173828125, 0.25335693359375, 0.3328857421875, 0.41241455078125, 0.491943359375, 0.57147216796875, 0.6510009765625, 0.73052978515625, 0.81005859375, 0.88958740234375, 0.9691162109375, 1.04864501953125, 1.128173828125, 1.20770263671875, 1.2872314453125, 1.36676025390625, 1.4462890625, 1.52581787109375, 1.6053466796875, 1.68487548828125, 1.764404296875, 1.84393310546875, 1.9234619140625, 2.00299072265625, 2.08251953125, 2.16204833984375, 2.2415771484375, 2.32110595703125, 2.400634765625, 2.48016357421875, 2.5596923828125, 2.63922119140625, 2.71875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 3.0, 5.0, 1.0, 10.0, 5.0, 14.0, 10.0, 17.0, 12.0, 22.0, 30.0, 23.0, 51.0, 38.0, 69.0, 62.0, 64.0, 82.0, 62.0, 60.0, 59.0, 62.0, 52.0, 38.0, 27.0, 20.0, 17.0, 17.0, 9.0, 11.0, 10.0, 9.0, 5.0, 7.0, 5.0, 3.0, 2.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.78032398223877, -8.528129577636719, -8.275934219360352, -8.0237398147583, -7.771544933319092, -7.519350051879883, -7.267155170440674, -7.014960289001465, -6.762765884399414, -6.510571002960205, -6.258376121520996, -6.006181716918945, -5.753986835479736, -5.501791954040527, -5.249597072601318, -4.997402191162109, -4.7452073097229, -4.493012428283691, -4.240817546844482, -3.9886229038238525, -3.7364282608032227, -3.4842333793640137, -3.2320384979248047, -2.9798436164855957, -2.727648973464966, -2.475454092025757, -2.223259449005127, -1.971064567565918, -1.7188698053359985, -1.466675043106079, -1.2144801616668701, -0.9622853994369507, -0.710090160369873, -0.4578953683376312, -0.2057005763053894, 0.046494245529174805, 0.29868900775909424, 0.5508837699890137, 0.8030786514282227, 1.055273413658142, 1.3074681758880615, 1.559662938117981, 1.8118577003479004, 2.0640525817871094, 2.3162474632263184, 2.5684421062469482, 2.8206369876861572, 3.072831630706787, 3.325026512145996, 3.577221393585205, 3.829416036605835, 4.081610679626465, 4.333805561065674, 4.586000442504883, 4.838195323944092, 5.090390205383301, 5.342584609985352, 5.5947794914245605, 5.8469743728637695, 6.09916877746582, 6.351363658905029, 6.603558540344238, 6.855753421783447, 7.107948303222656, 7.360143184661865]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 1.0, 6.0, 1.0, 5.0, 5.0, 6.0, 6.0, 10.0, 17.0, 18.0, 14.0, 21.0, 20.0, 22.0, 23.0, 24.0, 42.0, 27.0, 40.0, 37.0, 33.0, 35.0, 51.0, 23.0, 37.0, 38.0, 35.0, 37.0, 26.0, 33.0, 35.0, 30.0, 31.0, 26.0, 33.0, 17.0, 22.0, 16.0, 21.0, 17.0, 8.0, 12.0, 7.0, 9.0, 6.0, 8.0, 1.0, 6.0, 4.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.824223518371582, -6.586084842681885, -6.347946643829346, -6.109807968139648, -5.871669292449951, -5.633531093597412, -5.395392417907715, -5.157254219055176, -4.9191155433654785, -4.680976867675781, -4.442838668823242, -4.204699993133545, -3.9665615558624268, -3.7284231185913086, -3.4902844429016113, -3.252146005630493, -3.014007329940796, -2.7758688926696777, -2.5377302169799805, -2.2995917797088623, -2.061453342437744, -1.8233147859573364, -1.5851762294769287, -1.3470377922058105, -1.1088992357254028, -0.8707607388496399, -0.632622241973877, -0.39448368549346924, -0.1563451886177063, 0.08179330825805664, 0.31993186473846436, 0.5580703020095825, 0.7962088584899902, 1.034347414970398, 1.2724858522415161, 1.5106244087219238, 1.748762845993042, 1.9869014024734497, 2.2250399589538574, 2.4631783962249756, 2.7013168334960938, 2.939455270767212, 3.177593946456909, 3.4157323837280273, 3.6538708209991455, 3.8920092582702637, 4.130147933959961, 4.3682861328125, 4.6064252853393555, 4.844563961029053, 5.082702159881592, 5.320840835571289, 5.558979511260986, 5.797117710113525, 6.035256385803223, 6.273394584655762, 6.511533260345459, 6.749671936035156, 6.987810134887695, 7.225948810577393, 7.46408748626709, 7.702225685119629, 7.940364360809326, 8.178503036499023, 8.416641235351562]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 2.0, 2.0, 8.0, 9.0, 14.0, 15.0, 25.0, 49.0, 69.0, 81.0, 148.0, 189.0, 276.0, 371.0, 519.0, 831.0, 1158.0, 1690.0, 2638.0, 3801.0, 5379.0, 8025.0, 11723.0, 17446.0, 25881.0, 38088.0, 56260.0, 81814.0, 115088.0, 148767.0, 150851.0, 116379.0, 83102.0, 56931.0, 38940.0, 26528.0, 17894.0, 11975.0, 8098.0, 5692.0, 3735.0, 2527.0, 1701.0, 1219.0, 823.0, 590.0, 419.0, 279.0, 159.0, 121.0, 92.0, 48.0, 46.0, 15.0, 12.0, 7.0, 6.0, 7.0, 5.0, 3.0, 1.0], "bins": [-1.001953125, -0.9716110229492188, -0.9412689208984375, -0.9109268188476562, -0.880584716796875, -0.8502426147460938, -0.8199005126953125, -0.7895584106445312, -0.75921630859375, -0.7288742065429688, -0.6985321044921875, -0.6681900024414062, -0.637847900390625, -0.6075057983398438, -0.5771636962890625, -0.5468215942382812, -0.5164794921875, -0.48613739013671875, -0.4557952880859375, -0.42545318603515625, -0.395111083984375, -0.36476898193359375, -0.3344268798828125, -0.30408477783203125, -0.27374267578125, -0.24340057373046875, -0.2130584716796875, -0.18271636962890625, -0.152374267578125, -0.12203216552734375, -0.0916900634765625, -0.06134796142578125, -0.031005859375, -0.00066375732421875, 0.0296783447265625, 0.06002044677734375, 0.090362548828125, 0.12070465087890625, 0.1510467529296875, 0.18138885498046875, 0.21173095703125, 0.24207305908203125, 0.2724151611328125, 0.30275726318359375, 0.333099365234375, 0.36344146728515625, 0.3937835693359375, 0.42412567138671875, 0.4544677734375, 0.48480987548828125, 0.5151519775390625, 0.5454940795898438, 0.575836181640625, 0.6061782836914062, 0.6365203857421875, 0.6668624877929688, 0.69720458984375, 0.7275466918945312, 0.7578887939453125, 0.7882308959960938, 0.818572998046875, 0.8489151000976562, 0.8792572021484375, 0.9095993041992188, 0.93994140625]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 3.0, 1.0, 6.0, 6.0, 13.0, 14.0, 13.0, 20.0, 26.0, 26.0, 28.0, 28.0, 27.0, 46.0, 32.0, 31.0, 37.0, 41.0, 47.0, 43.0, 43.0, 45.0, 35.0, 40.0, 32.0, 33.0, 37.0, 40.0, 27.0, 19.0, 28.0, 28.0, 17.0, 20.0, 12.0, 13.0, 9.0, 7.0, 3.0, 8.0, 3.0, 5.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.34765625, -7.08111572265625, -6.8145751953125, -6.54803466796875, -6.281494140625, -6.01495361328125, -5.7484130859375, -5.48187255859375, -5.21533203125, -4.94879150390625, -4.6822509765625, -4.41571044921875, -4.149169921875, -3.88262939453125, -3.6160888671875, -3.34954833984375, -3.0830078125, -2.81646728515625, -2.5499267578125, -2.28338623046875, -2.016845703125, -1.75030517578125, -1.4837646484375, -1.21722412109375, -0.95068359375, -0.68414306640625, -0.4176025390625, -0.15106201171875, 0.115478515625, 0.38201904296875, 0.6485595703125, 0.91510009765625, 1.181640625, 1.44818115234375, 1.7147216796875, 1.98126220703125, 2.247802734375, 2.51434326171875, 2.7808837890625, 3.04742431640625, 3.31396484375, 3.58050537109375, 3.8470458984375, 4.11358642578125, 4.380126953125, 4.64666748046875, 4.9132080078125, 5.17974853515625, 5.4462890625, 5.71282958984375, 5.9793701171875, 6.24591064453125, 6.512451171875, 6.77899169921875, 7.0455322265625, 7.31207275390625, 7.57861328125, 7.84515380859375, 8.1116943359375, 8.37823486328125, 8.644775390625, 8.91131591796875, 9.1778564453125, 9.44439697265625, 9.7109375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 6.0, 8.0, 8.0, 13.0, 23.0, 35.0, 48.0, 83.0, 109.0, 124.0, 206.0, 302.0, 438.0, 666.0, 935.0, 1372.0, 2124.0, 3353.0, 5105.0, 7815.0, 12104.0, 19021.0, 29786.0, 46236.0, 71799.0, 108556.0, 155554.0, 177192.0, 138825.0, 94740.0, 61390.0, 39193.0, 25418.0, 16025.0, 10352.0, 6705.0, 4283.0, 2841.0, 1831.0, 1281.0, 831.0, 647.0, 348.0, 268.0, 162.0, 129.0, 83.0, 64.0, 51.0, 30.0, 22.0, 16.0, 7.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.017578125, -0.9840240478515625, -0.950469970703125, -0.9169158935546875, -0.88336181640625, -0.8498077392578125, -0.816253662109375, -0.7826995849609375, -0.7491455078125, -0.7155914306640625, -0.682037353515625, -0.6484832763671875, -0.61492919921875, -0.5813751220703125, -0.547821044921875, -0.5142669677734375, -0.480712890625, -0.4471588134765625, -0.413604736328125, -0.3800506591796875, -0.34649658203125, -0.3129425048828125, -0.279388427734375, -0.2458343505859375, -0.2122802734375, -0.1787261962890625, -0.145172119140625, -0.1116180419921875, -0.07806396484375, -0.0445098876953125, -0.010955810546875, 0.0225982666015625, 0.05615234375, 0.0897064208984375, 0.123260498046875, 0.1568145751953125, 0.19036865234375, 0.2239227294921875, 0.257476806640625, 0.2910308837890625, 0.3245849609375, 0.3581390380859375, 0.391693115234375, 0.4252471923828125, 0.45880126953125, 0.4923553466796875, 0.525909423828125, 0.5594635009765625, 0.593017578125, 0.6265716552734375, 0.660125732421875, 0.6936798095703125, 0.72723388671875, 0.7607879638671875, 0.794342041015625, 0.8278961181640625, 0.8614501953125, 0.8950042724609375, 0.928558349609375, 0.9621124267578125, 0.99566650390625, 1.0292205810546875, 1.062774658203125, 1.0963287353515625, 1.1298828125]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 4.0, 6.0, 2.0, 2.0, 2.0, 7.0, 6.0, 11.0, 8.0, 9.0, 12.0, 17.0, 25.0, 23.0, 28.0, 38.0, 39.0, 28.0, 52.0, 31.0, 42.0, 43.0, 50.0, 50.0, 47.0, 51.0, 45.0, 39.0, 55.0, 41.0, 33.0, 24.0, 26.0, 17.0, 22.0, 14.0, 18.0, 16.0, 5.0, 3.0, 7.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.640625, -5.4560546875, -5.271484375, -5.0869140625, -4.90234375, -4.7177734375, -4.533203125, -4.3486328125, -4.1640625, -3.9794921875, -3.794921875, -3.6103515625, -3.42578125, -3.2412109375, -3.056640625, -2.8720703125, -2.6875, -2.5029296875, -2.318359375, -2.1337890625, -1.94921875, -1.7646484375, -1.580078125, -1.3955078125, -1.2109375, -1.0263671875, -0.841796875, -0.6572265625, -0.47265625, -0.2880859375, -0.103515625, 0.0810546875, 0.265625, 0.4501953125, 0.634765625, 0.8193359375, 1.00390625, 1.1884765625, 1.373046875, 1.5576171875, 1.7421875, 1.9267578125, 2.111328125, 2.2958984375, 2.48046875, 2.6650390625, 2.849609375, 3.0341796875, 3.21875, 3.4033203125, 3.587890625, 3.7724609375, 3.95703125, 4.1416015625, 4.326171875, 4.5107421875, 4.6953125, 4.8798828125, 5.064453125, 5.2490234375, 5.43359375, 5.6181640625, 5.802734375, 5.9873046875, 6.171875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 0.0, 1.0, 3.0, 5.0, 6.0, 11.0, 18.0, 30.0, 40.0, 63.0, 87.0, 130.0, 196.0, 330.0, 509.0, 724.0, 1214.0, 1922.0, 3355.0, 5785.0, 9738.0, 18203.0, 34547.0, 68691.0, 139881.0, 276959.0, 241221.0, 119149.0, 58603.0, 29179.0, 16223.0, 8872.0, 5033.0, 2991.0, 1682.0, 1070.0, 736.0, 439.0, 325.0, 206.0, 130.0, 87.0, 56.0, 43.0, 18.0, 16.0, 15.0, 7.0, 6.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0906982421875, -0.08794021606445312, -0.08518218994140625, -0.08242416381835938, -0.0796661376953125, -0.07690811157226562, -0.07415008544921875, -0.07139205932617188, -0.068634033203125, -0.06587600708007812, -0.06311798095703125, -0.060359954833984375, -0.0576019287109375, -0.054843902587890625, -0.05208587646484375, -0.049327850341796875, -0.04656982421875, -0.043811798095703125, -0.04105377197265625, -0.038295745849609375, -0.0355377197265625, -0.032779693603515625, -0.03002166748046875, -0.027263641357421875, -0.024505615234375, -0.021747589111328125, -0.01898956298828125, -0.016231536865234375, -0.0134735107421875, -0.010715484619140625, -0.00795745849609375, -0.005199432373046875, -0.00244140625, 0.000316619873046875, 0.00307464599609375, 0.005832672119140625, 0.0085906982421875, 0.011348724365234375, 0.01410675048828125, 0.016864776611328125, 0.019622802734375, 0.022380828857421875, 0.02513885498046875, 0.027896881103515625, 0.0306549072265625, 0.033412933349609375, 0.03617095947265625, 0.038928985595703125, 0.04168701171875, 0.044445037841796875, 0.04720306396484375, 0.049961090087890625, 0.0527191162109375, 0.055477142333984375, 0.05823516845703125, 0.060993194580078125, 0.063751220703125, 0.06650924682617188, 0.06926727294921875, 0.07202529907226562, 0.0747833251953125, 0.07754135131835938, 0.08029937744140625, 0.08305740356445312, 0.0858154296875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 6.0, 7.0, 7.0, 11.0, 8.0, 16.0, 17.0, 18.0, 26.0, 24.0, 26.0, 35.0, 41.0, 31.0, 44.0, 54.0, 62.0, 41.0, 50.0, 49.0, 51.0, 53.0, 56.0, 43.0, 30.0, 28.0, 27.0, 30.0, 22.0, 15.0, 8.0, 11.0, 16.0, 6.0, 9.0, 6.0, 6.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.0192394256591797e-05, -9.82917845249176e-06, -9.465962648391724e-06, -9.102746844291687e-06, -8.73953104019165e-06, -8.376315236091614e-06, -8.013099431991577e-06, -7.64988362789154e-06, -7.286667823791504e-06, -6.923452019691467e-06, -6.560236215591431e-06, -6.197020411491394e-06, -5.833804607391357e-06, -5.470588803291321e-06, -5.107372999191284e-06, -4.7441571950912476e-06, -4.380941390991211e-06, -4.017725586891174e-06, -3.6545097827911377e-06, -3.291293978691101e-06, -2.9280781745910645e-06, -2.564862370491028e-06, -2.201646566390991e-06, -1.8384307622909546e-06, -1.475214958190918e-06, -1.1119991540908813e-06, -7.487833499908447e-07, -3.855675458908081e-07, -2.2351741790771484e-08, 3.4086406230926514e-07, 7.040798664093018e-07, 1.0672956705093384e-06, 1.430511474609375e-06, 1.7937272787094116e-06, 2.1569430828094482e-06, 2.520158886909485e-06, 2.8833746910095215e-06, 3.246590495109558e-06, 3.6098062992095947e-06, 3.973022103309631e-06, 4.336237907409668e-06, 4.699453711509705e-06, 5.062669515609741e-06, 5.425885319709778e-06, 5.7891011238098145e-06, 6.152316927909851e-06, 6.515532732009888e-06, 6.878748536109924e-06, 7.241964340209961e-06, 7.6051801443099976e-06, 7.968395948410034e-06, 8.33161175251007e-06, 8.694827556610107e-06, 9.058043360710144e-06, 9.42125916481018e-06, 9.784474968910217e-06, 1.0147690773010254e-05, 1.051090657711029e-05, 1.0874122381210327e-05, 1.1237338185310364e-05, 1.16005539894104e-05, 1.1963769793510437e-05, 1.2326985597610474e-05, 1.269020140171051e-05, 1.3053417205810547e-05]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 1.0, 10.0, 17.0, 18.0, 26.0, 37.0, 47.0, 79.0, 95.0, 127.0, 234.0, 396.0, 532.0, 789.0, 1213.0, 1997.0, 3123.0, 4928.0, 7862.0, 12568.0, 20481.0, 33341.0, 56565.0, 97943.0, 172495.0, 239135.0, 164298.0, 92697.0, 53807.0, 31720.0, 19529.0, 11930.0, 7467.0, 4686.0, 2960.0, 1856.0, 1241.0, 725.0, 535.0, 315.0, 255.0, 149.0, 101.0, 78.0, 50.0, 30.0, 22.0, 17.0, 13.0, 9.0, 6.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.09429931640625, -0.09139347076416016, -0.08848762512207031, -0.08558177947998047, -0.08267593383789062, -0.07977008819580078, -0.07686424255371094, -0.0739583969116211, -0.07105255126953125, -0.0681467056274414, -0.06524085998535156, -0.06233501434326172, -0.059429168701171875, -0.05652332305908203, -0.05361747741699219, -0.050711631774902344, -0.0478057861328125, -0.044899940490722656, -0.04199409484863281, -0.03908824920654297, -0.036182403564453125, -0.03327655792236328, -0.030370712280273438, -0.027464866638183594, -0.02455902099609375, -0.021653175354003906, -0.018747329711914062, -0.01584148406982422, -0.012935638427734375, -0.010029792785644531, -0.0071239471435546875, -0.004218101501464844, -0.001312255859375, 0.0015935897827148438, 0.0044994354248046875, 0.007405281066894531, 0.010311126708984375, 0.013216972351074219, 0.016122817993164062, 0.019028663635253906, 0.02193450927734375, 0.024840354919433594, 0.027746200561523438, 0.03065204620361328, 0.033557891845703125, 0.03646373748779297, 0.03936958312988281, 0.042275428771972656, 0.0451812744140625, 0.048087120056152344, 0.05099296569824219, 0.05389881134033203, 0.056804656982421875, 0.05971050262451172, 0.06261634826660156, 0.0655221939086914, 0.06842803955078125, 0.0713338851928711, 0.07423973083496094, 0.07714557647705078, 0.08005142211914062, 0.08295726776123047, 0.08586311340332031, 0.08876895904541016, 0.0916748046875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 3.0, 5.0, 3.0, 3.0, 0.0, 7.0, 3.0, 4.0, 6.0, 12.0, 9.0, 13.0, 14.0, 22.0, 25.0, 27.0, 41.0, 32.0, 44.0, 50.0, 44.0, 58.0, 52.0, 56.0, 44.0, 61.0, 46.0, 39.0, 47.0, 34.0, 34.0, 29.0, 19.0, 21.0, 21.0, 14.0, 14.0, 14.0, 10.0, 8.0, 4.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.042236328125, -0.04071044921875, -0.0391845703125, -0.03765869140625, -0.0361328125, -0.03460693359375, -0.0330810546875, -0.03155517578125, -0.030029296875, -0.02850341796875, -0.0269775390625, -0.02545166015625, -0.02392578125, -0.02239990234375, -0.0208740234375, -0.01934814453125, -0.017822265625, -0.01629638671875, -0.0147705078125, -0.01324462890625, -0.01171875, -0.01019287109375, -0.0086669921875, -0.00714111328125, -0.005615234375, -0.00408935546875, -0.0025634765625, -0.00103759765625, 0.00048828125, 0.00201416015625, 0.0035400390625, 0.00506591796875, 0.006591796875, 0.00811767578125, 0.0096435546875, 0.01116943359375, 0.0126953125, 0.01422119140625, 0.0157470703125, 0.01727294921875, 0.018798828125, 0.02032470703125, 0.0218505859375, 0.02337646484375, 0.02490234375, 0.02642822265625, 0.0279541015625, 0.02947998046875, 0.031005859375, 0.03253173828125, 0.0340576171875, 0.03558349609375, 0.037109375, 0.03863525390625, 0.0401611328125, 0.04168701171875, 0.043212890625, 0.04473876953125, 0.0462646484375, 0.04779052734375, 0.04931640625, 0.05084228515625, 0.0523681640625, 0.05389404296875, 0.055419921875]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 5.0, 5.0, 5.0, 7.0, 8.0, 16.0, 11.0, 15.0, 24.0, 23.0, 26.0, 39.0, 56.0, 58.0, 60.0, 75.0, 82.0, 63.0, 61.0, 60.0, 65.0, 43.0, 42.0, 28.0, 19.0, 15.0, 18.0, 9.0, 14.0, 8.0, 9.0, 6.0, 6.0, 5.0, 4.0, 1.0, 4.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.574780464172363, -8.321664810180664, -8.068548202514648, -7.815432071685791, -7.562315940856934, -7.309200286865234, -7.056084156036377, -6.8029680252075195, -6.549851894378662, -6.296735763549805, -6.043619632720947, -5.79050350189209, -5.537387847900391, -5.284271240234375, -5.031155586242676, -4.778039455413818, -4.524923324584961, -4.2718071937561035, -4.018691062927246, -3.7655751705169678, -3.5124590396881104, -3.259342908859253, -3.0062270164489746, -2.753110885620117, -2.4999947547912598, -2.2468786239624023, -1.9937626123428345, -1.7406466007232666, -1.4875304698944092, -1.2344143390655518, -0.9812983274459839, -0.728182315826416, -0.4750657081604004, -0.22194963693618774, 0.031166434288024902, 0.28428250551223755, 0.5373985767364502, 0.7905147075653076, 1.0436307191848755, 1.2967467308044434, 1.5498628616333008, 1.8029789924621582, 2.0560951232910156, 2.309211015701294, 2.5623271465301514, 2.815443277359009, 3.068559169769287, 3.3216753005981445, 3.574791431427002, 3.8279075622558594, 4.081023693084717, 4.334139823913574, 4.587255477905273, 4.840372085571289, 5.093487739562988, 5.346603870391846, 5.599720001220703, 5.8528361320495605, 6.105952262878418, 6.359068393707275, 6.612184524536133, 6.865300178527832, 7.1184163093566895, 7.371532440185547, 7.624648571014404]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 1.0, 6.0, 1.0, 5.0, 5.0, 6.0, 6.0, 10.0, 15.0, 20.0, 14.0, 22.0, 18.0, 24.0, 23.0, 22.0, 43.0, 28.0, 40.0, 38.0, 30.0, 37.0, 51.0, 22.0, 38.0, 36.0, 37.0, 37.0, 28.0, 30.0, 36.0, 29.0, 33.0, 26.0, 30.0, 19.0, 20.0, 17.0, 22.0, 16.0, 8.0, 12.0, 7.0, 9.0, 6.0, 8.0, 1.0, 6.0, 4.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.82709264755249, -6.589954853057861, -6.352816581726074, -6.115678787231445, -5.878540992736816, -5.641402721405029, -5.4042649269104, -5.167126655578613, -4.929988861083984, -4.6928510665893555, -4.455712795257568, -4.2185750007629395, -3.9814369678497314, -3.7442989349365234, -3.5071611404418945, -3.2700231075286865, -3.0328850746154785, -2.7957470417022705, -2.5586090087890625, -2.3214712142944336, -2.0843331813812256, -1.8471951484680176, -1.6100572347640991, -1.3729193210601807, -1.1357812881469727, -0.8986433148384094, -0.6615053415298462, -0.42436736822128296, -0.18722939491271973, 0.04990863800048828, 0.28704655170440674, 0.5241844654083252, 0.7613229751586914, 0.9984609484672546, 1.2355989217758179, 1.4727368354797363, 1.7098748683929443, 1.9470129013061523, 2.1841506958007812, 2.4212887287139893, 2.6584267616271973, 2.8955647945404053, 3.1327028274536133, 3.369840621948242, 3.60697865486145, 3.844116687774658, 4.081254482269287, 4.318392753601074, 4.555530548095703, 4.792668342590332, 5.029806613922119, 5.266944408416748, 5.504082679748535, 5.741220474243164, 5.978358268737793, 6.215496063232422, 6.452634334564209, 6.689772129058838, 6.926910400390625, 7.164048194885254, 7.401185989379883, 7.63832426071167, 7.875462055206299, 8.112600326538086, 8.349738121032715]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0, 10.0, 0.0, 9.0, 18.0, 22.0, 40.0, 73.0, 115.0, 208.0, 320.0, 557.0, 963.0, 1569.0, 2706.0, 4250.0, 6939.0, 11771.0, 19254.0, 32585.0, 53766.0, 85423.0, 128903.0, 163884.0, 166421.0, 133680.0, 90861.0, 57385.0, 34611.0, 20890.0, 12421.0, 7388.0, 4554.0, 2777.0, 1658.0, 1012.0, 593.0, 358.0, 236.0, 126.0, 86.0, 45.0, 28.0, 18.0, 13.0, 7.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.6953125, -6.48651123046875, -6.2777099609375, -6.06890869140625, -5.860107421875, -5.65130615234375, -5.4425048828125, -5.23370361328125, -5.02490234375, -4.81610107421875, -4.6072998046875, -4.39849853515625, -4.189697265625, -3.98089599609375, -3.7720947265625, -3.56329345703125, -3.3544921875, -3.14569091796875, -2.9368896484375, -2.72808837890625, -2.519287109375, -2.31048583984375, -2.1016845703125, -1.89288330078125, -1.68408203125, -1.47528076171875, -1.2664794921875, -1.05767822265625, -0.848876953125, -0.64007568359375, -0.4312744140625, -0.22247314453125, -0.013671875, 0.19512939453125, 0.4039306640625, 0.61273193359375, 0.821533203125, 1.03033447265625, 1.2391357421875, 1.44793701171875, 1.65673828125, 1.86553955078125, 2.0743408203125, 2.28314208984375, 2.491943359375, 2.70074462890625, 2.9095458984375, 3.11834716796875, 3.3271484375, 3.53594970703125, 3.7447509765625, 3.95355224609375, 4.162353515625, 4.37115478515625, 4.5799560546875, 4.78875732421875, 4.99755859375, 5.20635986328125, 5.4151611328125, 5.62396240234375, 5.832763671875, 6.04156494140625, 6.2503662109375, 6.45916748046875, 6.66796875]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 6.0, 2.0, 4.0, 7.0, 3.0, 9.0, 13.0, 7.0, 15.0, 15.0, 23.0, 27.0, 18.0, 27.0, 32.0, 41.0, 19.0, 26.0, 41.0, 43.0, 45.0, 37.0, 35.0, 50.0, 35.0, 31.0, 36.0, 45.0, 31.0, 35.0, 34.0, 22.0, 29.0, 26.0, 22.0, 15.0, 15.0, 18.0, 13.0, 8.0, 12.0, 10.0, 6.0, 7.0, 4.0, 2.0, 3.0, 3.0, 3.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0], "bins": [-7.6640625, -7.42041015625, -7.1767578125, -6.93310546875, -6.689453125, -6.44580078125, -6.2021484375, -5.95849609375, -5.71484375, -5.47119140625, -5.2275390625, -4.98388671875, -4.740234375, -4.49658203125, -4.2529296875, -4.00927734375, -3.765625, -3.52197265625, -3.2783203125, -3.03466796875, -2.791015625, -2.54736328125, -2.3037109375, -2.06005859375, -1.81640625, -1.57275390625, -1.3291015625, -1.08544921875, -0.841796875, -0.59814453125, -0.3544921875, -0.11083984375, 0.1328125, 0.37646484375, 0.6201171875, 0.86376953125, 1.107421875, 1.35107421875, 1.5947265625, 1.83837890625, 2.08203125, 2.32568359375, 2.5693359375, 2.81298828125, 3.056640625, 3.30029296875, 3.5439453125, 3.78759765625, 4.03125, 4.27490234375, 4.5185546875, 4.76220703125, 5.005859375, 5.24951171875, 5.4931640625, 5.73681640625, 5.98046875, 6.22412109375, 6.4677734375, 6.71142578125, 6.955078125, 7.19873046875, 7.4423828125, 7.68603515625, 7.9296875]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 5.0, 4.0, 2.0, 5.0, 16.0, 17.0, 29.0, 47.0, 59.0, 89.0, 122.0, 170.0, 274.0, 380.0, 554.0, 777.0, 1225.0, 1883.0, 2874.0, 4295.0, 6606.0, 10250.0, 16010.0, 24500.0, 37500.0, 55200.0, 79860.0, 107325.0, 130680.0, 137703.0, 123437.0, 96996.0, 69767.0, 48236.0, 32084.0, 20879.0, 13308.0, 8852.0, 5602.0, 3643.0, 2436.0, 1597.0, 1055.0, 715.0, 479.0, 319.0, 233.0, 149.0, 106.0, 63.0, 45.0, 35.0, 28.0, 18.0, 9.0, 8.0, 5.0, 1.0, 2.0, 4.0, 0.0, 1.0], "bins": [-5.25, -5.08233642578125, -4.9146728515625, -4.74700927734375, -4.579345703125, -4.41168212890625, -4.2440185546875, -4.07635498046875, -3.90869140625, -3.74102783203125, -3.5733642578125, -3.40570068359375, -3.238037109375, -3.07037353515625, -2.9027099609375, -2.73504638671875, -2.5673828125, -2.39971923828125, -2.2320556640625, -2.06439208984375, -1.896728515625, -1.72906494140625, -1.5614013671875, -1.39373779296875, -1.22607421875, -1.05841064453125, -0.8907470703125, -0.72308349609375, -0.555419921875, -0.38775634765625, -0.2200927734375, -0.05242919921875, 0.115234375, 0.28289794921875, 0.4505615234375, 0.61822509765625, 0.785888671875, 0.95355224609375, 1.1212158203125, 1.28887939453125, 1.45654296875, 1.62420654296875, 1.7918701171875, 1.95953369140625, 2.127197265625, 2.29486083984375, 2.4625244140625, 2.63018798828125, 2.7978515625, 2.96551513671875, 3.1331787109375, 3.30084228515625, 3.468505859375, 3.63616943359375, 3.8038330078125, 3.97149658203125, 4.13916015625, 4.30682373046875, 4.4744873046875, 4.64215087890625, 4.809814453125, 4.97747802734375, 5.1451416015625, 5.31280517578125, 5.48046875]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 3.0, 2.0, 3.0, 4.0, 9.0, 5.0, 9.0, 11.0, 17.0, 15.0, 24.0, 11.0, 19.0, 28.0, 27.0, 29.0, 23.0, 28.0, 37.0, 35.0, 39.0, 38.0, 39.0, 39.0, 28.0, 40.0, 37.0, 34.0, 43.0, 32.0, 30.0, 35.0, 33.0, 23.0, 22.0, 26.0, 14.0, 16.0, 10.0, 14.0, 16.0, 17.0, 6.0, 9.0, 6.0, 1.0, 4.0, 3.0, 7.0, 7.0, 3.0, 2.0, 3.0], "bins": [-4.99609375, -4.85638427734375, -4.7166748046875, -4.57696533203125, -4.437255859375, -4.29754638671875, -4.1578369140625, -4.01812744140625, -3.87841796875, -3.73870849609375, -3.5989990234375, -3.45928955078125, -3.319580078125, -3.17987060546875, -3.0401611328125, -2.90045166015625, -2.7607421875, -2.62103271484375, -2.4813232421875, -2.34161376953125, -2.201904296875, -2.06219482421875, -1.9224853515625, -1.78277587890625, -1.64306640625, -1.50335693359375, -1.3636474609375, -1.22393798828125, -1.084228515625, -0.94451904296875, -0.8048095703125, -0.66510009765625, -0.525390625, -0.38568115234375, -0.2459716796875, -0.10626220703125, 0.033447265625, 0.17315673828125, 0.3128662109375, 0.45257568359375, 0.59228515625, 0.73199462890625, 0.8717041015625, 1.01141357421875, 1.151123046875, 1.29083251953125, 1.4305419921875, 1.57025146484375, 1.7099609375, 1.84967041015625, 1.9893798828125, 2.12908935546875, 2.268798828125, 2.40850830078125, 2.5482177734375, 2.68792724609375, 2.82763671875, 2.96734619140625, 3.1070556640625, 3.24676513671875, 3.386474609375, 3.52618408203125, 3.6658935546875, 3.80560302734375, 3.9453125]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 6.0, 10.0, 12.0, 24.0, 31.0, 32.0, 60.0, 114.0, 157.0, 243.0, 397.0, 613.0, 1072.0, 1772.0, 3172.0, 5671.0, 10219.0, 18812.0, 35081.0, 66203.0, 119589.0, 191859.0, 219883.0, 164307.0, 96058.0, 51567.0, 27661.0, 14741.0, 8172.0, 4485.0, 2656.0, 1472.0, 950.0, 534.0, 357.0, 217.0, 115.0, 91.0, 61.0, 20.0, 22.0, 12.0, 13.0, 12.0, 5.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.833984375, -2.7489013671875, -2.663818359375, -2.5787353515625, -2.49365234375, -2.4085693359375, -2.323486328125, -2.2384033203125, -2.1533203125, -2.0682373046875, -1.983154296875, -1.8980712890625, -1.81298828125, -1.7279052734375, -1.642822265625, -1.5577392578125, -1.47265625, -1.3875732421875, -1.302490234375, -1.2174072265625, -1.13232421875, -1.0472412109375, -0.962158203125, -0.8770751953125, -0.7919921875, -0.7069091796875, -0.621826171875, -0.5367431640625, -0.45166015625, -0.3665771484375, -0.281494140625, -0.1964111328125, -0.111328125, -0.0262451171875, 0.058837890625, 0.1439208984375, 0.22900390625, 0.3140869140625, 0.399169921875, 0.4842529296875, 0.5693359375, 0.6544189453125, 0.739501953125, 0.8245849609375, 0.90966796875, 0.9947509765625, 1.079833984375, 1.1649169921875, 1.25, 1.3350830078125, 1.420166015625, 1.5052490234375, 1.59033203125, 1.6754150390625, 1.760498046875, 1.8455810546875, 1.9306640625, 2.0157470703125, 2.100830078125, 2.1859130859375, 2.27099609375, 2.3560791015625, 2.441162109375, 2.5262451171875, 2.611328125]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 1.0, 8.0, 3.0, 3.0, 8.0, 9.0, 19.0, 15.0, 26.0, 29.0, 35.0, 48.0, 49.0, 83.0, 82.0, 100.0, 95.0, 74.0, 67.0, 47.0, 44.0, 44.0, 27.0, 22.0, 15.0, 12.0, 14.0, 12.0, 3.0, 4.0, 5.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00030994415283203125, -0.00030196644365787506, -0.00029398873448371887, -0.0002860110253095627, -0.0002780333161354065, -0.0002700556069612503, -0.0002620778977870941, -0.00025410018861293793, -0.00024612247943878174, -0.00023814477026462555, -0.00023016706109046936, -0.00022218935191631317, -0.00021421164274215698, -0.0002062339335680008, -0.0001982562243938446, -0.00019027851521968842, -0.00018230080604553223, -0.00017432309687137604, -0.00016634538769721985, -0.00015836767852306366, -0.00015038996934890747, -0.00014241226017475128, -0.0001344345510005951, -0.0001264568418264389, -0.00011847913265228271, -0.00011050142347812653, -0.00010252371430397034, -9.454600512981415e-05, -8.656829595565796e-05, -7.859058678150177e-05, -7.061287760734558e-05, -6.263516843318939e-05, -5.46574592590332e-05, -4.6679750084877014e-05, -3.8702040910720825e-05, -3.0724331736564636e-05, -2.2746622562408447e-05, -1.4768913388252258e-05, -6.791204214096069e-06, 1.1865049600601196e-06, 9.164214134216309e-06, 1.7141923308372498e-05, 2.5119632482528687e-05, 3.3097341656684875e-05, 4.1075050830841064e-05, 4.9052760004997253e-05, 5.703046917915344e-05, 6.500817835330963e-05, 7.298588752746582e-05, 8.096359670162201e-05, 8.89413058757782e-05, 9.691901504993439e-05, 0.00010489672422409058, 0.00011287443339824677, 0.00012085214257240295, 0.00012882985174655914, 0.00013680756092071533, 0.00014478527009487152, 0.0001527629792690277, 0.0001607406884431839, 0.0001687183976173401, 0.00017669610679149628, 0.00018467381596565247, 0.00019265152513980865, 0.00020062923431396484]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 7.0, 7.0, 11.0, 13.0, 20.0, 28.0, 57.0, 60.0, 89.0, 146.0, 182.0, 281.0, 382.0, 600.0, 869.0, 1236.0, 2035.0, 3070.0, 4952.0, 7856.0, 12668.0, 21096.0, 34993.0, 58508.0, 94981.0, 143766.0, 181381.0, 167503.0, 119169.0, 75255.0, 45825.0, 27208.0, 16533.0, 10127.0, 6308.0, 3863.0, 2466.0, 1619.0, 1121.0, 715.0, 467.0, 318.0, 254.0, 145.0, 112.0, 67.0, 59.0, 42.0, 31.0, 16.0, 16.0, 14.0, 3.0, 5.0, 4.0, 2.0, 0.0, 3.0], "bins": [-2.236328125, -2.168060302734375, -2.09979248046875, -2.031524658203125, -1.9632568359375, -1.894989013671875, -1.82672119140625, -1.758453369140625, -1.690185546875, -1.621917724609375, -1.55364990234375, -1.485382080078125, -1.4171142578125, -1.348846435546875, -1.28057861328125, -1.212310791015625, -1.14404296875, -1.075775146484375, -1.00750732421875, -0.939239501953125, -0.8709716796875, -0.802703857421875, -0.73443603515625, -0.666168212890625, -0.597900390625, -0.529632568359375, -0.46136474609375, -0.393096923828125, -0.3248291015625, -0.256561279296875, -0.18829345703125, -0.120025634765625, -0.0517578125, 0.016510009765625, 0.08477783203125, 0.153045654296875, 0.2213134765625, 0.289581298828125, 0.35784912109375, 0.426116943359375, 0.494384765625, 0.562652587890625, 0.63092041015625, 0.699188232421875, 0.7674560546875, 0.835723876953125, 0.90399169921875, 0.972259521484375, 1.04052734375, 1.108795166015625, 1.17706298828125, 1.245330810546875, 1.3135986328125, 1.381866455078125, 1.45013427734375, 1.518402099609375, 1.586669921875, 1.654937744140625, 1.72320556640625, 1.791473388671875, 1.8597412109375, 1.928009033203125, 1.99627685546875, 2.064544677734375, 2.1328125]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 5.0, 6.0, 6.0, 1.0, 6.0, 12.0, 8.0, 19.0, 15.0, 22.0, 30.0, 28.0, 32.0, 28.0, 50.0, 69.0, 53.0, 73.0, 51.0, 63.0, 73.0, 47.0, 56.0, 37.0, 37.0, 35.0, 27.0, 24.0, 19.0, 19.0, 10.0, 8.0, 11.0, 8.0, 7.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.052734375, -1.019500732421875, -0.98626708984375, -0.953033447265625, -0.9197998046875, -0.886566162109375, -0.85333251953125, -0.820098876953125, -0.786865234375, -0.753631591796875, -0.72039794921875, -0.687164306640625, -0.6539306640625, -0.620697021484375, -0.58746337890625, -0.554229736328125, -0.52099609375, -0.487762451171875, -0.45452880859375, -0.421295166015625, -0.3880615234375, -0.354827880859375, -0.32159423828125, -0.288360595703125, -0.255126953125, -0.221893310546875, -0.18865966796875, -0.155426025390625, -0.1221923828125, -0.088958740234375, -0.05572509765625, -0.022491455078125, 0.0107421875, 0.043975830078125, 0.07720947265625, 0.110443115234375, 0.1436767578125, 0.176910400390625, 0.21014404296875, 0.243377685546875, 0.276611328125, 0.309844970703125, 0.34307861328125, 0.376312255859375, 0.4095458984375, 0.442779541015625, 0.47601318359375, 0.509246826171875, 0.54248046875, 0.575714111328125, 0.60894775390625, 0.642181396484375, 0.6754150390625, 0.708648681640625, 0.74188232421875, 0.775115966796875, 0.808349609375, 0.841583251953125, 0.87481689453125, 0.908050537109375, 0.9412841796875, 0.974517822265625, 1.00775146484375, 1.040985107421875, 1.07421875]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 0.0, 5.0, 2.0, 3.0, 6.0, 6.0, 8.0, 8.0, 16.0, 15.0, 12.0, 23.0, 23.0, 36.0, 36.0, 46.0, 41.0, 62.0, 58.0, 65.0, 75.0, 60.0, 52.0, 70.0, 44.0, 39.0, 27.0, 31.0, 26.0, 19.0, 22.0, 10.0, 6.0, 7.0, 9.0, 5.0, 6.0, 5.0, 11.0, 1.0, 1.0, 0.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.264078140258789, -8.031244277954102, -7.798410892486572, -7.565577030181885, -7.3327436447143555, -7.099909782409668, -6.8670759201049805, -6.634242534637451, -6.401409149169922, -6.168575286865234, -5.935741901397705, -5.702908039093018, -5.470074653625488, -5.237240791320801, -5.004406929016113, -4.771573543548584, -4.5387396812438965, -4.305905818939209, -4.07307243347168, -3.840238571166992, -3.607405185699463, -3.3745713233947754, -3.141737699508667, -2.9089040756225586, -2.67607045173645, -2.443236827850342, -2.2104032039642334, -1.9775694608688354, -1.744735836982727, -1.5119022130966187, -1.2790684700012207, -1.0462348461151123, -0.8134007453918457, -0.5805671215057373, -0.34773343801498413, -0.11489975452423096, 0.11793386936187744, 0.35076749324798584, 0.5836012363433838, 0.8164348602294922, 1.0492684841156006, 1.282102108001709, 1.5149357318878174, 1.7477694749832153, 1.9806030988693237, 2.2134366035461426, 2.44627046585083, 2.6791040897369385, 2.911937713623047, 3.1447713375091553, 3.3776049613952637, 3.610438823699951, 3.8432722091674805, 4.076106071472168, 4.3089399337768555, 4.541773319244385, 4.774606704711914, 5.007440567016602, 5.240273952484131, 5.473107814788818, 5.705941200256348, 5.938775062561035, 6.171608924865723, 6.404442310333252, 6.6372761726379395]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 3.0, 5.0, 1.0, 3.0, 2.0, 9.0, 14.0, 12.0, 16.0, 27.0, 13.0, 22.0, 23.0, 26.0, 37.0, 35.0, 44.0, 51.0, 28.0, 41.0, 38.0, 36.0, 43.0, 35.0, 47.0, 40.0, 28.0, 40.0, 31.0, 38.0, 23.0, 29.0, 29.0, 21.0, 18.0, 15.0, 21.0, 13.0, 9.0, 9.0, 8.0, 4.0, 8.0, 4.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.141225814819336, -7.8848490715026855, -7.628472805023193, -7.372096061706543, -7.115719318389893, -6.859342575073242, -6.60296630859375, -6.3465895652771, -6.090212821960449, -5.833836078643799, -5.577459812164307, -5.321083068847656, -5.064706325531006, -4.8083295822143555, -4.551953315734863, -4.295576572418213, -4.039200305938721, -3.7828238010406494, -3.526447057723999, -3.2700705528259277, -3.0136938095092773, -2.757317304611206, -2.5009407997131348, -2.2445640563964844, -1.988187551498413, -1.7318109273910522, -1.4754343032836914, -1.2190577983856201, -0.9626811742782593, -0.7063045501708984, -0.44992804527282715, -0.1935514211654663, 0.06282520294189453, 0.319201797246933, 0.5755783915519714, 0.8319549560546875, 1.0883315801620483, 1.3447082042694092, 1.6010847091674805, 1.8574613332748413, 2.113837957382202, 2.3702144622802734, 2.626591205596924, 2.882967710494995, 3.1393442153930664, 3.395720958709717, 3.652097463607788, 3.9084739685058594, 4.16485071182251, 4.42122745513916, 4.677603721618652, 4.933980464935303, 5.190357208251953, 5.446733474731445, 5.703110218048096, 5.959486961364746, 6.215863227844238, 6.472239971160889, 6.728616237640381, 6.984992980957031, 7.241369724273682, 7.497746467590332, 7.754122734069824, 8.010499000549316, 8.266876220703125]}, "gradients/decoder.bert.encoder.layer.14.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 5.0, 7.0, 8.0, 18.0, 13.0, 46.0, 67.0, 121.0, 155.0, 216.0, 340.0, 525.0, 825.0, 1259.0, 1845.0, 2976.0, 4649.0, 7540.0, 12294.0, 20847.0, 35895.0, 63622.0, 116201.0, 221460.0, 429116.0, 760993.0, 954133.0, 714339.0, 394270.0, 203219.0, 106899.0, 57951.0, 32676.0, 19145.0, 11441.0, 7044.0, 4472.0, 2755.0, 1718.0, 1112.0, 715.0, 475.0, 308.0, 186.0, 132.0, 94.0, 60.0, 39.0, 24.0, 15.0, 11.0, 6.0, 9.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.77734375, -6.55462646484375, -6.3319091796875, -6.10919189453125, -5.886474609375, -5.66375732421875, -5.4410400390625, -5.21832275390625, -4.99560546875, -4.77288818359375, -4.5501708984375, -4.32745361328125, -4.104736328125, -3.88201904296875, -3.6593017578125, -3.43658447265625, -3.2138671875, -2.99114990234375, -2.7684326171875, -2.54571533203125, -2.322998046875, -2.10028076171875, -1.8775634765625, -1.65484619140625, -1.43212890625, -1.20941162109375, -0.9866943359375, -0.76397705078125, -0.541259765625, -0.31854248046875, -0.0958251953125, 0.12689208984375, 0.349609375, 0.57232666015625, 0.7950439453125, 1.01776123046875, 1.240478515625, 1.46319580078125, 1.6859130859375, 1.90863037109375, 2.13134765625, 2.35406494140625, 2.5767822265625, 2.79949951171875, 3.022216796875, 3.24493408203125, 3.4676513671875, 3.69036865234375, 3.9130859375, 4.13580322265625, 4.3585205078125, 4.58123779296875, 4.803955078125, 5.02667236328125, 5.2493896484375, 5.47210693359375, 5.69482421875, 5.91754150390625, 6.1402587890625, 6.36297607421875, 6.585693359375, 6.80841064453125, 7.0311279296875, 7.25384521484375, 7.4765625]}, "gradients/decoder.bert.encoder.layer.14.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 3.0, 4.0, 9.0, 5.0, 10.0, 23.0, 21.0, 21.0, 20.0, 26.0, 24.0, 22.0, 38.0, 34.0, 38.0, 25.0, 39.0, 51.0, 37.0, 38.0, 35.0, 37.0, 31.0, 41.0, 40.0, 30.0, 29.0, 35.0, 35.0, 31.0, 23.0, 25.0, 19.0, 13.0, 19.0, 17.0, 6.0, 8.0, 13.0, 5.0, 6.0, 4.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0], "bins": [-5.109375, -4.94708251953125, -4.7847900390625, -4.62249755859375, -4.460205078125, -4.29791259765625, -4.1356201171875, -3.97332763671875, -3.81103515625, -3.64874267578125, -3.4864501953125, -3.32415771484375, -3.161865234375, -2.99957275390625, -2.8372802734375, -2.67498779296875, -2.5126953125, -2.35040283203125, -2.1881103515625, -2.02581787109375, -1.863525390625, -1.70123291015625, -1.5389404296875, -1.37664794921875, -1.21435546875, -1.05206298828125, -0.8897705078125, -0.72747802734375, -0.565185546875, -0.40289306640625, -0.2406005859375, -0.07830810546875, 0.083984375, 0.24627685546875, 0.4085693359375, 0.57086181640625, 0.733154296875, 0.89544677734375, 1.0577392578125, 1.22003173828125, 1.38232421875, 1.54461669921875, 1.7069091796875, 1.86920166015625, 2.031494140625, 2.19378662109375, 2.3560791015625, 2.51837158203125, 2.6806640625, 2.84295654296875, 3.0052490234375, 3.16754150390625, 3.329833984375, 3.49212646484375, 3.6544189453125, 3.81671142578125, 3.97900390625, 4.14129638671875, 4.3035888671875, 4.46588134765625, 4.628173828125, 4.79046630859375, 4.9527587890625, 5.11505126953125, 5.27734375]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 5.0, 9.0, 16.0, 21.0, 30.0, 61.0, 72.0, 124.0, 181.0, 334.0, 457.0, 745.0, 1198.0, 1802.0, 2966.0, 4814.0, 8122.0, 13888.0, 24205.0, 43066.0, 78654.0, 146533.0, 273011.0, 484063.0, 739040.0, 834967.0, 653784.0, 396813.0, 219465.0, 117806.0, 64241.0, 34954.0, 19980.0, 11667.0, 6604.0, 4026.0, 2464.0, 1529.0, 907.0, 579.0, 389.0, 231.0, 179.0, 102.0, 66.0, 47.0, 29.0, 19.0, 14.0, 3.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-6.890625, -6.683837890625, -6.47705078125, -6.270263671875, -6.0634765625, -5.856689453125, -5.64990234375, -5.443115234375, -5.236328125, -5.029541015625, -4.82275390625, -4.615966796875, -4.4091796875, -4.202392578125, -3.99560546875, -3.788818359375, -3.58203125, -3.375244140625, -3.16845703125, -2.961669921875, -2.7548828125, -2.548095703125, -2.34130859375, -2.134521484375, -1.927734375, -1.720947265625, -1.51416015625, -1.307373046875, -1.1005859375, -0.893798828125, -0.68701171875, -0.480224609375, -0.2734375, -0.066650390625, 0.14013671875, 0.346923828125, 0.5537109375, 0.760498046875, 0.96728515625, 1.174072265625, 1.380859375, 1.587646484375, 1.79443359375, 2.001220703125, 2.2080078125, 2.414794921875, 2.62158203125, 2.828369140625, 3.03515625, 3.241943359375, 3.44873046875, 3.655517578125, 3.8623046875, 4.069091796875, 4.27587890625, 4.482666015625, 4.689453125, 4.896240234375, 5.10302734375, 5.309814453125, 5.5166015625, 5.723388671875, 5.93017578125, 6.136962890625, 6.34375]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 5.0, 9.0, 4.0, 16.0, 24.0, 23.0, 30.0, 45.0, 53.0, 77.0, 96.0, 132.0, 138.0, 182.0, 207.0, 246.0, 233.0, 261.0, 309.0, 280.0, 245.0, 255.0, 209.0, 188.0, 169.0, 126.0, 110.0, 93.0, 60.0, 54.0, 42.0, 38.0, 37.0, 20.0, 18.0, 11.0, 6.0, 7.0, 6.0, 2.0, 2.0, 1.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.83203125, -2.734375, -2.63671875, -2.5390625, -2.44140625, -2.34375, -2.24609375, -2.1484375, -2.05078125, -1.953125, -1.85546875, -1.7578125, -1.66015625, -1.5625, -1.46484375, -1.3671875, -1.26953125, -1.171875, -1.07421875, -0.9765625, -0.87890625, -0.78125, -0.68359375, -0.5859375, -0.48828125, -0.390625, -0.29296875, -0.1953125, -0.09765625, 0.0, 0.09765625, 0.1953125, 0.29296875, 0.390625, 0.48828125, 0.5859375, 0.68359375, 0.78125, 0.87890625, 0.9765625, 1.07421875, 1.171875, 1.26953125, 1.3671875, 1.46484375, 1.5625, 1.66015625, 1.7578125, 1.85546875, 1.953125, 2.05078125, 2.1484375, 2.24609375, 2.34375, 2.44140625, 2.5390625, 2.63671875, 2.734375, 2.83203125, 2.9296875, 3.02734375, 3.125, 3.22265625, 3.3203125, 3.41796875]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 11.0, 7.0, 9.0, 6.0, 14.0, 18.0, 21.0, 31.0, 26.0, 38.0, 50.0, 50.0, 59.0, 80.0, 63.0, 83.0, 72.0, 58.0, 66.0, 46.0, 39.0, 25.0, 27.0, 13.0, 21.0, 13.0, 8.0, 10.0, 6.0, 8.0, 5.0, 2.0, 6.0, 1.0, 3.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.670610427856445, -8.424235343933105, -8.177860260009766, -7.931485176086426, -7.685110092163086, -7.438735008239746, -7.192359924316406, -6.945984840393066, -6.699609756469727, -6.453234672546387, -6.206859588623047, -5.960484504699707, -5.714109420776367, -5.467734336853027, -5.2213592529296875, -4.974984169006348, -4.72860860824585, -4.48223352432251, -4.23585844039917, -3.98948335647583, -3.7431082725524902, -3.4967331886291504, -3.2503578662872314, -3.0039827823638916, -2.7576076984405518, -2.511232614517212, -2.264857530593872, -2.018482208251953, -1.7721072435379028, -1.525732159614563, -1.2793569564819336, -1.0329818725585938, -0.7866063117980957, -0.5402312278747559, -0.29385608434677124, -0.04748094081878662, 0.19889414310455322, 0.44526922702789307, 0.6916444301605225, 0.9380195140838623, 1.1843945980072021, 1.430769681930542, 1.6771447658538818, 1.9235199689865112, 2.1698951721191406, 2.4162702560424805, 2.6626453399658203, 2.90902042388916, 3.1553955078125, 3.40177059173584, 3.6481456756591797, 3.8945207595825195, 4.140895843505859, 4.387270927429199, 4.633646011352539, 4.880021095275879, 5.126396179199219, 5.372771263122559, 5.619146347045898, 5.865521430969238, 6.111896514892578, 6.358271598815918, 6.604646682739258, 6.851021766662598, 7.097397327423096]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 1.0, 1.0, 6.0, 9.0, 11.0, 9.0, 10.0, 12.0, 10.0, 18.0, 14.0, 16.0, 25.0, 35.0, 39.0, 35.0, 33.0, 43.0, 35.0, 41.0, 42.0, 45.0, 31.0, 38.0, 40.0, 50.0, 34.0, 42.0, 30.0, 28.0, 29.0, 23.0, 18.0, 31.0, 28.0, 15.0, 16.0, 13.0, 10.0, 8.0, 7.0, 10.0, 6.0, 1.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.319005966186523, -7.080183029174805, -6.841360092163086, -6.602536678314209, -6.36371374130249, -6.1248908042907715, -5.8860673904418945, -5.647244453430176, -5.408421516418457, -5.169598579406738, -4.9307756423950195, -4.691952228546143, -4.453129291534424, -4.214306354522705, -3.9754831790924072, -3.7366600036621094, -3.4978370666503906, -3.259014129638672, -3.020190954208374, -2.781367778778076, -2.5425448417663574, -2.3037219047546387, -2.064898729324341, -1.8260756731033325, -1.5872526168823242, -1.348429560661316, -1.1096065044403076, -0.8707834482192993, -0.631960391998291, -0.3931373357772827, -0.15431427955627441, 0.08450877666473389, 0.3233318328857422, 0.5621548891067505, 0.8009779453277588, 1.039801001548767, 1.2786240577697754, 1.5174471139907837, 1.756270170211792, 1.9950932264328003, 2.2339162826538086, 2.4727392196655273, 2.711562395095825, 2.950385570526123, 3.189208507537842, 3.4280314445495605, 3.6668546199798584, 3.9056777954101562, 4.144500732421875, 4.383323669433594, 4.6221466064453125, 4.8609700202941895, 5.099792957305908, 5.338615894317627, 5.577439308166504, 5.816262245178223, 6.055085182189941, 6.29390811920166, 6.532731056213379, 6.771554470062256, 7.010377407073975, 7.249200344085693, 7.48802375793457, 7.726846694946289, 7.965669631958008]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 10.0, 12.0, 14.0, 22.0, 38.0, 44.0, 75.0, 78.0, 131.0, 206.0, 269.0, 380.0, 646.0, 874.0, 1313.0, 1904.0, 2909.0, 4208.0, 6372.0, 9596.0, 14634.0, 23068.0, 35385.0, 54359.0, 82686.0, 121490.0, 160636.0, 162163.0, 121942.0, 84277.0, 55124.0, 35665.0, 23200.0, 14917.0, 9911.0, 6502.0, 4388.0, 2967.0, 1931.0, 1365.0, 888.0, 640.0, 405.0, 277.0, 205.0, 144.0, 96.0, 61.0, 41.0, 25.0, 16.0, 17.0, 21.0, 8.0, 4.0, 5.0, 3.0, 1.0, 1.0], "bins": [-0.923828125, -0.8949737548828125, -0.866119384765625, -0.8372650146484375, -0.80841064453125, -0.7795562744140625, -0.750701904296875, -0.7218475341796875, -0.6929931640625, -0.6641387939453125, -0.635284423828125, -0.6064300537109375, -0.57757568359375, -0.5487213134765625, -0.519866943359375, -0.4910125732421875, -0.462158203125, -0.4333038330078125, -0.404449462890625, -0.3755950927734375, -0.34674072265625, -0.3178863525390625, -0.289031982421875, -0.2601776123046875, -0.2313232421875, -0.2024688720703125, -0.173614501953125, -0.1447601318359375, -0.11590576171875, -0.0870513916015625, -0.058197021484375, -0.0293426513671875, -0.00048828125, 0.0283660888671875, 0.057220458984375, 0.0860748291015625, 0.11492919921875, 0.1437835693359375, 0.172637939453125, 0.2014923095703125, 0.2303466796875, 0.2592010498046875, 0.288055419921875, 0.3169097900390625, 0.34576416015625, 0.3746185302734375, 0.403472900390625, 0.4323272705078125, 0.461181640625, 0.4900360107421875, 0.518890380859375, 0.5477447509765625, 0.57659912109375, 0.6054534912109375, 0.634307861328125, 0.6631622314453125, 0.6920166015625, 0.7208709716796875, 0.749725341796875, 0.7785797119140625, 0.80743408203125, 0.8362884521484375, 0.865142822265625, 0.8939971923828125, 0.9228515625]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 9.0, 0.0, 5.0, 3.0, 10.0, 6.0, 9.0, 13.0, 18.0, 12.0, 16.0, 15.0, 25.0, 18.0, 37.0, 33.0, 35.0, 28.0, 41.0, 34.0, 36.0, 35.0, 41.0, 42.0, 30.0, 37.0, 39.0, 45.0, 37.0, 33.0, 21.0, 30.0, 22.0, 29.0, 24.0, 22.0, 16.0, 18.0, 16.0, 13.0, 8.0, 9.0, 9.0, 6.0, 5.0, 2.0, 4.0, 2.0, 4.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.90234375, -6.6767578125, -6.451171875, -6.2255859375, -6.0, -5.7744140625, -5.548828125, -5.3232421875, -5.09765625, -4.8720703125, -4.646484375, -4.4208984375, -4.1953125, -3.9697265625, -3.744140625, -3.5185546875, -3.29296875, -3.0673828125, -2.841796875, -2.6162109375, -2.390625, -2.1650390625, -1.939453125, -1.7138671875, -1.48828125, -1.2626953125, -1.037109375, -0.8115234375, -0.5859375, -0.3603515625, -0.134765625, 0.0908203125, 0.31640625, 0.5419921875, 0.767578125, 0.9931640625, 1.21875, 1.4443359375, 1.669921875, 1.8955078125, 2.12109375, 2.3466796875, 2.572265625, 2.7978515625, 3.0234375, 3.2490234375, 3.474609375, 3.7001953125, 3.92578125, 4.1513671875, 4.376953125, 4.6025390625, 4.828125, 5.0537109375, 5.279296875, 5.5048828125, 5.73046875, 5.9560546875, 6.181640625, 6.4072265625, 6.6328125, 6.8583984375, 7.083984375, 7.3095703125, 7.53515625]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 3.0, 10.0, 11.0, 24.0, 33.0, 45.0, 87.0, 101.0, 156.0, 268.0, 355.0, 574.0, 817.0, 1291.0, 1916.0, 2922.0, 4402.0, 6866.0, 10634.0, 16296.0, 25588.0, 40030.0, 62363.0, 96321.0, 143760.0, 183243.0, 154263.0, 105444.0, 68241.0, 43623.0, 27865.0, 17750.0, 11694.0, 7501.0, 4816.0, 3211.0, 2035.0, 1279.0, 953.0, 573.0, 393.0, 256.0, 180.0, 133.0, 83.0, 53.0, 35.0, 20.0, 16.0, 7.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0], "bins": [-1.017578125, -0.9863662719726562, -0.9551544189453125, -0.9239425659179688, -0.892730712890625, -0.8615188598632812, -0.8303070068359375, -0.7990951538085938, -0.76788330078125, -0.7366714477539062, -0.7054595947265625, -0.6742477416992188, -0.643035888671875, -0.6118240356445312, -0.5806121826171875, -0.5494003295898438, -0.5181884765625, -0.48697662353515625, -0.4557647705078125, -0.42455291748046875, -0.393341064453125, -0.36212921142578125, -0.3309173583984375, -0.29970550537109375, -0.26849365234375, -0.23728179931640625, -0.2060699462890625, -0.17485809326171875, -0.143646240234375, -0.11243438720703125, -0.0812225341796875, -0.05001068115234375, -0.018798828125, 0.01241302490234375, 0.0436248779296875, 0.07483673095703125, 0.106048583984375, 0.13726043701171875, 0.1684722900390625, 0.19968414306640625, 0.23089599609375, 0.26210784912109375, 0.2933197021484375, 0.32453155517578125, 0.355743408203125, 0.38695526123046875, 0.4181671142578125, 0.44937896728515625, 0.4805908203125, 0.5118026733398438, 0.5430145263671875, 0.5742263793945312, 0.605438232421875, 0.6366500854492188, 0.6678619384765625, 0.6990737915039062, 0.73028564453125, 0.7614974975585938, 0.7927093505859375, 0.8239212036132812, 0.855133056640625, 0.8863449096679688, 0.9175567626953125, 0.9487686157226562, 0.97998046875]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 5.0, 9.0, 3.0, 3.0, 6.0, 6.0, 6.0, 8.0, 12.0, 14.0, 11.0, 9.0, 15.0, 23.0, 30.0, 31.0, 21.0, 29.0, 25.0, 18.0, 30.0, 31.0, 34.0, 41.0, 35.0, 41.0, 38.0, 43.0, 31.0, 32.0, 37.0, 31.0, 30.0, 26.0, 26.0, 31.0, 23.0, 16.0, 18.0, 14.0, 24.0, 21.0, 9.0, 7.0, 14.0, 10.0, 8.0, 5.0, 5.0, 4.0, 3.0, 1.0, 3.0, 4.0, 3.0, 4.0], "bins": [-4.30078125, -4.17498779296875, -4.0491943359375, -3.92340087890625, -3.797607421875, -3.67181396484375, -3.5460205078125, -3.42022705078125, -3.29443359375, -3.16864013671875, -3.0428466796875, -2.91705322265625, -2.791259765625, -2.66546630859375, -2.5396728515625, -2.41387939453125, -2.2880859375, -2.16229248046875, -2.0364990234375, -1.91070556640625, -1.784912109375, -1.65911865234375, -1.5333251953125, -1.40753173828125, -1.28173828125, -1.15594482421875, -1.0301513671875, -0.90435791015625, -0.778564453125, -0.65277099609375, -0.5269775390625, -0.40118408203125, -0.275390625, -0.14959716796875, -0.0238037109375, 0.10198974609375, 0.227783203125, 0.35357666015625, 0.4793701171875, 0.60516357421875, 0.73095703125, 0.85675048828125, 0.9825439453125, 1.10833740234375, 1.234130859375, 1.35992431640625, 1.4857177734375, 1.61151123046875, 1.7373046875, 1.86309814453125, 1.9888916015625, 2.11468505859375, 2.240478515625, 2.36627197265625, 2.4920654296875, 2.61785888671875, 2.74365234375, 2.86944580078125, 2.9952392578125, 3.12103271484375, 3.246826171875, 3.37261962890625, 3.4984130859375, 3.62420654296875, 3.75]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 1.0, 5.0, 8.0, 14.0, 28.0, 33.0, 32.0, 58.0, 72.0, 106.0, 176.0, 268.0, 437.0, 673.0, 1096.0, 1805.0, 3325.0, 6429.0, 13198.0, 29799.0, 73220.0, 196537.0, 392085.0, 198246.0, 73027.0, 29738.0, 13448.0, 6524.0, 3395.0, 1872.0, 1041.0, 642.0, 388.0, 285.0, 168.0, 122.0, 75.0, 63.0, 42.0, 25.0, 12.0, 11.0, 8.0, 8.0, 9.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.09588623046875, -0.09302425384521484, -0.09016227722167969, -0.08730030059814453, -0.08443832397460938, -0.08157634735107422, -0.07871437072753906, -0.0758523941040039, -0.07299041748046875, -0.0701284408569336, -0.06726646423339844, -0.06440448760986328, -0.061542510986328125, -0.05868053436279297, -0.05581855773925781, -0.052956581115722656, -0.0500946044921875, -0.047232627868652344, -0.04437065124511719, -0.04150867462158203, -0.038646697998046875, -0.03578472137451172, -0.03292274475097656, -0.030060768127441406, -0.02719879150390625, -0.024336814880371094, -0.021474838256835938, -0.01861286163330078, -0.015750885009765625, -0.012888908386230469, -0.010026931762695312, -0.007164955139160156, -0.004302978515625, -0.0014410018920898438, 0.0014209747314453125, 0.004282951354980469, 0.007144927978515625, 0.010006904602050781, 0.012868881225585938, 0.015730857849121094, 0.01859283447265625, 0.021454811096191406, 0.024316787719726562, 0.02717876434326172, 0.030040740966796875, 0.03290271759033203, 0.03576469421386719, 0.038626670837402344, 0.0414886474609375, 0.044350624084472656, 0.04721260070800781, 0.05007457733154297, 0.052936553955078125, 0.05579853057861328, 0.05866050720214844, 0.061522483825683594, 0.06438446044921875, 0.0672464370727539, 0.07010841369628906, 0.07297039031982422, 0.07583236694335938, 0.07869434356689453, 0.08155632019042969, 0.08441829681396484, 0.0872802734375]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 7.0, 16.0, 9.0, 9.0, 14.0, 17.0, 27.0, 41.0, 42.0, 64.0, 55.0, 55.0, 67.0, 67.0, 69.0, 71.0, 62.0, 54.0, 51.0, 42.0, 35.0, 42.0, 22.0, 18.0, 15.0, 12.0, 4.0, 5.0, 7.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.621246337890625e-05, -1.5780329704284668e-05, -1.5348196029663086e-05, -1.4916062355041504e-05, -1.4483928680419922e-05, -1.405179500579834e-05, -1.3619661331176758e-05, -1.3187527656555176e-05, -1.2755393981933594e-05, -1.2323260307312012e-05, -1.189112663269043e-05, -1.1458992958068848e-05, -1.1026859283447266e-05, -1.0594725608825684e-05, -1.0162591934204102e-05, -9.73045825958252e-06, -9.298324584960938e-06, -8.866190910339355e-06, -8.434057235717773e-06, -8.001923561096191e-06, -7.569789886474609e-06, -7.137656211853027e-06, -6.705522537231445e-06, -6.273388862609863e-06, -5.841255187988281e-06, -5.409121513366699e-06, -4.976987838745117e-06, -4.544854164123535e-06, -4.112720489501953e-06, -3.680586814880371e-06, -3.248453140258789e-06, -2.816319465637207e-06, -2.384185791015625e-06, -1.952052116394043e-06, -1.519918441772461e-06, -1.087784767150879e-06, -6.556510925292969e-07, -2.2351741790771484e-07, 2.086162567138672e-07, 6.407499313354492e-07, 1.0728836059570312e-06, 1.5050172805786133e-06, 1.9371509552001953e-06, 2.3692846298217773e-06, 2.8014183044433594e-06, 3.2335519790649414e-06, 3.6656856536865234e-06, 4.0978193283081055e-06, 4.5299530029296875e-06, 4.9620866775512695e-06, 5.3942203521728516e-06, 5.826354026794434e-06, 6.258487701416016e-06, 6.690621376037598e-06, 7.12275505065918e-06, 7.554888725280762e-06, 7.987022399902344e-06, 8.419156074523926e-06, 8.851289749145508e-06, 9.28342342376709e-06, 9.715557098388672e-06, 1.0147690773010254e-05, 1.0579824447631836e-05, 1.1011958122253418e-05, 1.1444091796875e-05]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 7.0, 6.0, 13.0, 14.0, 20.0, 39.0, 39.0, 49.0, 80.0, 103.0, 190.0, 279.0, 413.0, 688.0, 1149.0, 2209.0, 4347.0, 10135.0, 25663.0, 71330.0, 218310.0, 422638.0, 188360.0, 61955.0, 22388.0, 9040.0, 4027.0, 2000.0, 1131.0, 720.0, 382.0, 249.0, 184.0, 126.0, 75.0, 59.0, 44.0, 29.0, 19.0, 18.0, 9.0, 6.0, 4.0, 2.0, 7.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.132568359375, -0.12835121154785156, -0.12413406372070312, -0.11991691589355469, -0.11569976806640625, -0.11148262023925781, -0.10726547241210938, -0.10304832458496094, -0.0988311767578125, -0.09461402893066406, -0.09039688110351562, -0.08617973327636719, -0.08196258544921875, -0.07774543762207031, -0.07352828979492188, -0.06931114196777344, -0.065093994140625, -0.06087684631347656, -0.056659698486328125, -0.05244255065917969, -0.04822540283203125, -0.04400825500488281, -0.039791107177734375, -0.03557395935058594, -0.0313568115234375, -0.027139663696289062, -0.022922515869140625, -0.018705368041992188, -0.01448822021484375, -0.010271072387695312, -0.006053924560546875, -0.0018367767333984375, 0.00238037109375, 0.0065975189208984375, 0.010814666748046875, 0.015031814575195312, 0.01924896240234375, 0.023466110229492188, 0.027683258056640625, 0.03190040588378906, 0.0361175537109375, 0.04033470153808594, 0.044551849365234375, 0.04876899719238281, 0.05298614501953125, 0.05720329284667969, 0.061420440673828125, 0.06563758850097656, 0.069854736328125, 0.07407188415527344, 0.07828903198242188, 0.08250617980957031, 0.08672332763671875, 0.09094047546386719, 0.09515762329101562, 0.09937477111816406, 0.1035919189453125, 0.10780906677246094, 0.11202621459960938, 0.11624336242675781, 0.12046051025390625, 0.12467765808105469, 0.12889480590820312, 0.13311195373535156, 0.1373291015625]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 6.0, 4.0, 2.0, 8.0, 18.0, 21.0, 24.0, 22.0, 34.0, 39.0, 53.0, 45.0, 79.0, 69.0, 94.0, 100.0, 84.0, 49.0, 37.0, 43.0, 28.0, 28.0, 16.0, 23.0, 13.0, 14.0, 12.0, 8.0, 7.0, 4.0, 5.0, 5.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0504150390625, -0.04892444610595703, -0.04743385314941406, -0.045943260192871094, -0.044452667236328125, -0.042962074279785156, -0.04147148132324219, -0.03998088836669922, -0.03849029541015625, -0.03699970245361328, -0.03550910949707031, -0.034018516540527344, -0.032527923583984375, -0.031037330627441406, -0.029546737670898438, -0.02805614471435547, -0.0265655517578125, -0.02507495880126953, -0.023584365844726562, -0.022093772888183594, -0.020603179931640625, -0.019112586975097656, -0.017621994018554688, -0.01613140106201172, -0.01464080810546875, -0.013150215148925781, -0.011659622192382812, -0.010169029235839844, -0.008678436279296875, -0.007187843322753906, -0.0056972503662109375, -0.004206657409667969, -0.002716064453125, -0.0012254714965820312, 0.0002651214599609375, 0.0017557144165039062, 0.003246307373046875, 0.004736900329589844, 0.0062274932861328125, 0.007718086242675781, 0.00920867919921875, 0.010699272155761719, 0.012189865112304688, 0.013680458068847656, 0.015171051025390625, 0.016661643981933594, 0.018152236938476562, 0.01964282989501953, 0.0211334228515625, 0.02262401580810547, 0.024114608764648438, 0.025605201721191406, 0.027095794677734375, 0.028586387634277344, 0.030076980590820312, 0.03156757354736328, 0.03305816650390625, 0.03454875946044922, 0.03603935241699219, 0.037529945373535156, 0.039020538330078125, 0.040511131286621094, 0.04200172424316406, 0.04349231719970703, 0.04498291015625]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 9.0, 9.0, 6.0, 7.0, 16.0, 14.0, 17.0, 29.0, 29.0, 35.0, 39.0, 49.0, 55.0, 68.0, 71.0, 80.0, 67.0, 69.0, 63.0, 49.0, 43.0, 31.0, 30.0, 19.0, 18.0, 15.0, 10.0, 14.0, 5.0, 7.0, 8.0, 1.0, 4.0, 4.0, 3.0, 1.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.527007102966309, -8.28763484954834, -8.048262596130371, -7.8088908195495605, -7.569518566131592, -7.330146312713623, -7.0907745361328125, -6.851402282714844, -6.612030029296875, -6.372657775878906, -6.1332855224609375, -5.893913745880127, -5.654541492462158, -5.4151692390441895, -5.175797462463379, -4.93642520904541, -4.697052955627441, -4.457680702209473, -4.218308448791504, -3.9789366722106934, -3.7395644187927246, -3.500192165374756, -3.260820150375366, -3.0214481353759766, -2.782075881958008, -2.542703628540039, -2.3033316135406494, -2.0639595985412598, -1.824587345123291, -1.5852152109146118, -1.3458430767059326, -1.1064709424972534, -0.8670992851257324, -0.6277271509170532, -0.388355016708374, -0.14898288249969482, 0.09038925170898438, 0.3297613859176636, 0.5691335201263428, 0.808505654335022, 1.0478777885437012, 1.2872499227523804, 1.5266220569610596, 1.7659941911697388, 2.005366325378418, 2.2447385787963867, 2.4841105937957764, 2.723482608795166, 2.9628548622131348, 3.2022271156311035, 3.441599130630493, 3.680971145629883, 3.9203433990478516, 4.15971565246582, 4.399087905883789, 4.6384596824646, 4.877831935882568, 5.117204189300537, 5.356575965881348, 5.595948219299316, 5.835320472717285, 6.074692726135254, 6.314064979553223, 6.553436756134033, 6.792809009552002]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 1.0, 1.0, 6.0, 9.0, 10.0, 10.0, 9.0, 9.0, 12.0, 20.0, 13.0, 14.0, 26.0, 36.0, 39.0, 33.0, 34.0, 43.0, 37.0, 40.0, 39.0, 48.0, 32.0, 36.0, 41.0, 48.0, 39.0, 41.0, 28.0, 29.0, 26.0, 25.0, 20.0, 30.0, 28.0, 14.0, 17.0, 13.0, 10.0, 9.0, 7.0, 9.0, 6.0, 1.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.308221817016602, -7.069567680358887, -6.830913543701172, -6.592259407043457, -6.353605270385742, -6.114951133728027, -5.8762969970703125, -5.637642860412598, -5.398988723754883, -5.160334587097168, -4.921680450439453, -4.683026313781738, -4.444372177124023, -4.205718040466309, -3.967064142227173, -3.728410005569458, -3.4897561073303223, -3.2511019706726074, -3.0124478340148926, -2.7737936973571777, -2.535139560699463, -2.296485424041748, -2.0578315258026123, -1.8191773891448975, -1.5805232524871826, -1.3418691158294678, -1.103214979171753, -0.8645609617233276, -0.6259068250656128, -0.38725268840789795, -0.14859867095947266, 0.09005546569824219, 0.32870912551879883, 0.5673632621765137, 0.8060173392295837, 1.0446714162826538, 1.2833255529403687, 1.5219796895980835, 1.7606337070465088, 1.9992878437042236, 2.2379419803619385, 2.4765961170196533, 2.715250253677368, 2.953904151916504, 3.1925582885742188, 3.4312124252319336, 3.6698665618896484, 3.9085206985473633, 4.147174835205078, 4.385828971862793, 4.624483108520508, 4.863137245178223, 5.1017913818359375, 5.340445518493652, 5.579099655151367, 5.817753791809082, 6.056407928466797, 6.295062065124512, 6.533716201782227, 6.772370338439941, 7.011024475097656, 7.249678611755371, 7.488332748413086, 7.726986885070801, 7.965640544891357]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 5.0, 8.0, 17.0, 20.0, 38.0, 43.0, 74.0, 106.0, 184.0, 235.0, 397.0, 553.0, 831.0, 1300.0, 2024.0, 3154.0, 4815.0, 7507.0, 12006.0, 18728.0, 29544.0, 45955.0, 69358.0, 99598.0, 129495.0, 145380.0, 137793.0, 111109.0, 79332.0, 53383.0, 34518.0, 22277.0, 13916.0, 8803.0, 5623.0, 3544.0, 2385.0, 1539.0, 1003.0, 651.0, 439.0, 287.0, 208.0, 118.0, 88.0, 46.0, 40.0, 30.0, 17.0, 9.0, 11.0, 8.0, 7.0, 2.0, 1.0, 0.0, 1.0], "bins": [-5.1796875, -5.02117919921875, -4.8626708984375, -4.70416259765625, -4.545654296875, -4.38714599609375, -4.2286376953125, -4.07012939453125, -3.91162109375, -3.75311279296875, -3.5946044921875, -3.43609619140625, -3.277587890625, -3.11907958984375, -2.9605712890625, -2.80206298828125, -2.6435546875, -2.48504638671875, -2.3265380859375, -2.16802978515625, -2.009521484375, -1.85101318359375, -1.6925048828125, -1.53399658203125, -1.37548828125, -1.21697998046875, -1.0584716796875, -0.89996337890625, -0.741455078125, -0.58294677734375, -0.4244384765625, -0.26593017578125, -0.107421875, 0.05108642578125, 0.2095947265625, 0.36810302734375, 0.526611328125, 0.68511962890625, 0.8436279296875, 1.00213623046875, 1.16064453125, 1.31915283203125, 1.4776611328125, 1.63616943359375, 1.794677734375, 1.95318603515625, 2.1116943359375, 2.27020263671875, 2.4287109375, 2.58721923828125, 2.7457275390625, 2.90423583984375, 3.062744140625, 3.22125244140625, 3.3797607421875, 3.53826904296875, 3.69677734375, 3.85528564453125, 4.0137939453125, 4.17230224609375, 4.330810546875, 4.48931884765625, 4.6478271484375, 4.80633544921875, 4.96484375]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 5.0, 3.0, 3.0, 6.0, 3.0, 10.0, 14.0, 10.0, 8.0, 14.0, 15.0, 23.0, 25.0, 21.0, 21.0, 39.0, 30.0, 22.0, 32.0, 27.0, 50.0, 37.0, 49.0, 27.0, 38.0, 45.0, 34.0, 30.0, 41.0, 36.0, 33.0, 22.0, 26.0, 16.0, 29.0, 19.0, 25.0, 22.0, 15.0, 17.0, 10.0, 14.0, 10.0, 6.0, 5.0, 3.0, 5.0, 7.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-6.5546875, -6.33892822265625, -6.1231689453125, -5.90740966796875, -5.691650390625, -5.47589111328125, -5.2601318359375, -5.04437255859375, -4.82861328125, -4.61285400390625, -4.3970947265625, -4.18133544921875, -3.965576171875, -3.74981689453125, -3.5340576171875, -3.31829833984375, -3.1025390625, -2.88677978515625, -2.6710205078125, -2.45526123046875, -2.239501953125, -2.02374267578125, -1.8079833984375, -1.59222412109375, -1.37646484375, -1.16070556640625, -0.9449462890625, -0.72918701171875, -0.513427734375, -0.29766845703125, -0.0819091796875, 0.13385009765625, 0.349609375, 0.56536865234375, 0.7811279296875, 0.99688720703125, 1.212646484375, 1.42840576171875, 1.6441650390625, 1.85992431640625, 2.07568359375, 2.29144287109375, 2.5072021484375, 2.72296142578125, 2.938720703125, 3.15447998046875, 3.3702392578125, 3.58599853515625, 3.8017578125, 4.01751708984375, 4.2332763671875, 4.44903564453125, 4.664794921875, 4.88055419921875, 5.0963134765625, 5.31207275390625, 5.52783203125, 5.74359130859375, 5.9593505859375, 6.17510986328125, 6.390869140625, 6.60662841796875, 6.8223876953125, 7.03814697265625, 7.25390625]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 3.0, 10.0, 11.0, 14.0, 32.0, 37.0, 71.0, 108.0, 174.0, 259.0, 459.0, 858.0, 1406.0, 2354.0, 4248.0, 7607.0, 13319.0, 23741.0, 42349.0, 74242.0, 121432.0, 171247.0, 187519.0, 153497.0, 103208.0, 61255.0, 34757.0, 19230.0, 10680.0, 6077.0, 3433.0, 2001.0, 1195.0, 716.0, 398.0, 248.0, 150.0, 85.0, 42.0, 31.0, 15.0, 14.0, 6.0, 7.0, 4.0, 5.0, 5.0, 3.0, 0.0, 0.0, 2.0], "bins": [-7.1484375, -6.946044921875, -6.74365234375, -6.541259765625, -6.3388671875, -6.136474609375, -5.93408203125, -5.731689453125, -5.529296875, -5.326904296875, -5.12451171875, -4.922119140625, -4.7197265625, -4.517333984375, -4.31494140625, -4.112548828125, -3.91015625, -3.707763671875, -3.50537109375, -3.302978515625, -3.1005859375, -2.898193359375, -2.69580078125, -2.493408203125, -2.291015625, -2.088623046875, -1.88623046875, -1.683837890625, -1.4814453125, -1.279052734375, -1.07666015625, -0.874267578125, -0.671875, -0.469482421875, -0.26708984375, -0.064697265625, 0.1376953125, 0.340087890625, 0.54248046875, 0.744873046875, 0.947265625, 1.149658203125, 1.35205078125, 1.554443359375, 1.7568359375, 1.959228515625, 2.16162109375, 2.364013671875, 2.56640625, 2.768798828125, 2.97119140625, 3.173583984375, 3.3759765625, 3.578369140625, 3.78076171875, 3.983154296875, 4.185546875, 4.387939453125, 4.59033203125, 4.792724609375, 4.9951171875, 5.197509765625, 5.39990234375, 5.602294921875, 5.8046875]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 6.0, 2.0, 6.0, 6.0, 6.0, 10.0, 12.0, 16.0, 15.0, 30.0, 21.0, 24.0, 13.0, 36.0, 25.0, 28.0, 38.0, 31.0, 33.0, 44.0, 41.0, 58.0, 40.0, 28.0, 33.0, 44.0, 42.0, 35.0, 35.0, 46.0, 24.0, 21.0, 33.0, 21.0, 9.0, 13.0, 16.0, 15.0, 8.0, 12.0, 7.0, 7.0, 6.0, 2.0, 4.0, 0.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.01953125, -3.88262939453125, -3.7457275390625, -3.60882568359375, -3.471923828125, -3.33502197265625, -3.1981201171875, -3.06121826171875, -2.92431640625, -2.78741455078125, -2.6505126953125, -2.51361083984375, -2.376708984375, -2.23980712890625, -2.1029052734375, -1.96600341796875, -1.8291015625, -1.69219970703125, -1.5552978515625, -1.41839599609375, -1.281494140625, -1.14459228515625, -1.0076904296875, -0.87078857421875, -0.73388671875, -0.59698486328125, -0.4600830078125, -0.32318115234375, -0.186279296875, -0.04937744140625, 0.0875244140625, 0.22442626953125, 0.361328125, 0.49822998046875, 0.6351318359375, 0.77203369140625, 0.908935546875, 1.04583740234375, 1.1827392578125, 1.31964111328125, 1.45654296875, 1.59344482421875, 1.7303466796875, 1.86724853515625, 2.004150390625, 2.14105224609375, 2.2779541015625, 2.41485595703125, 2.5517578125, 2.68865966796875, 2.8255615234375, 2.96246337890625, 3.099365234375, 3.23626708984375, 3.3731689453125, 3.51007080078125, 3.64697265625, 3.78387451171875, 3.9207763671875, 4.05767822265625, 4.194580078125, 4.33148193359375, 4.4683837890625, 4.60528564453125, 4.7421875]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 6.0, 5.0, 13.0, 15.0, 26.0, 42.0, 52.0, 81.0, 129.0, 182.0, 260.0, 371.0, 628.0, 944.0, 1403.0, 2233.0, 3566.0, 5813.0, 9485.0, 15742.0, 26745.0, 44409.0, 73185.0, 116037.0, 163945.0, 180987.0, 147867.0, 99705.0, 61347.0, 36938.0, 21753.0, 13336.0, 8010.0, 4866.0, 3082.0, 1848.0, 1186.0, 788.0, 511.0, 328.0, 209.0, 152.0, 102.0, 73.0, 49.0, 34.0, 33.0, 14.0, 9.0, 9.0, 4.0, 3.0, 3.0, 1.0, 2.0], "bins": [-2.123046875, -2.061187744140625, -1.99932861328125, -1.937469482421875, -1.8756103515625, -1.813751220703125, -1.75189208984375, -1.690032958984375, -1.628173828125, -1.566314697265625, -1.50445556640625, -1.442596435546875, -1.3807373046875, -1.318878173828125, -1.25701904296875, -1.195159912109375, -1.13330078125, -1.071441650390625, -1.00958251953125, -0.947723388671875, -0.8858642578125, -0.824005126953125, -0.76214599609375, -0.700286865234375, -0.638427734375, -0.576568603515625, -0.51470947265625, -0.452850341796875, -0.3909912109375, -0.329132080078125, -0.26727294921875, -0.205413818359375, -0.1435546875, -0.081695556640625, -0.01983642578125, 0.042022705078125, 0.1038818359375, 0.165740966796875, 0.22760009765625, 0.289459228515625, 0.351318359375, 0.413177490234375, 0.47503662109375, 0.536895751953125, 0.5987548828125, 0.660614013671875, 0.72247314453125, 0.784332275390625, 0.84619140625, 0.908050537109375, 0.96990966796875, 1.031768798828125, 1.0936279296875, 1.155487060546875, 1.21734619140625, 1.279205322265625, 1.341064453125, 1.402923583984375, 1.46478271484375, 1.526641845703125, 1.5885009765625, 1.650360107421875, 1.71221923828125, 1.774078369140625, 1.8359375]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 4.0, 5.0, 3.0, 3.0, 8.0, 22.0, 29.0, 28.0, 39.0, 67.0, 67.0, 75.0, 88.0, 91.0, 104.0, 83.0, 63.0, 58.0, 50.0, 46.0, 18.0, 23.0, 10.0, 5.0, 8.0, 6.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002532005310058594, -0.00024623051285743713, -0.0002392604947090149, -0.00023229047656059265, -0.0002253204584121704, -0.00021835044026374817, -0.00021138042211532593, -0.0002044104039669037, -0.00019744038581848145, -0.0001904703676700592, -0.00018350034952163696, -0.00017653033137321472, -0.00016956031322479248, -0.00016259029507637024, -0.000155620276927948, -0.00014865025877952576, -0.00014168024063110352, -0.00013471022248268127, -0.00012774020433425903, -0.00012077018618583679, -0.00011380016803741455, -0.00010683014988899231, -9.986013174057007e-05, -9.289011359214783e-05, -8.592009544372559e-05, -7.895007729530334e-05, -7.19800591468811e-05, -6.501004099845886e-05, -5.804002285003662e-05, -5.107000470161438e-05, -4.409998655319214e-05, -3.71299684047699e-05, -3.0159950256347656e-05, -2.3189932107925415e-05, -1.6219913959503174e-05, -9.249895811080933e-06, -2.2798776626586914e-06, 4.69014048576355e-06, 1.1660158634185791e-05, 1.8630176782608032e-05, 2.5600194931030273e-05, 3.2570213079452515e-05, 3.9540231227874756e-05, 4.6510249376297e-05, 5.348026752471924e-05, 6.045028567314148e-05, 6.742030382156372e-05, 7.439032196998596e-05, 8.13603401184082e-05, 8.833035826683044e-05, 9.530037641525269e-05, 0.00010227039456367493, 0.00010924041271209717, 0.00011621043086051941, 0.00012318044900894165, 0.0001301504671573639, 0.00013712048530578613, 0.00014409050345420837, 0.00015106052160263062, 0.00015803053975105286, 0.0001650005578994751, 0.00017197057604789734, 0.00017894059419631958, 0.00018591061234474182, 0.00019288063049316406]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 10.0, 12.0, 11.0, 30.0, 48.0, 38.0, 78.0, 107.0, 169.0, 254.0, 404.0, 687.0, 1054.0, 1815.0, 3056.0, 5218.0, 8912.0, 15891.0, 28495.0, 50871.0, 90344.0, 150054.0, 202933.0, 189019.0, 127628.0, 74881.0, 42105.0, 23277.0, 13004.0, 7375.0, 4326.0, 2551.0, 1448.0, 899.0, 543.0, 329.0, 245.0, 137.0, 98.0, 68.0, 50.0, 41.0, 15.0, 9.0, 9.0, 4.0, 5.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.05078125, -1.979644775390625, -1.90850830078125, -1.837371826171875, -1.7662353515625, -1.695098876953125, -1.62396240234375, -1.552825927734375, -1.481689453125, -1.410552978515625, -1.33941650390625, -1.268280029296875, -1.1971435546875, -1.126007080078125, -1.05487060546875, -0.983734130859375, -0.91259765625, -0.841461181640625, -0.77032470703125, -0.699188232421875, -0.6280517578125, -0.556915283203125, -0.48577880859375, -0.414642333984375, -0.343505859375, -0.272369384765625, -0.20123291015625, -0.130096435546875, -0.0589599609375, 0.012176513671875, 0.08331298828125, 0.154449462890625, 0.2255859375, 0.296722412109375, 0.36785888671875, 0.438995361328125, 0.5101318359375, 0.581268310546875, 0.65240478515625, 0.723541259765625, 0.794677734375, 0.865814208984375, 0.93695068359375, 1.008087158203125, 1.0792236328125, 1.150360107421875, 1.22149658203125, 1.292633056640625, 1.36376953125, 1.434906005859375, 1.50604248046875, 1.577178955078125, 1.6483154296875, 1.719451904296875, 1.79058837890625, 1.861724853515625, 1.932861328125, 2.003997802734375, 2.07513427734375, 2.146270751953125, 2.2174072265625, 2.288543701171875, 2.35968017578125, 2.430816650390625, 2.501953125]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 7.0, 4.0, 4.0, 7.0, 6.0, 7.0, 15.0, 11.0, 17.0, 18.0, 26.0, 29.0, 62.0, 49.0, 62.0, 64.0, 66.0, 76.0, 71.0, 70.0, 50.0, 53.0, 40.0, 34.0, 36.0, 21.0, 16.0, 16.0, 21.0, 10.0, 8.0, 7.0, 3.0, 9.0, 6.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7958984375, -0.765167236328125, -0.73443603515625, -0.703704833984375, -0.6729736328125, -0.642242431640625, -0.61151123046875, -0.580780029296875, -0.550048828125, -0.519317626953125, -0.48858642578125, -0.457855224609375, -0.4271240234375, -0.396392822265625, -0.36566162109375, -0.334930419921875, -0.30419921875, -0.273468017578125, -0.24273681640625, -0.212005615234375, -0.1812744140625, -0.150543212890625, -0.11981201171875, -0.089080810546875, -0.058349609375, -0.027618408203125, 0.00311279296875, 0.033843994140625, 0.0645751953125, 0.095306396484375, 0.12603759765625, 0.156768798828125, 0.1875, 0.218231201171875, 0.24896240234375, 0.279693603515625, 0.3104248046875, 0.341156005859375, 0.37188720703125, 0.402618408203125, 0.433349609375, 0.464080810546875, 0.49481201171875, 0.525543212890625, 0.5562744140625, 0.587005615234375, 0.61773681640625, 0.648468017578125, 0.67919921875, 0.709930419921875, 0.74066162109375, 0.771392822265625, 0.8021240234375, 0.832855224609375, 0.86358642578125, 0.894317626953125, 0.925048828125, 0.955780029296875, 0.98651123046875, 1.017242431640625, 1.0479736328125, 1.078704833984375, 1.10943603515625, 1.140167236328125, 1.1708984375]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 7.0, 6.0, 9.0, 11.0, 11.0, 17.0, 24.0, 24.0, 41.0, 32.0, 60.0, 49.0, 58.0, 77.0, 73.0, 84.0, 73.0, 71.0, 52.0, 37.0, 35.0, 30.0, 24.0, 14.0, 10.0, 14.0, 12.0, 6.0, 7.0, 8.0, 5.0, 1.0, 2.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.540040969848633, -8.28781509399414, -8.035590171813965, -7.783364295959473, -7.531138896942139, -7.278913497924805, -7.026688098907471, -6.774462699890137, -6.5222368240356445, -6.2700114250183105, -6.017786026000977, -5.765560150146484, -5.51333475112915, -5.261109352111816, -5.008883953094482, -4.756658554077148, -4.5044331550598145, -4.2522077560424805, -3.9999821186065674, -3.7477567195892334, -3.4955310821533203, -3.2433056831359863, -2.9910802841186523, -2.7388548851013184, -2.4866292476654053, -2.2344038486480713, -1.9821782112121582, -1.7299528121948242, -1.4777272939682007, -1.2255017757415771, -0.9732763767242432, -0.7210508584976196, -0.4688253402709961, -0.21659985184669495, 0.0356256365776062, 0.28785109519958496, 0.5400766134262085, 0.792302131652832, 1.044527530670166, 1.2967530488967896, 1.548978567123413, 1.8012040853500366, 2.05342960357666, 2.305655002593994, 2.557880401611328, 2.810106039047241, 3.062331438064575, 3.3145570755004883, 3.5667824745178223, 3.8190078735351562, 4.07123327255249, 4.323458671569824, 4.575684547424316, 4.82790994644165, 5.080135345458984, 5.332360744476318, 5.584586143493652, 5.836811542510986, 6.08903694152832, 6.3412628173828125, 6.5934882164001465, 6.8457136154174805, 7.0979390144348145, 7.350164413452148, 7.602390289306641]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 4.0, 4.0, 3.0, 3.0, 7.0, 9.0, 8.0, 12.0, 12.0, 14.0, 19.0, 25.0, 32.0, 22.0, 29.0, 35.0, 41.0, 25.0, 51.0, 32.0, 45.0, 33.0, 44.0, 42.0, 38.0, 36.0, 45.0, 36.0, 37.0, 27.0, 31.0, 35.0, 30.0, 23.0, 28.0, 14.0, 17.0, 10.0, 13.0, 12.0, 3.0, 6.0, 3.0, 10.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.754640579223633, -7.506252288818359, -7.257863521575928, -7.009475231170654, -6.761086940765381, -6.512698173522949, -6.264309883117676, -6.015921592712402, -5.767533302307129, -5.5191450119018555, -5.270756244659424, -5.02236795425415, -4.773979663848877, -4.525590896606445, -4.277202606201172, -4.028814315795898, -3.780425548553467, -3.5320370197296143, -3.283648729324341, -3.0352602005004883, -2.786871910095215, -2.5384833812713623, -2.2900948524475098, -2.0417065620422363, -1.7933180332183838, -1.5449296236038208, -1.2965412139892578, -1.0481526851654053, -0.7997642755508423, -0.5513758659362793, -0.30298733711242676, -0.05459892749786377, 0.19378948211669922, 0.4421779215335846, 0.69056636095047, 0.9389548301696777, 1.1873432397842407, 1.4357316493988037, 1.6841201782226562, 1.9325085878372192, 2.1808969974517822, 2.4292855262756348, 2.677673816680908, 2.9260623455047607, 3.1744508743286133, 3.4228391647338867, 3.6712276935577393, 3.919616222381592, 4.168004512786865, 4.416392803192139, 4.66478157043457, 4.913169860839844, 5.161558151245117, 5.409946441650391, 5.658335208892822, 5.906723499298096, 6.155112266540527, 6.403500556945801, 6.651889324188232, 6.900277614593506, 7.148665904998779, 7.397054672241211, 7.645442962646484, 7.893831253051758, 8.142219543457031]}, "gradients/decoder.bert.encoder.layer.13.output.dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 1.0, 5.0, 7.0, 9.0, 12.0, 11.0, 28.0, 44.0, 48.0, 91.0, 121.0, 145.0, 251.0, 335.0, 473.0, 735.0, 1146.0, 1660.0, 2564.0, 4147.0, 6558.0, 10448.0, 16771.0, 28712.0, 49589.0, 89156.0, 165708.0, 318377.0, 603666.0, 929283.0, 865699.0, 515096.0, 265891.0, 138163.0, 75026.0, 42169.0, 24106.0, 14329.0, 8826.0, 5485.0, 3249.0, 2096.0, 1383.0, 926.0, 571.0, 424.0, 241.0, 176.0, 104.0, 60.0, 53.0, 47.0, 30.0, 13.0, 11.0, 9.0, 4.0, 4.0, 0.0, 3.0, 2.0], "bins": [-7.04296875, -6.82861328125, -6.6142578125, -6.39990234375, -6.185546875, -5.97119140625, -5.7568359375, -5.54248046875, -5.328125, -5.11376953125, -4.8994140625, -4.68505859375, -4.470703125, -4.25634765625, -4.0419921875, -3.82763671875, -3.61328125, -3.39892578125, -3.1845703125, -2.97021484375, -2.755859375, -2.54150390625, -2.3271484375, -2.11279296875, -1.8984375, -1.68408203125, -1.4697265625, -1.25537109375, -1.041015625, -0.82666015625, -0.6123046875, -0.39794921875, -0.18359375, 0.03076171875, 0.2451171875, 0.45947265625, 0.673828125, 0.88818359375, 1.1025390625, 1.31689453125, 1.53125, 1.74560546875, 1.9599609375, 2.17431640625, 2.388671875, 2.60302734375, 2.8173828125, 3.03173828125, 3.24609375, 3.46044921875, 3.6748046875, 3.88916015625, 4.103515625, 4.31787109375, 4.5322265625, 4.74658203125, 4.9609375, 5.17529296875, 5.3896484375, 5.60400390625, 5.818359375, 6.03271484375, 6.2470703125, 6.46142578125, 6.67578125]}, "gradients/decoder.bert.encoder.layer.13.output.dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 4.0, 8.0, 8.0, 10.0, 17.0, 13.0, 19.0, 17.0, 12.0, 26.0, 27.0, 36.0, 36.0, 38.0, 33.0, 37.0, 43.0, 42.0, 49.0, 36.0, 39.0, 36.0, 38.0, 42.0, 33.0, 25.0, 43.0, 33.0, 31.0, 29.0, 20.0, 20.0, 18.0, 15.0, 16.0, 10.0, 9.0, 6.0, 3.0, 7.0, 3.0, 4.0, 2.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.890625, -4.72674560546875, -4.5628662109375, -4.39898681640625, -4.235107421875, -4.07122802734375, -3.9073486328125, -3.74346923828125, -3.57958984375, -3.41571044921875, -3.2518310546875, -3.08795166015625, -2.924072265625, -2.76019287109375, -2.5963134765625, -2.43243408203125, -2.2685546875, -2.10467529296875, -1.9407958984375, -1.77691650390625, -1.613037109375, -1.44915771484375, -1.2852783203125, -1.12139892578125, -0.95751953125, -0.79364013671875, -0.6297607421875, -0.46588134765625, -0.302001953125, -0.13812255859375, 0.0257568359375, 0.18963623046875, 0.353515625, 0.51739501953125, 0.6812744140625, 0.84515380859375, 1.009033203125, 1.17291259765625, 1.3367919921875, 1.50067138671875, 1.66455078125, 1.82843017578125, 1.9923095703125, 2.15618896484375, 2.320068359375, 2.48394775390625, 2.6478271484375, 2.81170654296875, 2.9755859375, 3.13946533203125, 3.3033447265625, 3.46722412109375, 3.631103515625, 3.79498291015625, 3.9588623046875, 4.12274169921875, 4.28662109375, 4.45050048828125, 4.6143798828125, 4.77825927734375, 4.942138671875, 5.10601806640625, 5.2698974609375, 5.43377685546875, 5.59765625]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 10.0, 4.0, 14.0, 9.0, 14.0, 15.0, 31.0, 45.0, 56.0, 84.0, 136.0, 199.0, 293.0, 454.0, 687.0, 951.0, 1524.0, 2411.0, 3898.0, 6198.0, 10154.0, 16980.0, 29179.0, 51386.0, 91927.0, 169075.0, 308725.0, 530787.0, 770932.0, 804917.0, 592913.0, 352887.0, 196659.0, 107117.0, 59262.0, 33869.0, 19718.0, 11460.0, 6982.0, 4500.0, 2791.0, 1728.0, 1127.0, 754.0, 457.0, 309.0, 219.0, 134.0, 95.0, 65.0, 44.0, 32.0, 25.0, 18.0, 14.0, 10.0, 2.0, 5.0, 2.0, 4.0], "bins": [-6.39453125, -6.20147705078125, -6.0084228515625, -5.81536865234375, -5.622314453125, -5.42926025390625, -5.2362060546875, -5.04315185546875, -4.85009765625, -4.65704345703125, -4.4639892578125, -4.27093505859375, -4.077880859375, -3.88482666015625, -3.6917724609375, -3.49871826171875, -3.3056640625, -3.11260986328125, -2.9195556640625, -2.72650146484375, -2.533447265625, -2.34039306640625, -2.1473388671875, -1.95428466796875, -1.76123046875, -1.56817626953125, -1.3751220703125, -1.18206787109375, -0.989013671875, -0.79595947265625, -0.6029052734375, -0.40985107421875, -0.216796875, -0.02374267578125, 0.1693115234375, 0.36236572265625, 0.555419921875, 0.74847412109375, 0.9415283203125, 1.13458251953125, 1.32763671875, 1.52069091796875, 1.7137451171875, 1.90679931640625, 2.099853515625, 2.29290771484375, 2.4859619140625, 2.67901611328125, 2.8720703125, 3.06512451171875, 3.2581787109375, 3.45123291015625, 3.644287109375, 3.83734130859375, 4.0303955078125, 4.22344970703125, 4.41650390625, 4.60955810546875, 4.8026123046875, 4.99566650390625, 5.188720703125, 5.38177490234375, 5.5748291015625, 5.76788330078125, 5.9609375]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 13.0, 10.0, 10.0, 19.0, 26.0, 32.0, 35.0, 54.0, 63.0, 92.0, 100.0, 144.0, 167.0, 192.0, 227.0, 251.0, 285.0, 293.0, 293.0, 278.0, 243.0, 240.0, 172.0, 163.0, 129.0, 99.0, 104.0, 60.0, 61.0, 45.0, 50.0, 25.0, 21.0, 26.0, 13.0, 9.0, 7.0, 5.0, 5.0, 6.0, 4.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.43359375, -2.34112548828125, -2.2486572265625, -2.15618896484375, -2.063720703125, -1.97125244140625, -1.8787841796875, -1.78631591796875, -1.69384765625, -1.60137939453125, -1.5089111328125, -1.41644287109375, -1.323974609375, -1.23150634765625, -1.1390380859375, -1.04656982421875, -0.9541015625, -0.86163330078125, -0.7691650390625, -0.67669677734375, -0.584228515625, -0.49176025390625, -0.3992919921875, -0.30682373046875, -0.21435546875, -0.12188720703125, -0.0294189453125, 0.06304931640625, 0.155517578125, 0.24798583984375, 0.3404541015625, 0.43292236328125, 0.525390625, 0.61785888671875, 0.7103271484375, 0.80279541015625, 0.895263671875, 0.98773193359375, 1.0802001953125, 1.17266845703125, 1.26513671875, 1.35760498046875, 1.4500732421875, 1.54254150390625, 1.635009765625, 1.72747802734375, 1.8199462890625, 1.91241455078125, 2.0048828125, 2.09735107421875, 2.1898193359375, 2.28228759765625, 2.374755859375, 2.46722412109375, 2.5596923828125, 2.65216064453125, 2.74462890625, 2.83709716796875, 2.9295654296875, 3.02203369140625, 3.114501953125, 3.20697021484375, 3.2994384765625, 3.39190673828125, 3.484375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 10.0, 6.0, 10.0, 16.0, 24.0, 26.0, 35.0, 42.0, 51.0, 63.0, 81.0, 81.0, 91.0, 86.0, 81.0, 67.0, 41.0, 34.0, 40.0, 20.0, 21.0, 11.0, 17.0, 11.0, 12.0, 8.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.712641716003418, -10.419923782348633, -10.127204895019531, -9.83448600769043, -9.541768074035645, -9.24905014038086, -8.956331253051758, -8.663612365722656, -8.370894432067871, -8.078176498413086, -7.785457611083984, -7.492739200592041, -7.200020790100098, -6.907302379608154, -6.614583969116211, -6.321865558624268, -6.029147148132324, -5.736428737640381, -5.4437103271484375, -5.150991916656494, -4.858273506164551, -4.565555095672607, -4.272836685180664, -3.9801182746887207, -3.6873998641967773, -3.394681453704834, -3.1019630432128906, -2.8092446327209473, -2.516526222229004, -2.2238078117370605, -1.9310894012451172, -1.6383709907531738, -1.3456535339355469, -1.0529351234436035, -0.7602167129516602, -0.4674983024597168, -0.17477989196777344, 0.11793851852416992, 0.4106569290161133, 0.7033753395080566, 0.99609375, 1.2888121604919434, 1.5815305709838867, 1.87424898147583, 2.1669673919677734, 2.459685802459717, 2.75240421295166, 3.0451226234436035, 3.337841033935547, 3.6305594444274902, 3.9232778549194336, 4.215996265411377, 4.50871467590332, 4.801433086395264, 5.094151496887207, 5.38686990737915, 5.679588317871094, 5.972306728363037, 6.2650251388549805, 6.557743549346924, 6.850461959838867, 7.1431803703308105, 7.435898780822754, 7.728617191314697, 8.02133560180664]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 3.0, 8.0, 3.0, 4.0, 6.0, 9.0, 17.0, 15.0, 12.0, 24.0, 26.0, 23.0, 17.0, 37.0, 34.0, 30.0, 32.0, 49.0, 47.0, 43.0, 53.0, 46.0, 35.0, 39.0, 37.0, 36.0, 41.0, 34.0, 26.0, 33.0, 30.0, 29.0, 21.0, 18.0, 13.0, 14.0, 13.0, 13.0, 6.0, 7.0, 10.0, 5.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-7.8291192054748535, -7.59544038772583, -7.361761093139648, -7.128082275390625, -6.894403457641602, -6.66072416305542, -6.4270453453063965, -6.193366050720215, -5.959687232971191, -5.726008415222168, -5.492329120635986, -5.258650302886963, -5.024971008300781, -4.791292190551758, -4.557613372802734, -4.323934555053711, -4.090255260467529, -3.8565762042999268, -3.622897148132324, -3.389218330383301, -3.1555392742156982, -2.9218602180480957, -2.6881814002990723, -2.4545023441314697, -2.220823287963867, -1.9871442317962646, -1.7534652948379517, -1.5197863578796387, -1.2861073017120361, -1.0524282455444336, -0.8187493085861206, -0.5850703716278076, -0.3513913154602051, -0.11771231889724731, 0.11596667766571045, 0.3496456742286682, 0.583324670791626, 0.8170037269592285, 1.0506826639175415, 1.2843616008758545, 1.518040657043457, 1.7517197132110596, 1.9853986501693726, 2.2190775871276855, 2.452756643295288, 2.6864356994628906, 2.920114517211914, 3.1537935733795166, 3.387472629547119, 3.6211516857147217, 3.854830741882324, 4.088509559631348, 4.322188377380371, 4.555867671966553, 4.789546489715576, 5.023225784301758, 5.256904602050781, 5.490583419799805, 5.724262714385986, 5.95794153213501, 6.191620826721191, 6.425299644470215, 6.658978462219238, 6.892657279968262, 7.126336574554443]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 5.0, 9.0, 11.0, 15.0, 24.0, 53.0, 74.0, 85.0, 149.0, 266.0, 396.0, 569.0, 936.0, 1522.0, 2458.0, 3753.0, 6155.0, 9833.0, 16517.0, 26869.0, 44211.0, 71181.0, 114181.0, 172471.0, 198012.0, 141613.0, 90994.0, 56703.0, 34497.0, 21124.0, 13022.0, 7769.0, 4978.0, 2966.0, 1956.0, 1151.0, 724.0, 449.0, 287.0, 221.0, 129.0, 85.0, 47.0, 39.0, 19.0, 13.0, 13.0, 5.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.11328125, -1.079803466796875, -1.04632568359375, -1.012847900390625, -0.9793701171875, -0.945892333984375, -0.91241455078125, -0.878936767578125, -0.845458984375, -0.811981201171875, -0.77850341796875, -0.745025634765625, -0.7115478515625, -0.678070068359375, -0.64459228515625, -0.611114501953125, -0.57763671875, -0.544158935546875, -0.51068115234375, -0.477203369140625, -0.4437255859375, -0.410247802734375, -0.37677001953125, -0.343292236328125, -0.309814453125, -0.276336669921875, -0.24285888671875, -0.209381103515625, -0.1759033203125, -0.142425537109375, -0.10894775390625, -0.075469970703125, -0.0419921875, -0.008514404296875, 0.02496337890625, 0.058441162109375, 0.0919189453125, 0.125396728515625, 0.15887451171875, 0.192352294921875, 0.225830078125, 0.259307861328125, 0.29278564453125, 0.326263427734375, 0.3597412109375, 0.393218994140625, 0.42669677734375, 0.460174560546875, 0.49365234375, 0.527130126953125, 0.56060791015625, 0.594085693359375, 0.6275634765625, 0.661041259765625, 0.69451904296875, 0.727996826171875, 0.761474609375, 0.794952392578125, 0.82843017578125, 0.861907958984375, 0.8953857421875, 0.928863525390625, 0.96234130859375, 0.995819091796875, 1.029296875]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 4.0, 3.0, 5.0, 4.0, 5.0, 6.0, 6.0, 11.0, 9.0, 15.0, 19.0, 20.0, 25.0, 23.0, 30.0, 35.0, 34.0, 37.0, 33.0, 45.0, 44.0, 40.0, 44.0, 39.0, 45.0, 27.0, 37.0, 44.0, 37.0, 26.0, 31.0, 24.0, 30.0, 26.0, 17.0, 20.0, 16.0, 15.0, 18.0, 12.0, 5.0, 10.0, 7.0, 6.0, 3.0, 4.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-7.1171875, -6.8917236328125, -6.666259765625, -6.4407958984375, -6.21533203125, -5.9898681640625, -5.764404296875, -5.5389404296875, -5.3134765625, -5.0880126953125, -4.862548828125, -4.6370849609375, -4.41162109375, -4.1861572265625, -3.960693359375, -3.7352294921875, -3.509765625, -3.2843017578125, -3.058837890625, -2.8333740234375, -2.60791015625, -2.3824462890625, -2.156982421875, -1.9315185546875, -1.7060546875, -1.4805908203125, -1.255126953125, -1.0296630859375, -0.80419921875, -0.5787353515625, -0.353271484375, -0.1278076171875, 0.09765625, 0.3231201171875, 0.548583984375, 0.7740478515625, 0.99951171875, 1.2249755859375, 1.450439453125, 1.6759033203125, 1.9013671875, 2.1268310546875, 2.352294921875, 2.5777587890625, 2.80322265625, 3.0286865234375, 3.254150390625, 3.4796142578125, 3.705078125, 3.9305419921875, 4.156005859375, 4.3814697265625, 4.60693359375, 4.8323974609375, 5.057861328125, 5.2833251953125, 5.5087890625, 5.7342529296875, 5.959716796875, 6.1851806640625, 6.41064453125, 6.6361083984375, 6.861572265625, 7.0870361328125, 7.3125]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 5.0, 6.0, 4.0, 5.0, 10.0, 16.0, 20.0, 25.0, 52.0, 63.0, 103.0, 151.0, 187.0, 283.0, 362.0, 576.0, 856.0, 1192.0, 1770.0, 2693.0, 4180.0, 6364.0, 9929.0, 15863.0, 25016.0, 40493.0, 63201.0, 99034.0, 147348.0, 182905.0, 154296.0, 105721.0, 68582.0, 42994.0, 26881.0, 16952.0, 10626.0, 6717.0, 4371.0, 2925.0, 1813.0, 1245.0, 880.0, 580.0, 373.0, 257.0, 175.0, 150.0, 94.0, 78.0, 39.0, 36.0, 20.0, 20.0, 16.0, 8.0, 4.0, 6.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.919921875, -0.88983154296875, -0.8597412109375, -0.82965087890625, -0.799560546875, -0.76947021484375, -0.7393798828125, -0.70928955078125, -0.67919921875, -0.64910888671875, -0.6190185546875, -0.58892822265625, -0.558837890625, -0.52874755859375, -0.4986572265625, -0.46856689453125, -0.4384765625, -0.40838623046875, -0.3782958984375, -0.34820556640625, -0.318115234375, -0.28802490234375, -0.2579345703125, -0.22784423828125, -0.19775390625, -0.16766357421875, -0.1375732421875, -0.10748291015625, -0.077392578125, -0.04730224609375, -0.0172119140625, 0.01287841796875, 0.04296875, 0.07305908203125, 0.1031494140625, 0.13323974609375, 0.163330078125, 0.19342041015625, 0.2235107421875, 0.25360107421875, 0.28369140625, 0.31378173828125, 0.3438720703125, 0.37396240234375, 0.404052734375, 0.43414306640625, 0.4642333984375, 0.49432373046875, 0.5244140625, 0.55450439453125, 0.5845947265625, 0.61468505859375, 0.644775390625, 0.67486572265625, 0.7049560546875, 0.73504638671875, 0.76513671875, 0.79522705078125, 0.8253173828125, 0.85540771484375, 0.885498046875, 0.91558837890625, 0.9456787109375, 0.97576904296875, 1.005859375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 2.0, 8.0, 4.0, 4.0, 11.0, 13.0, 21.0, 20.0, 22.0, 36.0, 18.0, 29.0, 38.0, 26.0, 33.0, 36.0, 39.0, 42.0, 40.0, 46.0, 41.0, 36.0, 41.0, 37.0, 30.0, 50.0, 41.0, 38.0, 30.0, 17.0, 23.0, 20.0, 14.0, 12.0, 13.0, 12.0, 9.0, 7.0, 9.0, 12.0, 4.0, 6.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3359375, -4.1962890625, -4.056640625, -3.9169921875, -3.77734375, -3.6376953125, -3.498046875, -3.3583984375, -3.21875, -3.0791015625, -2.939453125, -2.7998046875, -2.66015625, -2.5205078125, -2.380859375, -2.2412109375, -2.1015625, -1.9619140625, -1.822265625, -1.6826171875, -1.54296875, -1.4033203125, -1.263671875, -1.1240234375, -0.984375, -0.8447265625, -0.705078125, -0.5654296875, -0.42578125, -0.2861328125, -0.146484375, -0.0068359375, 0.1328125, 0.2724609375, 0.412109375, 0.5517578125, 0.69140625, 0.8310546875, 0.970703125, 1.1103515625, 1.25, 1.3896484375, 1.529296875, 1.6689453125, 1.80859375, 1.9482421875, 2.087890625, 2.2275390625, 2.3671875, 2.5068359375, 2.646484375, 2.7861328125, 2.92578125, 3.0654296875, 3.205078125, 3.3447265625, 3.484375, 3.6240234375, 3.763671875, 3.9033203125, 4.04296875, 4.1826171875, 4.322265625, 4.4619140625, 4.6015625]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 6.0, 16.0, 12.0, 21.0, 30.0, 39.0, 40.0, 62.0, 85.0, 125.0, 176.0, 255.0, 359.0, 598.0, 799.0, 1179.0, 1881.0, 3086.0, 5099.0, 8836.0, 16840.0, 33598.0, 75392.0, 180844.0, 356251.0, 200178.0, 83461.0, 37136.0, 18115.0, 9496.0, 5345.0, 3170.0, 2063.0, 1340.0, 851.0, 543.0, 380.0, 244.0, 171.0, 113.0, 97.0, 55.0, 51.0, 39.0, 29.0, 17.0, 14.0, 8.0, 5.0, 6.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.08929443359375, -0.08655166625976562, -0.08380889892578125, -0.08106613159179688, -0.0783233642578125, -0.07558059692382812, -0.07283782958984375, -0.07009506225585938, -0.067352294921875, -0.06460952758789062, -0.06186676025390625, -0.059123992919921875, -0.0563812255859375, -0.053638458251953125, -0.05089569091796875, -0.048152923583984375, -0.04541015625, -0.042667388916015625, -0.03992462158203125, -0.037181854248046875, -0.0344390869140625, -0.031696319580078125, -0.02895355224609375, -0.026210784912109375, -0.023468017578125, -0.020725250244140625, -0.01798248291015625, -0.015239715576171875, -0.0124969482421875, -0.009754180908203125, -0.00701141357421875, -0.004268646240234375, -0.00152587890625, 0.001216888427734375, 0.00395965576171875, 0.006702423095703125, 0.0094451904296875, 0.012187957763671875, 0.01493072509765625, 0.017673492431640625, 0.020416259765625, 0.023159027099609375, 0.02590179443359375, 0.028644561767578125, 0.0313873291015625, 0.034130096435546875, 0.03687286376953125, 0.039615631103515625, 0.0423583984375, 0.045101165771484375, 0.04784393310546875, 0.050586700439453125, 0.0533294677734375, 0.056072235107421875, 0.05881500244140625, 0.061557769775390625, 0.064300537109375, 0.06704330444335938, 0.06978607177734375, 0.07252883911132812, 0.0752716064453125, 0.07801437377929688, 0.08075714111328125, 0.08349990844726562, 0.08624267578125]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 6.0, 4.0, 6.0, 6.0, 8.0, 15.0, 19.0, 29.0, 28.0, 22.0, 35.0, 58.0, 44.0, 53.0, 60.0, 85.0, 53.0, 64.0, 56.0, 57.0, 51.0, 45.0, 34.0, 30.0, 37.0, 22.0, 16.0, 12.0, 17.0, 8.0, 6.0, 6.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.4603137969970703e-05, -1.416727900505066e-05, -1.3731420040130615e-05, -1.3295561075210571e-05, -1.2859702110290527e-05, -1.2423843145370483e-05, -1.198798418045044e-05, -1.1552125215530396e-05, -1.1116266250610352e-05, -1.0680407285690308e-05, -1.0244548320770264e-05, -9.80868935585022e-06, -9.372830390930176e-06, -8.936971426010132e-06, -8.501112461090088e-06, -8.065253496170044e-06, -7.62939453125e-06, -7.193535566329956e-06, -6.757676601409912e-06, -6.321817636489868e-06, -5.885958671569824e-06, -5.45009970664978e-06, -5.014240741729736e-06, -4.578381776809692e-06, -4.1425228118896484e-06, -3.7066638469696045e-06, -3.2708048820495605e-06, -2.8349459171295166e-06, -2.3990869522094727e-06, -1.9632279872894287e-06, -1.5273690223693848e-06, -1.0915100574493408e-06, -6.556510925292969e-07, -2.1979212760925293e-07, 2.1606683731079102e-07, 6.51925802230835e-07, 1.087784767150879e-06, 1.5236437320709229e-06, 1.959502696990967e-06, 2.3953616619110107e-06, 2.8312206268310547e-06, 3.2670795917510986e-06, 3.7029385566711426e-06, 4.1387975215911865e-06, 4.5746564865112305e-06, 5.010515451431274e-06, 5.446374416351318e-06, 5.882233381271362e-06, 6.318092346191406e-06, 6.75395131111145e-06, 7.189810276031494e-06, 7.625669240951538e-06, 8.061528205871582e-06, 8.497387170791626e-06, 8.93324613571167e-06, 9.369105100631714e-06, 9.804964065551758e-06, 1.0240823030471802e-05, 1.0676681995391846e-05, 1.111254096031189e-05, 1.1548399925231934e-05, 1.1984258890151978e-05, 1.2420117855072021e-05, 1.2855976819992065e-05, 1.329183578491211e-05]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 3.0, 5.0, 5.0, 2.0, 10.0, 17.0, 19.0, 35.0, 46.0, 84.0, 123.0, 198.0, 317.0, 530.0, 861.0, 1433.0, 2378.0, 4222.0, 7223.0, 13691.0, 28072.0, 65528.0, 178988.0, 394746.0, 209504.0, 74739.0, 31405.0, 15415.0, 8026.0, 4378.0, 2613.0, 1498.0, 929.0, 534.0, 358.0, 212.0, 156.0, 89.0, 58.0, 36.0, 28.0, 24.0, 10.0, 6.0, 5.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10968017578125, -0.10570240020751953, -0.10172462463378906, -0.0977468490600586, -0.09376907348632812, -0.08979129791259766, -0.08581352233886719, -0.08183574676513672, -0.07785797119140625, -0.07388019561767578, -0.06990242004394531, -0.06592464447021484, -0.061946868896484375, -0.057969093322753906, -0.05399131774902344, -0.05001354217529297, -0.0460357666015625, -0.04205799102783203, -0.03808021545410156, -0.034102439880371094, -0.030124664306640625, -0.026146888732910156, -0.022169113159179688, -0.01819133758544922, -0.01421356201171875, -0.010235786437988281, -0.0062580108642578125, -0.0022802352905273438, 0.001697540283203125, 0.005675315856933594, 0.009653091430664062, 0.013630867004394531, 0.017608642578125, 0.02158641815185547, 0.025564193725585938, 0.029541969299316406, 0.033519744873046875, 0.037497520446777344, 0.04147529602050781, 0.04545307159423828, 0.04943084716796875, 0.05340862274169922, 0.05738639831542969, 0.061364173889160156, 0.06534194946289062, 0.0693197250366211, 0.07329750061035156, 0.07727527618408203, 0.0812530517578125, 0.08523082733154297, 0.08920860290527344, 0.0931863784790039, 0.09716415405273438, 0.10114192962646484, 0.10511970520019531, 0.10909748077392578, 0.11307525634765625, 0.11705303192138672, 0.12103080749511719, 0.12500858306884766, 0.12898635864257812, 0.1329641342163086, 0.13694190979003906, 0.14091968536376953, 0.1448974609375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 8.0, 6.0, 8.0, 8.0, 8.0, 11.0, 15.0, 10.0, 14.0, 23.0, 16.0, 34.0, 38.0, 49.0, 40.0, 58.0, 59.0, 79.0, 80.0, 68.0, 67.0, 54.0, 32.0, 28.0, 40.0, 30.0, 25.0, 17.0, 15.0, 11.0, 8.0, 10.0, 8.0, 6.0, 4.0, 3.0, 7.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.043060302734375, -0.04184532165527344, -0.040630340576171875, -0.03941535949707031, -0.03820037841796875, -0.03698539733886719, -0.035770416259765625, -0.03455543518066406, -0.0333404541015625, -0.03212547302246094, -0.030910491943359375, -0.029695510864257812, -0.02848052978515625, -0.027265548706054688, -0.026050567626953125, -0.024835586547851562, -0.02362060546875, -0.022405624389648438, -0.021190643310546875, -0.019975662231445312, -0.01876068115234375, -0.017545700073242188, -0.016330718994140625, -0.015115737915039062, -0.0139007568359375, -0.012685775756835938, -0.011470794677734375, -0.010255813598632812, -0.00904083251953125, -0.007825851440429688, -0.006610870361328125, -0.0053958892822265625, -0.004180908203125, -0.0029659271240234375, -0.001750946044921875, -0.0005359649658203125, 0.00067901611328125, 0.0018939971923828125, 0.003108978271484375, 0.0043239593505859375, 0.0055389404296875, 0.0067539215087890625, 0.007968902587890625, 0.009183883666992188, 0.01039886474609375, 0.011613845825195312, 0.012828826904296875, 0.014043807983398438, 0.0152587890625, 0.016473770141601562, 0.017688751220703125, 0.018903732299804688, 0.02011871337890625, 0.021333694458007812, 0.022548675537109375, 0.023763656616210938, 0.0249786376953125, 0.026193618774414062, 0.027408599853515625, 0.028623580932617188, 0.02983856201171875, 0.031053543090820312, 0.032268524169921875, 0.03348350524902344, 0.034698486328125]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 13.0, 5.0, 7.0, 13.0, 26.0, 31.0, 28.0, 49.0, 41.0, 64.0, 80.0, 85.0, 92.0, 96.0, 76.0, 67.0, 47.0, 31.0, 37.0, 24.0, 15.0, 15.0, 12.0, 15.0, 11.0, 8.0, 3.0, 4.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.860321044921875, -10.564451217651367, -10.26858139038086, -9.972710609436035, -9.676840782165527, -9.38097095489502, -9.085101127624512, -8.789231300354004, -8.49336051940918, -8.197490692138672, -7.901620388031006, -7.605750560760498, -7.309880256652832, -7.014010429382324, -6.718140602111816, -6.422270774841309, -6.126400947570801, -5.830531120300293, -5.534660816192627, -5.238790988922119, -4.942920684814453, -4.647050857543945, -4.3511810302734375, -4.05531120300293, -3.7594408988952637, -3.4635708332061768, -3.16770076751709, -2.871830940246582, -2.575960874557495, -2.280090808868408, -1.9842208623886108, -1.6883509159088135, -1.3924798965454102, -1.0966098308563232, -0.8007398843765259, -0.5048698782920837, -0.2089998722076416, 0.08687019348144531, 0.3827401399612427, 0.67861008644104, 0.974480152130127, 1.2703502178192139, 1.5662201642990112, 1.8620901107788086, 2.1579601764678955, 2.4538302421569824, 2.7497000694274902, 3.045570135116577, 3.341440200805664, 3.637310266494751, 3.933180332183838, 4.229050159454346, 4.524920463562012, 4.8207902908325195, 5.116660118103027, 5.412529945373535, 5.708400249481201, 6.004270076751709, 6.300140380859375, 6.596010208129883, 6.891880035400391, 7.187750339508057, 7.4836201667785645, 7.7794904708862305, 8.075360298156738]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 3.0, 6.0, 5.0, 4.0, 6.0, 8.0, 18.0, 15.0, 12.0, 23.0, 27.0, 22.0, 19.0, 34.0, 35.0, 32.0, 29.0, 50.0, 49.0, 42.0, 53.0, 45.0, 37.0, 36.0, 39.0, 36.0, 42.0, 32.0, 28.0, 30.0, 32.0, 30.0, 19.0, 19.0, 13.0, 14.0, 13.0, 14.0, 5.0, 7.0, 10.0, 5.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-7.827064037322998, -7.593979358673096, -7.360895156860352, -7.127810478210449, -6.894725799560547, -6.6616411209106445, -6.4285569190979, -6.195472240447998, -5.962388038635254, -5.729303359985352, -5.496219158172607, -5.263134479522705, -5.030049800872803, -4.796965599060059, -4.563880920410156, -4.330796241760254, -4.097711563110352, -3.8646271228790283, -3.631542444229126, -3.3984580039978027, -3.1653733253479004, -2.932288885116577, -2.699204444885254, -2.4661197662353516, -2.2330353260040283, -1.9999507665634155, -1.7668662071228027, -1.5337817668914795, -1.3006972074508667, -1.067612648010254, -0.8345282077789307, -0.6014436483383179, -0.3683590888977051, -0.13527455925941467, 0.09780997037887573, 0.33089447021484375, 0.5639790296554565, 0.7970635890960693, 1.0301480293273926, 1.2632325887680054, 1.4963171482086182, 1.729401707649231, 1.9624862670898438, 2.195570707321167, 2.4286551475524902, 2.6617398262023926, 2.894824266433716, 3.127908706665039, 3.3609933853149414, 3.5940778255462646, 3.827162504196167, 4.06024694442749, 4.293331623077393, 4.526415824890137, 4.759500503540039, 4.992585182189941, 5.225669860839844, 5.458754539489746, 5.69183874130249, 5.924923419952393, 6.158008098602295, 6.391092300415039, 6.624176979064941, 6.857261657714844, 7.090345859527588]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 11.0, 8.0, 19.0, 21.0, 25.0, 37.0, 64.0, 121.0, 170.0, 277.0, 464.0, 667.0, 1063.0, 1743.0, 2841.0, 4701.0, 7629.0, 12712.0, 20822.0, 34855.0, 55489.0, 87873.0, 126121.0, 156970.0, 159646.0, 130174.0, 91454.0, 59144.0, 36919.0, 22326.0, 13235.0, 8159.0, 4870.0, 3038.0, 1819.0, 1100.0, 740.0, 462.0, 287.0, 160.0, 103.0, 71.0, 44.0, 37.0, 23.0, 20.0, 14.0, 6.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.55859375, -5.38519287109375, -5.2117919921875, -5.03839111328125, -4.864990234375, -4.69158935546875, -4.5181884765625, -4.34478759765625, -4.17138671875, -3.99798583984375, -3.8245849609375, -3.65118408203125, -3.477783203125, -3.30438232421875, -3.1309814453125, -2.95758056640625, -2.7841796875, -2.61077880859375, -2.4373779296875, -2.26397705078125, -2.090576171875, -1.91717529296875, -1.7437744140625, -1.57037353515625, -1.39697265625, -1.22357177734375, -1.0501708984375, -0.87677001953125, -0.703369140625, -0.52996826171875, -0.3565673828125, -0.18316650390625, -0.009765625, 0.16363525390625, 0.3370361328125, 0.51043701171875, 0.683837890625, 0.85723876953125, 1.0306396484375, 1.20404052734375, 1.37744140625, 1.55084228515625, 1.7242431640625, 1.89764404296875, 2.071044921875, 2.24444580078125, 2.4178466796875, 2.59124755859375, 2.7646484375, 2.93804931640625, 3.1114501953125, 3.28485107421875, 3.458251953125, 3.63165283203125, 3.8050537109375, 3.97845458984375, 4.15185546875, 4.32525634765625, 4.4986572265625, 4.67205810546875, 4.845458984375, 5.01885986328125, 5.1922607421875, 5.36566162109375, 5.5390625]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 4.0, 5.0, 6.0, 6.0, 9.0, 15.0, 13.0, 26.0, 22.0, 21.0, 29.0, 30.0, 40.0, 27.0, 44.0, 50.0, 44.0, 46.0, 62.0, 50.0, 49.0, 33.0, 40.0, 52.0, 44.0, 32.0, 29.0, 32.0, 36.0, 18.0, 16.0, 20.0, 13.0, 9.0, 6.0, 7.0, 11.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.0234375, -8.75909423828125, -8.4947509765625, -8.23040771484375, -7.966064453125, -7.70172119140625, -7.4373779296875, -7.17303466796875, -6.90869140625, -6.64434814453125, -6.3800048828125, -6.11566162109375, -5.851318359375, -5.58697509765625, -5.3226318359375, -5.05828857421875, -4.7939453125, -4.52960205078125, -4.2652587890625, -4.00091552734375, -3.736572265625, -3.47222900390625, -3.2078857421875, -2.94354248046875, -2.67919921875, -2.41485595703125, -2.1505126953125, -1.88616943359375, -1.621826171875, -1.35748291015625, -1.0931396484375, -0.82879638671875, -0.564453125, -0.30010986328125, -0.0357666015625, 0.22857666015625, 0.492919921875, 0.75726318359375, 1.0216064453125, 1.28594970703125, 1.55029296875, 1.81463623046875, 2.0789794921875, 2.34332275390625, 2.607666015625, 2.87200927734375, 3.1363525390625, 3.40069580078125, 3.6650390625, 3.92938232421875, 4.1937255859375, 4.45806884765625, 4.722412109375, 4.98675537109375, 5.2510986328125, 5.51544189453125, 5.77978515625, 6.04412841796875, 6.3084716796875, 6.57281494140625, 6.837158203125, 7.10150146484375, 7.3658447265625, 7.63018798828125, 7.89453125]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 6.0, 5.0, 6.0, 18.0, 22.0, 26.0, 49.0, 51.0, 70.0, 114.0, 161.0, 232.0, 368.0, 522.0, 751.0, 1153.0, 1758.0, 2608.0, 3985.0, 6164.0, 9789.0, 15514.0, 24429.0, 38564.0, 59334.0, 87747.0, 118681.0, 143394.0, 145240.0, 122637.0, 90784.0, 62331.0, 40461.0, 25700.0, 16388.0, 10369.0, 6597.0, 4257.0, 2718.0, 1853.0, 1155.0, 794.0, 573.0, 372.0, 241.0, 184.0, 126.0, 83.0, 71.0, 40.0, 18.0, 25.0, 14.0, 7.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.703125, -4.55169677734375, -4.4002685546875, -4.24884033203125, -4.097412109375, -3.94598388671875, -3.7945556640625, -3.64312744140625, -3.49169921875, -3.34027099609375, -3.1888427734375, -3.03741455078125, -2.885986328125, -2.73455810546875, -2.5831298828125, -2.43170166015625, -2.2802734375, -2.12884521484375, -1.9774169921875, -1.82598876953125, -1.674560546875, -1.52313232421875, -1.3717041015625, -1.22027587890625, -1.06884765625, -0.91741943359375, -0.7659912109375, -0.61456298828125, -0.463134765625, -0.31170654296875, -0.1602783203125, -0.00885009765625, 0.142578125, 0.29400634765625, 0.4454345703125, 0.59686279296875, 0.748291015625, 0.89971923828125, 1.0511474609375, 1.20257568359375, 1.35400390625, 1.50543212890625, 1.6568603515625, 1.80828857421875, 1.959716796875, 2.11114501953125, 2.2625732421875, 2.41400146484375, 2.5654296875, 2.71685791015625, 2.8682861328125, 3.01971435546875, 3.171142578125, 3.32257080078125, 3.4739990234375, 3.62542724609375, 3.77685546875, 3.92828369140625, 4.0797119140625, 4.23114013671875, 4.382568359375, 4.53399658203125, 4.6854248046875, 4.83685302734375, 4.98828125]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 4.0, 3.0, 2.0, 4.0, 5.0, 8.0, 10.0, 8.0, 12.0, 2.0, 17.0, 13.0, 19.0, 18.0, 27.0, 25.0, 39.0, 32.0, 40.0, 37.0, 39.0, 42.0, 44.0, 45.0, 39.0, 32.0, 44.0, 50.0, 36.0, 40.0, 41.0, 38.0, 23.0, 17.0, 23.0, 18.0, 19.0, 26.0, 10.0, 11.0, 12.0, 12.0, 8.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.5234375, -4.39093017578125, -4.2584228515625, -4.12591552734375, -3.993408203125, -3.86090087890625, -3.7283935546875, -3.59588623046875, -3.46337890625, -3.33087158203125, -3.1983642578125, -3.06585693359375, -2.933349609375, -2.80084228515625, -2.6683349609375, -2.53582763671875, -2.4033203125, -2.27081298828125, -2.1383056640625, -2.00579833984375, -1.873291015625, -1.74078369140625, -1.6082763671875, -1.47576904296875, -1.34326171875, -1.21075439453125, -1.0782470703125, -0.94573974609375, -0.813232421875, -0.68072509765625, -0.5482177734375, -0.41571044921875, -0.283203125, -0.15069580078125, -0.0181884765625, 0.11431884765625, 0.246826171875, 0.37933349609375, 0.5118408203125, 0.64434814453125, 0.77685546875, 0.90936279296875, 1.0418701171875, 1.17437744140625, 1.306884765625, 1.43939208984375, 1.5718994140625, 1.70440673828125, 1.8369140625, 1.96942138671875, 2.1019287109375, 2.23443603515625, 2.366943359375, 2.49945068359375, 2.6319580078125, 2.76446533203125, 2.89697265625, 3.02947998046875, 3.1619873046875, 3.29449462890625, 3.427001953125, 3.55950927734375, 3.6920166015625, 3.82452392578125, 3.95703125]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 7.0, 2.0, 3.0, 11.0, 8.0, 16.0, 22.0, 31.0, 50.0, 94.0, 111.0, 148.0, 268.0, 428.0, 662.0, 958.0, 1372.0, 2223.0, 3378.0, 5403.0, 8566.0, 13993.0, 22960.0, 38365.0, 62211.0, 98436.0, 144492.0, 176574.0, 161085.0, 114500.0, 73579.0, 45598.0, 27832.0, 16784.0, 10522.0, 6463.0, 4040.0, 2494.0, 1654.0, 1084.0, 715.0, 478.0, 300.0, 205.0, 153.0, 98.0, 52.0, 58.0, 37.0, 10.0, 18.0, 7.0, 7.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6513671875, -1.5937957763671875, -1.536224365234375, -1.4786529541015625, -1.42108154296875, -1.3635101318359375, -1.305938720703125, -1.2483673095703125, -1.1907958984375, -1.1332244873046875, -1.075653076171875, -1.0180816650390625, -0.96051025390625, -0.9029388427734375, -0.845367431640625, -0.7877960205078125, -0.730224609375, -0.6726531982421875, -0.615081787109375, -0.5575103759765625, -0.49993896484375, -0.4423675537109375, -0.384796142578125, -0.3272247314453125, -0.2696533203125, -0.2120819091796875, -0.154510498046875, -0.0969390869140625, -0.03936767578125, 0.0182037353515625, 0.075775146484375, 0.1333465576171875, 0.19091796875, 0.2484893798828125, 0.306060791015625, 0.3636322021484375, 0.42120361328125, 0.4787750244140625, 0.536346435546875, 0.5939178466796875, 0.6514892578125, 0.7090606689453125, 0.766632080078125, 0.8242034912109375, 0.88177490234375, 0.9393463134765625, 0.996917724609375, 1.0544891357421875, 1.112060546875, 1.1696319580078125, 1.227203369140625, 1.2847747802734375, 1.34234619140625, 1.3999176025390625, 1.457489013671875, 1.5150604248046875, 1.5726318359375, 1.6302032470703125, 1.687774658203125, 1.7453460693359375, 1.80291748046875, 1.8604888916015625, 1.918060302734375, 1.9756317138671875, 2.033203125]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 2.0, 5.0, 3.0, 8.0, 7.0, 6.0, 13.0, 14.0, 17.0, 18.0, 19.0, 29.0, 22.0, 35.0, 36.0, 42.0, 47.0, 54.0, 48.0, 47.0, 61.0, 42.0, 52.0, 50.0, 42.0, 40.0, 40.0, 44.0, 21.0, 30.0, 21.0, 14.0, 15.0, 12.0, 9.0, 7.0, 7.0, 1.0, 5.0, 5.0, 1.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0001137852668762207, -0.00011017825454473495, -0.0001065712422132492, -0.00010296422988176346, -9.935721755027771e-05, -9.575020521879196e-05, -9.214319288730621e-05, -8.853618055582047e-05, -8.492916822433472e-05, -8.132215589284897e-05, -7.771514356136322e-05, -7.410813122987747e-05, -7.050111889839172e-05, -6.689410656690598e-05, -6.328709423542023e-05, -5.968008190393448e-05, -5.607306957244873e-05, -5.246605724096298e-05, -4.8859044909477234e-05, -4.5252032577991486e-05, -4.164502024650574e-05, -3.803800791501999e-05, -3.443099558353424e-05, -3.082398325204849e-05, -2.7216970920562744e-05, -2.3609958589076996e-05, -2.0002946257591248e-05, -1.63959339261055e-05, -1.2788921594619751e-05, -9.181909263134003e-06, -5.574896931648254e-06, -1.967884600162506e-06, 1.6391277313232422e-06, 5.2461400628089905e-06, 8.853152394294739e-06, 1.2460164725780487e-05, 1.6067177057266235e-05, 1.9674189388751984e-05, 2.3281201720237732e-05, 2.688821405172348e-05, 3.049522638320923e-05, 3.410223871469498e-05, 3.7709251046180725e-05, 4.1316263377666473e-05, 4.492327570915222e-05, 4.853028804063797e-05, 5.213730037212372e-05, 5.5744312703609467e-05, 5.9351325035095215e-05, 6.295833736658096e-05, 6.656534969806671e-05, 7.017236202955246e-05, 7.377937436103821e-05, 7.738638669252396e-05, 8.09933990240097e-05, 8.460041135549545e-05, 8.82074236869812e-05, 9.181443601846695e-05, 9.54214483499527e-05, 9.902846068143845e-05, 0.0001026354730129242, 0.00010624248534440994, 0.00010984949767589569, 0.00011345651000738144, 0.00011706352233886719]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 3.0, 5.0, 9.0, 17.0, 19.0, 25.0, 38.0, 76.0, 106.0, 170.0, 287.0, 438.0, 707.0, 1090.0, 1958.0, 3152.0, 5538.0, 9829.0, 17522.0, 32323.0, 59570.0, 105859.0, 170581.0, 211111.0, 176155.0, 111250.0, 63217.0, 33879.0, 18884.0, 10420.0, 5941.0, 3338.0, 1897.0, 1160.0, 720.0, 442.0, 296.0, 195.0, 111.0, 81.0, 34.0, 34.0, 31.0, 12.0, 12.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-2.330078125, -2.2606201171875, -2.191162109375, -2.1217041015625, -2.05224609375, -1.9827880859375, -1.913330078125, -1.8438720703125, -1.7744140625, -1.7049560546875, -1.635498046875, -1.5660400390625, -1.49658203125, -1.4271240234375, -1.357666015625, -1.2882080078125, -1.21875, -1.1492919921875, -1.079833984375, -1.0103759765625, -0.94091796875, -0.8714599609375, -0.802001953125, -0.7325439453125, -0.6630859375, -0.5936279296875, -0.524169921875, -0.4547119140625, -0.38525390625, -0.3157958984375, -0.246337890625, -0.1768798828125, -0.107421875, -0.0379638671875, 0.031494140625, 0.1009521484375, 0.17041015625, 0.2398681640625, 0.309326171875, 0.3787841796875, 0.4482421875, 0.5177001953125, 0.587158203125, 0.6566162109375, 0.72607421875, 0.7955322265625, 0.864990234375, 0.9344482421875, 1.00390625, 1.0733642578125, 1.142822265625, 1.2122802734375, 1.28173828125, 1.3511962890625, 1.420654296875, 1.4901123046875, 1.5595703125, 1.6290283203125, 1.698486328125, 1.7679443359375, 1.83740234375, 1.9068603515625, 1.976318359375, 2.0457763671875, 2.115234375]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 1.0, 4.0, 6.0, 5.0, 10.0, 6.0, 15.0, 21.0, 28.0, 36.0, 48.0, 66.0, 99.0, 89.0, 106.0, 95.0, 81.0, 71.0, 55.0, 43.0, 38.0, 26.0, 16.0, 13.0, 11.0, 2.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.3701171875, -1.3292236328125, -1.288330078125, -1.2474365234375, -1.20654296875, -1.1656494140625, -1.124755859375, -1.0838623046875, -1.04296875, -1.0020751953125, -0.961181640625, -0.9202880859375, -0.87939453125, -0.8385009765625, -0.797607421875, -0.7567138671875, -0.7158203125, -0.6749267578125, -0.634033203125, -0.5931396484375, -0.55224609375, -0.5113525390625, -0.470458984375, -0.4295654296875, -0.388671875, -0.3477783203125, -0.306884765625, -0.2659912109375, -0.22509765625, -0.1842041015625, -0.143310546875, -0.1024169921875, -0.0615234375, -0.0206298828125, 0.020263671875, 0.0611572265625, 0.10205078125, 0.1429443359375, 0.183837890625, 0.2247314453125, 0.265625, 0.3065185546875, 0.347412109375, 0.3883056640625, 0.42919921875, 0.4700927734375, 0.510986328125, 0.5518798828125, 0.5927734375, 0.6336669921875, 0.674560546875, 0.7154541015625, 0.75634765625, 0.7972412109375, 0.838134765625, 0.8790283203125, 0.919921875, 0.9608154296875, 1.001708984375, 1.0426025390625, 1.08349609375, 1.1243896484375, 1.165283203125, 1.2061767578125, 1.2470703125]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 7.0, 2.0, 7.0, 5.0, 10.0, 15.0, 14.0, 22.0, 32.0, 39.0, 44.0, 42.0, 72.0, 72.0, 92.0, 70.0, 80.0, 61.0, 69.0, 53.0, 28.0, 38.0, 27.0, 20.0, 17.0, 22.0, 6.0, 14.0, 7.0, 1.0, 5.0, 4.0, 1.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.017345428466797, -8.749435424804688, -8.481525421142578, -8.213615417480469, -7.945705413818359, -7.67779541015625, -7.409885883331299, -7.1419758796691895, -6.87406587600708, -6.606155872344971, -6.338245868682861, -6.070335865020752, -5.802426338195801, -5.534516334533691, -5.266606330871582, -4.998696327209473, -4.730786323547363, -4.462876319885254, -4.1949663162231445, -3.9270565509796143, -3.659146547317505, -3.3912365436553955, -3.1233267784118652, -2.855416774749756, -2.5875067710876465, -2.319596767425537, -2.0516867637634277, -1.7837769985198975, -1.515866994857788, -1.2479569911956787, -0.9800471067428589, -0.7121372222900391, -0.4442281723022461, -0.1763182282447815, 0.0915917158126831, 0.3595016598701477, 0.6274116039276123, 0.8953216075897217, 1.1632314920425415, 1.4311413764953613, 1.6990513801574707, 1.96696138381958, 2.2348713874816895, 2.5027811527252197, 2.770691156387329, 3.0386011600494385, 3.3065109252929688, 3.574420928955078, 3.8423309326171875, 4.110240936279297, 4.378150939941406, 4.646060943603516, 4.913970947265625, 5.181880950927734, 5.4497904777526855, 5.717700481414795, 5.985610485076904, 6.253520488739014, 6.521430492401123, 6.789340496063232, 7.057250022888184, 7.325160026550293, 7.593070030212402, 7.860980033874512, 8.128890037536621]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 3.0, 7.0, 4.0, 7.0, 7.0, 11.0, 18.0, 22.0, 25.0, 14.0, 16.0, 23.0, 34.0, 29.0, 28.0, 31.0, 31.0, 40.0, 33.0, 39.0, 35.0, 39.0, 38.0, 42.0, 29.0, 50.0, 47.0, 42.0, 32.0, 27.0, 19.0, 27.0, 21.0, 17.0, 26.0, 19.0, 13.0, 10.0, 4.0, 11.0, 7.0, 8.0, 6.0, 2.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.877549171447754, -6.6620073318481445, -6.446465492248535, -6.230923652648926, -6.015382289886475, -5.799840450286865, -5.584298610687256, -5.3687567710876465, -5.153215408325195, -4.937673568725586, -4.722131729125977, -4.506589889526367, -4.291048526763916, -4.075506687164307, -3.8599648475646973, -3.644423007965088, -3.4288811683654785, -3.213339328765869, -2.997797727584839, -2.7822558879852295, -2.566714286804199, -2.35117244720459, -2.1356306076049805, -1.9200888872146606, -1.7045471668243408, -1.489005446434021, -1.2734637260437012, -1.0579218864440918, -0.842380166053772, -0.6268384456634521, -0.4112966060638428, -0.19575488567352295, 0.019786834716796875, 0.2353285849094391, 0.4508703351020813, 0.6664121150970459, 0.8819538354873657, 1.0974955558776855, 1.313037395477295, 1.5285791158676147, 1.7441208362579346, 1.9596625566482544, 2.175204277038574, 2.3907461166381836, 2.606287956237793, 2.8218295574188232, 3.0373713970184326, 3.252912998199463, 3.4684548377990723, 3.6839966773986816, 3.899538278579712, 4.115079879760742, 4.330621719360352, 4.546163558959961, 4.76170539855957, 4.97724723815918, 5.192789077758789, 5.408330917358398, 5.623872756958008, 5.839414596557617, 6.054955959320068, 6.270497798919678, 6.486039638519287, 6.7015814781188965, 6.917122840881348]}, "gradients/decoder.bert.encoder.layer.12.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 6.0, 8.0, 7.0, 12.0, 19.0, 35.0, 39.0, 55.0, 76.0, 119.0, 164.0, 237.0, 391.0, 577.0, 855.0, 1310.0, 2027.0, 3085.0, 5031.0, 8095.0, 13105.0, 21820.0, 37225.0, 64854.0, 116101.0, 214586.0, 404598.0, 708133.0, 929936.0, 738746.0, 422709.0, 222402.0, 118539.0, 64712.0, 36970.0, 21644.0, 13182.0, 8061.0, 5014.0, 3321.0, 2187.0, 1414.0, 920.0, 634.0, 415.0, 312.0, 194.0, 137.0, 95.0, 59.0, 44.0, 27.0, 20.0, 14.0, 9.0, 5.0, 3.0, 2.0], "bins": [-6.85546875, -6.65692138671875, -6.4583740234375, -6.25982666015625, -6.061279296875, -5.86273193359375, -5.6641845703125, -5.46563720703125, -5.26708984375, -5.06854248046875, -4.8699951171875, -4.67144775390625, -4.472900390625, -4.27435302734375, -4.0758056640625, -3.87725830078125, -3.6787109375, -3.48016357421875, -3.2816162109375, -3.08306884765625, -2.884521484375, -2.68597412109375, -2.4874267578125, -2.28887939453125, -2.09033203125, -1.89178466796875, -1.6932373046875, -1.49468994140625, -1.296142578125, -1.09759521484375, -0.8990478515625, -0.70050048828125, -0.501953125, -0.30340576171875, -0.1048583984375, 0.09368896484375, 0.292236328125, 0.49078369140625, 0.6893310546875, 0.88787841796875, 1.08642578125, 1.28497314453125, 1.4835205078125, 1.68206787109375, 1.880615234375, 2.07916259765625, 2.2777099609375, 2.47625732421875, 2.6748046875, 2.87335205078125, 3.0718994140625, 3.27044677734375, 3.468994140625, 3.66754150390625, 3.8660888671875, 4.06463623046875, 4.26318359375, 4.46173095703125, 4.6602783203125, 4.85882568359375, 5.057373046875, 5.25592041015625, 5.4544677734375, 5.65301513671875, 5.8515625]}, "gradients/decoder.bert.encoder.layer.12.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 3.0, 5.0, 7.0, 3.0, 15.0, 16.0, 13.0, 15.0, 18.0, 23.0, 16.0, 26.0, 35.0, 34.0, 39.0, 40.0, 27.0, 36.0, 45.0, 39.0, 39.0, 39.0, 42.0, 51.0, 38.0, 33.0, 40.0, 33.0, 29.0, 30.0, 28.0, 21.0, 17.0, 22.0, 22.0, 10.0, 9.0, 11.0, 13.0, 5.0, 2.0, 6.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.8359375, -4.68536376953125, -4.5347900390625, -4.38421630859375, -4.233642578125, -4.08306884765625, -3.9324951171875, -3.78192138671875, -3.63134765625, -3.48077392578125, -3.3302001953125, -3.17962646484375, -3.029052734375, -2.87847900390625, -2.7279052734375, -2.57733154296875, -2.4267578125, -2.27618408203125, -2.1256103515625, -1.97503662109375, -1.824462890625, -1.67388916015625, -1.5233154296875, -1.37274169921875, -1.22216796875, -1.07159423828125, -0.9210205078125, -0.77044677734375, -0.619873046875, -0.46929931640625, -0.3187255859375, -0.16815185546875, -0.017578125, 0.13299560546875, 0.2835693359375, 0.43414306640625, 0.584716796875, 0.73529052734375, 0.8858642578125, 1.03643798828125, 1.18701171875, 1.33758544921875, 1.4881591796875, 1.63873291015625, 1.789306640625, 1.93988037109375, 2.0904541015625, 2.24102783203125, 2.3916015625, 2.54217529296875, 2.6927490234375, 2.84332275390625, 2.993896484375, 3.14447021484375, 3.2950439453125, 3.44561767578125, 3.59619140625, 3.74676513671875, 3.8973388671875, 4.04791259765625, 4.198486328125, 4.34906005859375, 4.4996337890625, 4.65020751953125, 4.80078125]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 8.0, 12.0, 14.0, 22.0, 25.0, 46.0, 69.0, 107.0, 177.0, 269.0, 415.0, 705.0, 1148.0, 1885.0, 3122.0, 5212.0, 9221.0, 16042.0, 28602.0, 52459.0, 98340.0, 187156.0, 351836.0, 611610.0, 849214.0, 802318.0, 532872.0, 297461.0, 157650.0, 83627.0, 44842.0, 24686.0, 13876.0, 7891.0, 4485.0, 2613.0, 1627.0, 1029.0, 604.0, 345.0, 249.0, 155.0, 87.0, 56.0, 41.0, 24.0, 15.0, 7.0, 5.0, 5.0, 2.0, 2.0], "bins": [-7.33984375, -7.1407470703125, -6.941650390625, -6.7425537109375, -6.54345703125, -6.3443603515625, -6.145263671875, -5.9461669921875, -5.7470703125, -5.5479736328125, -5.348876953125, -5.1497802734375, -4.95068359375, -4.7515869140625, -4.552490234375, -4.3533935546875, -4.154296875, -3.9552001953125, -3.756103515625, -3.5570068359375, -3.35791015625, -3.1588134765625, -2.959716796875, -2.7606201171875, -2.5615234375, -2.3624267578125, -2.163330078125, -1.9642333984375, -1.76513671875, -1.5660400390625, -1.366943359375, -1.1678466796875, -0.96875, -0.7696533203125, -0.570556640625, -0.3714599609375, -0.17236328125, 0.0267333984375, 0.225830078125, 0.4249267578125, 0.6240234375, 0.8231201171875, 1.022216796875, 1.2213134765625, 1.42041015625, 1.6195068359375, 1.818603515625, 2.0177001953125, 2.216796875, 2.4158935546875, 2.614990234375, 2.8140869140625, 3.01318359375, 3.2122802734375, 3.411376953125, 3.6104736328125, 3.8095703125, 4.0086669921875, 4.207763671875, 4.4068603515625, 4.60595703125, 4.8050537109375, 5.004150390625, 5.2032470703125, 5.40234375]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 5.0, 2.0, 2.0, 3.0, 4.0, 4.0, 5.0, 13.0, 14.0, 23.0, 27.0, 23.0, 50.0, 45.0, 55.0, 69.0, 78.0, 91.0, 102.0, 141.0, 192.0, 202.0, 201.0, 217.0, 236.0, 240.0, 252.0, 246.0, 203.0, 216.0, 170.0, 168.0, 115.0, 103.0, 104.0, 83.0, 63.0, 52.0, 52.0, 43.0, 28.0, 27.0, 29.0, 21.0, 18.0, 11.0, 10.0, 6.0, 7.0, 3.0, 2.0, 3.0, 1.0, 0.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-2.12109375, -2.04632568359375, -1.9715576171875, -1.89678955078125, -1.822021484375, -1.74725341796875, -1.6724853515625, -1.59771728515625, -1.52294921875, -1.44818115234375, -1.3734130859375, -1.29864501953125, -1.223876953125, -1.14910888671875, -1.0743408203125, -0.99957275390625, -0.9248046875, -0.85003662109375, -0.7752685546875, -0.70050048828125, -0.625732421875, -0.55096435546875, -0.4761962890625, -0.40142822265625, -0.32666015625, -0.25189208984375, -0.1771240234375, -0.10235595703125, -0.027587890625, 0.04718017578125, 0.1219482421875, 0.19671630859375, 0.271484375, 0.34625244140625, 0.4210205078125, 0.49578857421875, 0.570556640625, 0.64532470703125, 0.7200927734375, 0.79486083984375, 0.86962890625, 0.94439697265625, 1.0191650390625, 1.09393310546875, 1.168701171875, 1.24346923828125, 1.3182373046875, 1.39300537109375, 1.4677734375, 1.54254150390625, 1.6173095703125, 1.69207763671875, 1.766845703125, 1.84161376953125, 1.9163818359375, 1.99114990234375, 2.06591796875, 2.14068603515625, 2.2154541015625, 2.29022216796875, 2.364990234375, 2.43975830078125, 2.5145263671875, 2.58929443359375, 2.6640625]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 6.0, 5.0, 8.0, 14.0, 24.0, 33.0, 32.0, 44.0, 64.0, 58.0, 87.0, 83.0, 99.0, 79.0, 83.0, 64.0, 49.0, 51.0, 32.0, 19.0, 16.0, 21.0, 7.0, 13.0, 1.0, 3.0, 4.0, 5.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.017004013061523, -10.706232070922852, -10.39546012878418, -10.084689140319824, -9.773917198181152, -9.46314525604248, -9.152373313903809, -8.841602325439453, -8.530830383300781, -8.22005844116211, -7.909286975860596, -7.598515033721924, -7.28774356842041, -6.976971626281738, -6.666199684143066, -6.355428218841553, -6.044656276702881, -5.733884334564209, -5.423112869262695, -5.112340927124023, -4.80156946182251, -4.490797519683838, -4.180026054382324, -3.8692541122436523, -3.5584824085235596, -3.247710704803467, -2.936939001083374, -2.6261672973632812, -2.3153953552246094, -2.0046238899230957, -1.6938519477844238, -1.383080244064331, -1.0723085403442383, -0.7615368366241455, -0.45076507329940796, -0.1399933099746704, 0.17077839374542236, 0.48155009746551514, 0.7923219203948975, 1.1030936241149902, 1.413865327835083, 1.7246370315551758, 2.0354087352752686, 2.3461804389953613, 2.656952381134033, 2.967723846435547, 3.2784957885742188, 3.5892674922943115, 3.9000391960144043, 4.210811138153076, 4.52158260345459, 4.832354545593262, 5.143126010894775, 5.453897953033447, 5.764669418334961, 6.075441360473633, 6.386213302612305, 6.696985244750977, 7.00775671005249, 7.318528652191162, 7.629300117492676, 7.940072059631348, 8.25084400177002, 8.561614990234375, 8.872386932373047]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 7.0, 13.0, 7.0, 8.0, 15.0, 16.0, 15.0, 22.0, 19.0, 17.0, 29.0, 40.0, 37.0, 41.0, 45.0, 35.0, 39.0, 37.0, 53.0, 40.0, 54.0, 32.0, 43.0, 35.0, 36.0, 33.0, 27.0, 23.0, 36.0, 18.0, 21.0, 25.0, 20.0, 13.0, 10.0, 5.0, 11.0, 8.0, 3.0, 2.0, 3.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.860989093780518, -6.641122817993164, -6.4212565422058105, -6.201390266418457, -5.9815239906311035, -5.76165771484375, -5.5417914390563965, -5.321925163269043, -5.1020588874816895, -4.882192611694336, -4.662326335906982, -4.442460060119629, -4.222593784332275, -4.002727508544922, -3.7828612327575684, -3.562994956970215, -3.3431286811828613, -3.123262405395508, -2.9033961296081543, -2.683529853820801, -2.4636635780334473, -2.2437973022460938, -2.0239310264587402, -1.8040647506713867, -1.5841984748840332, -1.3643321990966797, -1.1444659233093262, -0.9245996475219727, -0.7047333717346191, -0.4848670959472656, -0.2650008201599121, -0.045134544372558594, 0.17473173141479492, 0.39459800720214844, 0.614464282989502, 0.8343305587768555, 1.054196834564209, 1.2740631103515625, 1.493929386138916, 1.7137956619262695, 1.933661937713623, 2.1535282135009766, 2.37339448928833, 2.5932607650756836, 2.813127040863037, 3.0329933166503906, 3.252859592437744, 3.4727258682250977, 3.692592144012451, 3.9124584197998047, 4.132324695587158, 4.352190971374512, 4.572057247161865, 4.791923522949219, 5.011789798736572, 5.231656074523926, 5.451522350311279, 5.671388626098633, 5.891254901885986, 6.11112117767334, 6.330987453460693, 6.550853729248047, 6.7707200050354, 6.990586280822754, 7.210452556610107]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 3.0, 6.0, 11.0, 11.0, 20.0, 24.0, 44.0, 69.0, 87.0, 150.0, 215.0, 345.0, 466.0, 749.0, 1093.0, 1729.0, 2740.0, 4271.0, 6486.0, 10490.0, 16648.0, 26635.0, 42567.0, 68233.0, 107209.0, 160318.0, 189288.0, 147821.0, 96790.0, 61028.0, 38406.0, 23792.0, 14897.0, 9243.0, 5897.0, 3740.0, 2417.0, 1573.0, 1026.0, 675.0, 429.0, 289.0, 203.0, 139.0, 114.0, 59.0, 40.0, 28.0, 18.0, 14.0, 7.0, 6.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.88818359375, -0.85894775390625, -0.8297119140625, -0.80047607421875, -0.771240234375, -0.74200439453125, -0.7127685546875, -0.68353271484375, -0.654296875, -0.62506103515625, -0.5958251953125, -0.56658935546875, -0.537353515625, -0.50811767578125, -0.4788818359375, -0.44964599609375, -0.42041015625, -0.39117431640625, -0.3619384765625, -0.33270263671875, -0.303466796875, -0.27423095703125, -0.2449951171875, -0.21575927734375, -0.1865234375, -0.15728759765625, -0.1280517578125, -0.09881591796875, -0.069580078125, -0.04034423828125, -0.0111083984375, 0.01812744140625, 0.04736328125, 0.07659912109375, 0.1058349609375, 0.13507080078125, 0.164306640625, 0.19354248046875, 0.2227783203125, 0.25201416015625, 0.28125, 0.31048583984375, 0.3397216796875, 0.36895751953125, 0.398193359375, 0.42742919921875, 0.4566650390625, 0.48590087890625, 0.51513671875, 0.54437255859375, 0.5736083984375, 0.60284423828125, 0.632080078125, 0.66131591796875, 0.6905517578125, 0.71978759765625, 0.7490234375, 0.77825927734375, 0.8074951171875, 0.83673095703125, 0.865966796875, 0.89520263671875, 0.9244384765625, 0.95367431640625, 0.98291015625]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 8.0, 7.0, 9.0, 16.0, 16.0, 12.0, 19.0, 18.0, 26.0, 24.0, 33.0, 40.0, 37.0, 46.0, 42.0, 45.0, 48.0, 43.0, 51.0, 39.0, 54.0, 58.0, 35.0, 35.0, 28.0, 37.0, 36.0, 30.0, 18.0, 13.0, 20.0, 14.0, 8.0, 8.0, 7.0, 9.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.7109375, -7.462158203125, -7.21337890625, -6.964599609375, -6.7158203125, -6.467041015625, -6.21826171875, -5.969482421875, -5.720703125, -5.471923828125, -5.22314453125, -4.974365234375, -4.7255859375, -4.476806640625, -4.22802734375, -3.979248046875, -3.73046875, -3.481689453125, -3.23291015625, -2.984130859375, -2.7353515625, -2.486572265625, -2.23779296875, -1.989013671875, -1.740234375, -1.491455078125, -1.24267578125, -0.993896484375, -0.7451171875, -0.496337890625, -0.24755859375, 0.001220703125, 0.25, 0.498779296875, 0.74755859375, 0.996337890625, 1.2451171875, 1.493896484375, 1.74267578125, 1.991455078125, 2.240234375, 2.489013671875, 2.73779296875, 2.986572265625, 3.2353515625, 3.484130859375, 3.73291015625, 3.981689453125, 4.23046875, 4.479248046875, 4.72802734375, 4.976806640625, 5.2255859375, 5.474365234375, 5.72314453125, 5.971923828125, 6.220703125, 6.469482421875, 6.71826171875, 6.967041015625, 7.2158203125, 7.464599609375, 7.71337890625, 7.962158203125, 8.2109375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 7.0, 3.0, 5.0, 13.0, 20.0, 32.0, 64.0, 80.0, 158.0, 288.0, 549.0, 1028.0, 1973.0, 3842.0, 8281.0, 16502.0, 34253.0, 71317.0, 146805.0, 261859.0, 245315.0, 131681.0, 64577.0, 30382.0, 14729.0, 7296.0, 3589.0, 1875.0, 898.0, 486.0, 254.0, 161.0, 86.0, 55.0, 33.0, 23.0, 11.0, 4.0, 3.0, 4.0, 6.0, 4.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-1.64453125, -1.597442626953125, -1.55035400390625, -1.503265380859375, -1.4561767578125, -1.409088134765625, -1.36199951171875, -1.314910888671875, -1.267822265625, -1.220733642578125, -1.17364501953125, -1.126556396484375, -1.0794677734375, -1.032379150390625, -0.98529052734375, -0.938201904296875, -0.89111328125, -0.844024658203125, -0.79693603515625, -0.749847412109375, -0.7027587890625, -0.655670166015625, -0.60858154296875, -0.561492919921875, -0.514404296875, -0.467315673828125, -0.42022705078125, -0.373138427734375, -0.3260498046875, -0.278961181640625, -0.23187255859375, -0.184783935546875, -0.1376953125, -0.090606689453125, -0.04351806640625, 0.003570556640625, 0.0506591796875, 0.097747802734375, 0.14483642578125, 0.191925048828125, 0.239013671875, 0.286102294921875, 0.33319091796875, 0.380279541015625, 0.4273681640625, 0.474456787109375, 0.52154541015625, 0.568634033203125, 0.61572265625, 0.662811279296875, 0.70989990234375, 0.756988525390625, 0.8040771484375, 0.851165771484375, 0.89825439453125, 0.945343017578125, 0.992431640625, 1.039520263671875, 1.08660888671875, 1.133697509765625, 1.1807861328125, 1.227874755859375, 1.27496337890625, 1.322052001953125, 1.369140625]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 7.0, 3.0, 5.0, 1.0, 8.0, 9.0, 8.0, 12.0, 15.0, 16.0, 16.0, 16.0, 23.0, 15.0, 24.0, 24.0, 34.0, 39.0, 44.0, 29.0, 21.0, 27.0, 54.0, 38.0, 44.0, 38.0, 42.0, 33.0, 52.0, 39.0, 36.0, 29.0, 23.0, 26.0, 22.0, 29.0, 24.0, 17.0, 13.0, 10.0, 9.0, 8.0, 9.0, 10.0, 6.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.734375, -3.60504150390625, -3.4757080078125, -3.34637451171875, -3.217041015625, -3.08770751953125, -2.9583740234375, -2.82904052734375, -2.69970703125, -2.57037353515625, -2.4410400390625, -2.31170654296875, -2.182373046875, -2.05303955078125, -1.9237060546875, -1.79437255859375, -1.6650390625, -1.53570556640625, -1.4063720703125, -1.27703857421875, -1.147705078125, -1.01837158203125, -0.8890380859375, -0.75970458984375, -0.63037109375, -0.50103759765625, -0.3717041015625, -0.24237060546875, -0.113037109375, 0.01629638671875, 0.1456298828125, 0.27496337890625, 0.404296875, 0.53363037109375, 0.6629638671875, 0.79229736328125, 0.921630859375, 1.05096435546875, 1.1802978515625, 1.30963134765625, 1.43896484375, 1.56829833984375, 1.6976318359375, 1.82696533203125, 1.956298828125, 2.08563232421875, 2.2149658203125, 2.34429931640625, 2.4736328125, 2.60296630859375, 2.7322998046875, 2.86163330078125, 2.990966796875, 3.12030029296875, 3.2496337890625, 3.37896728515625, 3.50830078125, 3.63763427734375, 3.7669677734375, 3.89630126953125, 4.025634765625, 4.15496826171875, 4.2843017578125, 4.41363525390625, 4.54296875]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 9.0, 8.0, 11.0, 9.0, 14.0, 30.0, 46.0, 64.0, 87.0, 140.0, 209.0, 293.0, 467.0, 816.0, 1351.0, 2146.0, 3846.0, 7170.0, 14238.0, 32340.0, 84935.0, 262514.0, 406310.0, 140208.0, 49016.0, 20504.0, 9732.0, 4952.0, 2802.0, 1620.0, 958.0, 615.0, 397.0, 233.0, 149.0, 110.0, 70.0, 35.0, 28.0, 27.0, 15.0, 10.0, 14.0, 3.0, 4.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.138427734375, -0.13449859619140625, -0.1305694580078125, -0.12664031982421875, -0.122711181640625, -0.11878204345703125, -0.1148529052734375, -0.11092376708984375, -0.10699462890625, -0.10306549072265625, -0.0991363525390625, -0.09520721435546875, -0.091278076171875, -0.08734893798828125, -0.0834197998046875, -0.07949066162109375, -0.0755615234375, -0.07163238525390625, -0.0677032470703125, -0.06377410888671875, -0.059844970703125, -0.05591583251953125, -0.0519866943359375, -0.04805755615234375, -0.04412841796875, -0.04019927978515625, -0.0362701416015625, -0.03234100341796875, -0.028411865234375, -0.02448272705078125, -0.0205535888671875, -0.01662445068359375, -0.0126953125, -0.00876617431640625, -0.0048370361328125, -0.00090789794921875, 0.003021240234375, 0.00695037841796875, 0.0108795166015625, 0.01480865478515625, 0.01873779296875, 0.02266693115234375, 0.0265960693359375, 0.03052520751953125, 0.034454345703125, 0.03838348388671875, 0.0423126220703125, 0.04624176025390625, 0.0501708984375, 0.05410003662109375, 0.0580291748046875, 0.06195831298828125, 0.065887451171875, 0.06981658935546875, 0.0737457275390625, 0.07767486572265625, 0.08160400390625, 0.08553314208984375, 0.0894622802734375, 0.09339141845703125, 0.097320556640625, 0.10124969482421875, 0.1051788330078125, 0.10910797119140625, 0.113037109375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 2.0, 4.0, 8.0, 9.0, 16.0, 21.0, 25.0, 34.0, 40.0, 52.0, 74.0, 76.0, 87.0, 96.0, 81.0, 93.0, 74.0, 63.0, 48.0, 25.0, 25.0, 19.0, 7.0, 8.0, 6.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8417835235595703e-05, -1.7696060240268707e-05, -1.697428524494171e-05, -1.6252510249614716e-05, -1.553073525428772e-05, -1.4808960258960724e-05, -1.4087185263633728e-05, -1.3365410268306732e-05, -1.2643635272979736e-05, -1.192186027765274e-05, -1.1200085282325745e-05, -1.0478310286998749e-05, -9.756535291671753e-06, -9.034760296344757e-06, -8.312985301017761e-06, -7.591210305690765e-06, -6.8694353103637695e-06, -6.147660315036774e-06, -5.425885319709778e-06, -4.704110324382782e-06, -3.982335329055786e-06, -3.2605603337287903e-06, -2.5387853384017944e-06, -1.8170103430747986e-06, -1.0952353477478027e-06, -3.734603524208069e-07, 3.4831464290618896e-07, 1.0700896382331848e-06, 1.7918646335601807e-06, 2.5136396288871765e-06, 3.2354146242141724e-06, 3.957189619541168e-06, 4.678964614868164e-06, 5.40073961019516e-06, 6.122514605522156e-06, 6.844289600849152e-06, 7.5660645961761475e-06, 8.287839591503143e-06, 9.00961458683014e-06, 9.731389582157135e-06, 1.0453164577484131e-05, 1.1174939572811127e-05, 1.1896714568138123e-05, 1.2618489563465118e-05, 1.3340264558792114e-05, 1.406203955411911e-05, 1.4783814549446106e-05, 1.5505589544773102e-05, 1.6227364540100098e-05, 1.6949139535427094e-05, 1.767091453075409e-05, 1.8392689526081085e-05, 1.911446452140808e-05, 1.9836239516735077e-05, 2.0558014512062073e-05, 2.127978950738907e-05, 2.2001564502716064e-05, 2.272333949804306e-05, 2.3445114493370056e-05, 2.4166889488697052e-05, 2.4888664484024048e-05, 2.5610439479351044e-05, 2.633221447467804e-05, 2.7053989470005035e-05, 2.777576446533203e-05]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 4.0, 6.0, 6.0, 5.0, 8.0, 12.0, 17.0, 29.0, 39.0, 51.0, 74.0, 88.0, 148.0, 199.0, 349.0, 502.0, 843.0, 1475.0, 2608.0, 4752.0, 9224.0, 21095.0, 60727.0, 240937.0, 497717.0, 137301.0, 39056.0, 15130.0, 7096.0, 3747.0, 2137.0, 1186.0, 681.0, 435.0, 314.0, 184.0, 115.0, 76.0, 52.0, 42.0, 31.0, 17.0, 14.0, 11.0, 4.0, 4.0, 5.0, 3.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.17138671875, -0.16533279418945312, -0.15927886962890625, -0.15322494506835938, -0.1471710205078125, -0.14111709594726562, -0.13506317138671875, -0.12900924682617188, -0.122955322265625, -0.11690139770507812, -0.11084747314453125, -0.10479354858398438, -0.0987396240234375, -0.09268569946289062, -0.08663177490234375, -0.08057785034179688, -0.07452392578125, -0.06847000122070312, -0.06241607666015625, -0.056362152099609375, -0.0503082275390625, -0.044254302978515625, -0.03820037841796875, -0.032146453857421875, -0.026092529296875, -0.020038604736328125, -0.01398468017578125, -0.007930755615234375, -0.0018768310546875, 0.004177093505859375, 0.01023101806640625, 0.016284942626953125, 0.0223388671875, 0.028392791748046875, 0.03444671630859375, 0.040500640869140625, 0.0465545654296875, 0.052608489990234375, 0.05866241455078125, 0.06471633911132812, 0.070770263671875, 0.07682418823242188, 0.08287811279296875, 0.08893203735351562, 0.0949859619140625, 0.10103988647460938, 0.10709381103515625, 0.11314773559570312, 0.11920166015625, 0.12525558471679688, 0.13130950927734375, 0.13736343383789062, 0.1434173583984375, 0.14947128295898438, 0.15552520751953125, 0.16157913208007812, 0.167633056640625, 0.17368698120117188, 0.17974090576171875, 0.18579483032226562, 0.1918487548828125, 0.19790267944335938, 0.20395660400390625, 0.21001052856445312, 0.216064453125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 4.0, 6.0, 6.0, 7.0, 9.0, 10.0, 24.0, 23.0, 32.0, 48.0, 60.0, 90.0, 114.0, 119.0, 87.0, 90.0, 80.0, 46.0, 41.0, 35.0, 19.0, 10.0, 5.0, 7.0, 4.0, 2.0, 4.0, 5.0, 2.0, 2.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.06793212890625, -0.06612539291381836, -0.06431865692138672, -0.06251192092895508, -0.06070518493652344, -0.0588984489440918, -0.057091712951660156, -0.055284976959228516, -0.053478240966796875, -0.051671504974365234, -0.049864768981933594, -0.04805803298950195, -0.04625129699707031, -0.04444456100463867, -0.04263782501220703, -0.04083108901977539, -0.03902435302734375, -0.03721761703491211, -0.03541088104248047, -0.03360414505004883, -0.03179740905761719, -0.029990673065185547, -0.028183937072753906, -0.026377201080322266, -0.024570465087890625, -0.022763729095458984, -0.020956993103027344, -0.019150257110595703, -0.017343521118164062, -0.015536785125732422, -0.013730049133300781, -0.01192331314086914, -0.0101165771484375, -0.00830984115600586, -0.006503105163574219, -0.004696369171142578, -0.0028896331787109375, -0.0010828971862792969, 0.0007238388061523438, 0.0025305747985839844, 0.004337310791015625, 0.006144046783447266, 0.007950782775878906, 0.009757518768310547, 0.011564254760742188, 0.013370990753173828, 0.015177726745605469, 0.01698446273803711, 0.01879119873046875, 0.02059793472290039, 0.02240467071533203, 0.024211406707763672, 0.026018142700195312, 0.027824878692626953, 0.029631614685058594, 0.031438350677490234, 0.033245086669921875, 0.035051822662353516, 0.036858558654785156, 0.0386652946472168, 0.04047203063964844, 0.04227876663208008, 0.04408550262451172, 0.04589223861694336, 0.047698974609375]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 3.0, 4.0, 7.0, 6.0, 16.0, 22.0, 30.0, 33.0, 43.0, 61.0, 57.0, 79.0, 93.0, 90.0, 87.0, 71.0, 78.0, 47.0, 53.0, 32.0, 24.0, 15.0, 19.0, 9.0, 12.0, 4.0, 1.0, 5.0, 5.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.06884765625, -10.758285522460938, -10.447723388671875, -10.137161254882812, -9.82659912109375, -9.516037940979004, -9.205475807189941, -8.894913673400879, -8.584351539611816, -8.273789405822754, -7.963227272033691, -7.652665615081787, -7.342103481292725, -7.031541347503662, -6.720979690551758, -6.410417556762695, -6.099855422973633, -5.78929328918457, -5.478731155395508, -5.1681694984436035, -4.857607364654541, -4.5470452308654785, -4.236483573913574, -3.9259214401245117, -3.615359306335449, -3.3047971725463867, -2.9942352771759033, -2.68367338180542, -2.3731112480163574, -2.062549114227295, -1.7519872188568115, -1.4414253234863281, -1.130864143371582, -0.8203021287918091, -0.5097401142120361, -0.19917809963226318, 0.11138391494750977, 0.4219459295272827, 0.7325079441070557, 1.043069839477539, 1.3536319732666016, 1.6641939878463745, 1.9747560024261475, 2.285317897796631, 2.5958800315856934, 2.906442165374756, 3.2170040607452393, 3.5275659561157227, 3.838128089904785, 4.148690223693848, 4.45925235748291, 4.7698140144348145, 5.080376148223877, 5.3909382820129395, 5.701499938964844, 6.012062072753906, 6.322624206542969, 6.633186340332031, 6.943748474121094, 7.254310131072998, 7.5648722648620605, 7.875434398651123, 8.185996055603027, 8.49655818939209, 8.807120323181152]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 8.0, 13.0, 7.0, 8.0, 15.0, 16.0, 15.0, 22.0, 18.0, 18.0, 28.0, 41.0, 35.0, 43.0, 44.0, 34.0, 40.0, 37.0, 51.0, 44.0, 52.0, 32.0, 45.0, 31.0, 38.0, 31.0, 30.0, 24.0, 34.0, 18.0, 22.0, 24.0, 21.0, 13.0, 10.0, 5.0, 11.0, 8.0, 3.0, 2.0, 3.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.825133323669434, -6.605824947357178, -6.386516094207764, -6.167207717895508, -5.947899341583252, -5.728590488433838, -5.509282112121582, -5.289973258972168, -5.070664882659912, -4.851356506347656, -4.632047653198242, -4.412739276885986, -4.1934309005737305, -3.9741220474243164, -3.7548136711120605, -3.5355050563812256, -3.3161966800689697, -3.0968880653381348, -2.877579689025879, -2.658271074295044, -2.438962459564209, -2.219654083251953, -2.000345468521118, -1.7810368537902832, -1.5617283582687378, -1.3424198627471924, -1.1231112480163574, -0.903802752494812, -0.6844941973686218, -0.46518564224243164, -0.24587714672088623, -0.02656853199005127, 0.19273996353149414, 0.4120485186576843, 0.6313570737838745, 0.8506655693054199, 1.0699741840362549, 1.2892826795578003, 1.5085911750793457, 1.7278997898101807, 1.947208285331726, 2.1665167808532715, 2.3858253955841064, 2.6051340103149414, 2.8244423866271973, 3.0437510013580322, 3.263059616088867, 3.482367992401123, 3.701676607131958, 3.920985221862793, 4.140293598175049, 4.359601974487305, 4.578910827636719, 4.798219203948975, 5.0175275802612305, 5.2368364334106445, 5.4561448097229, 5.675453186035156, 5.89476203918457, 6.114070415496826, 6.333378791809082, 6.552687644958496, 6.771996021270752, 6.991304397583008, 7.210613250732422]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 3.0, 12.0, 16.0, 20.0, 29.0, 43.0, 81.0, 130.0, 199.0, 316.0, 460.0, 847.0, 1389.0, 2289.0, 3651.0, 6163.0, 10396.0, 17873.0, 30208.0, 51124.0, 81780.0, 122823.0, 157905.0, 165948.0, 139999.0, 99222.0, 62732.0, 38128.0, 22004.0, 13279.0, 7771.0, 4601.0, 2796.0, 1667.0, 972.0, 624.0, 413.0, 258.0, 141.0, 94.0, 58.0, 37.0, 19.0, 18.0, 8.0, 8.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-5.82421875, -5.65399169921875, -5.4837646484375, -5.31353759765625, -5.143310546875, -4.97308349609375, -4.8028564453125, -4.63262939453125, -4.46240234375, -4.29217529296875, -4.1219482421875, -3.95172119140625, -3.781494140625, -3.61126708984375, -3.4410400390625, -3.27081298828125, -3.1005859375, -2.93035888671875, -2.7601318359375, -2.58990478515625, -2.419677734375, -2.24945068359375, -2.0792236328125, -1.90899658203125, -1.73876953125, -1.56854248046875, -1.3983154296875, -1.22808837890625, -1.057861328125, -0.88763427734375, -0.7174072265625, -0.54718017578125, -0.376953125, -0.20672607421875, -0.0364990234375, 0.13372802734375, 0.303955078125, 0.47418212890625, 0.6444091796875, 0.81463623046875, 0.98486328125, 1.15509033203125, 1.3253173828125, 1.49554443359375, 1.665771484375, 1.83599853515625, 2.0062255859375, 2.17645263671875, 2.3466796875, 2.51690673828125, 2.6871337890625, 2.85736083984375, 3.027587890625, 3.19781494140625, 3.3680419921875, 3.53826904296875, 3.70849609375, 3.87872314453125, 4.0489501953125, 4.21917724609375, 4.389404296875, 4.55963134765625, 4.7298583984375, 4.90008544921875, 5.0703125]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 5.0, 9.0, 5.0, 8.0, 13.0, 7.0, 16.0, 10.0, 17.0, 20.0, 24.0, 24.0, 24.0, 40.0, 48.0, 37.0, 33.0, 49.0, 44.0, 57.0, 42.0, 46.0, 46.0, 49.0, 28.0, 35.0, 36.0, 34.0, 32.0, 26.0, 31.0, 20.0, 15.0, 17.0, 15.0, 10.0, 7.0, 7.0, 4.0, 8.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-8.46875, -8.23675537109375, -8.0047607421875, -7.77276611328125, -7.540771484375, -7.30877685546875, -7.0767822265625, -6.84478759765625, -6.61279296875, -6.38079833984375, -6.1488037109375, -5.91680908203125, -5.684814453125, -5.45281982421875, -5.2208251953125, -4.98883056640625, -4.7568359375, -4.52484130859375, -4.2928466796875, -4.06085205078125, -3.828857421875, -3.59686279296875, -3.3648681640625, -3.13287353515625, -2.90087890625, -2.66888427734375, -2.4368896484375, -2.20489501953125, -1.972900390625, -1.74090576171875, -1.5089111328125, -1.27691650390625, -1.044921875, -0.81292724609375, -0.5809326171875, -0.34893798828125, -0.116943359375, 0.11505126953125, 0.3470458984375, 0.57904052734375, 0.81103515625, 1.04302978515625, 1.2750244140625, 1.50701904296875, 1.739013671875, 1.97100830078125, 2.2030029296875, 2.43499755859375, 2.6669921875, 2.89898681640625, 3.1309814453125, 3.36297607421875, 3.594970703125, 3.82696533203125, 4.0589599609375, 4.29095458984375, 4.52294921875, 4.75494384765625, 4.9869384765625, 5.21893310546875, 5.450927734375, 5.68292236328125, 5.9149169921875, 6.14691162109375, 6.37890625]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 4.0, 15.0, 16.0, 22.0, 37.0, 55.0, 74.0, 119.0, 199.0, 299.0, 377.0, 662.0, 1035.0, 1568.0, 2568.0, 4052.0, 6390.0, 10492.0, 17210.0, 27028.0, 42200.0, 64085.0, 92390.0, 121451.0, 141996.0, 139993.0, 117888.0, 87639.0, 60605.0, 40264.0, 25361.0, 16016.0, 10034.0, 5968.0, 3798.0, 2303.0, 1552.0, 952.0, 618.0, 412.0, 260.0, 185.0, 122.0, 82.0, 56.0, 36.0, 31.0, 14.0, 7.0, 6.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0], "bins": [-4.66015625, -4.51422119140625, -4.3682861328125, -4.22235107421875, -4.076416015625, -3.93048095703125, -3.7845458984375, -3.63861083984375, -3.49267578125, -3.34674072265625, -3.2008056640625, -3.05487060546875, -2.908935546875, -2.76300048828125, -2.6170654296875, -2.47113037109375, -2.3251953125, -2.17926025390625, -2.0333251953125, -1.88739013671875, -1.741455078125, -1.59552001953125, -1.4495849609375, -1.30364990234375, -1.15771484375, -1.01177978515625, -0.8658447265625, -0.71990966796875, -0.573974609375, -0.42803955078125, -0.2821044921875, -0.13616943359375, 0.009765625, 0.15570068359375, 0.3016357421875, 0.44757080078125, 0.593505859375, 0.73944091796875, 0.8853759765625, 1.03131103515625, 1.17724609375, 1.32318115234375, 1.4691162109375, 1.61505126953125, 1.760986328125, 1.90692138671875, 2.0528564453125, 2.19879150390625, 2.3447265625, 2.49066162109375, 2.6365966796875, 2.78253173828125, 2.928466796875, 3.07440185546875, 3.2203369140625, 3.36627197265625, 3.51220703125, 3.65814208984375, 3.8040771484375, 3.95001220703125, 4.095947265625, 4.24188232421875, 4.3878173828125, 4.53375244140625, 4.6796875]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 4.0, 4.0, 6.0, 9.0, 15.0, 11.0, 13.0, 25.0, 17.0, 26.0, 27.0, 30.0, 25.0, 40.0, 33.0, 27.0, 43.0, 45.0, 36.0, 29.0, 37.0, 27.0, 34.0, 38.0, 48.0, 30.0, 42.0, 33.0, 27.0, 31.0, 23.0, 20.0, 15.0, 18.0, 24.0, 13.0, 14.0, 17.0, 6.0, 5.0, 11.0, 7.0, 7.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.431640625, -3.311309814453125, -3.19097900390625, -3.070648193359375, -2.9503173828125, -2.829986572265625, -2.70965576171875, -2.589324951171875, -2.468994140625, -2.348663330078125, -2.22833251953125, -2.108001708984375, -1.9876708984375, -1.867340087890625, -1.74700927734375, -1.626678466796875, -1.50634765625, -1.386016845703125, -1.26568603515625, -1.145355224609375, -1.0250244140625, -0.904693603515625, -0.78436279296875, -0.664031982421875, -0.543701171875, -0.423370361328125, -0.30303955078125, -0.182708740234375, -0.0623779296875, 0.057952880859375, 0.17828369140625, 0.298614501953125, 0.4189453125, 0.539276123046875, 0.65960693359375, 0.779937744140625, 0.9002685546875, 1.020599365234375, 1.14093017578125, 1.261260986328125, 1.381591796875, 1.501922607421875, 1.62225341796875, 1.742584228515625, 1.8629150390625, 1.983245849609375, 2.10357666015625, 2.223907470703125, 2.34423828125, 2.464569091796875, 2.58489990234375, 2.705230712890625, 2.8255615234375, 2.945892333984375, 3.06622314453125, 3.186553955078125, 3.306884765625, 3.427215576171875, 3.54754638671875, 3.667877197265625, 3.7882080078125, 3.908538818359375, 4.02886962890625, 4.149200439453125, 4.26953125]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 10.0, 10.0, 12.0, 14.0, 18.0, 44.0, 48.0, 60.0, 110.0, 122.0, 200.0, 313.0, 404.0, 670.0, 977.0, 1463.0, 2255.0, 3521.0, 5378.0, 8587.0, 13105.0, 20606.0, 32500.0, 50658.0, 76570.0, 110902.0, 144678.0, 155149.0, 133865.0, 97936.0, 66961.0, 43644.0, 27844.0, 17990.0, 11286.0, 7073.0, 4775.0, 2984.0, 2011.0, 1212.0, 819.0, 576.0, 382.0, 257.0, 166.0, 126.0, 85.0, 63.0, 37.0, 24.0, 23.0, 14.0, 11.0, 6.0, 1.0, 6.0, 2.0, 3.0, 2.0], "bins": [-1.638671875, -1.587982177734375, -1.53729248046875, -1.486602783203125, -1.4359130859375, -1.385223388671875, -1.33453369140625, -1.283843994140625, -1.233154296875, -1.182464599609375, -1.13177490234375, -1.081085205078125, -1.0303955078125, -0.979705810546875, -0.92901611328125, -0.878326416015625, -0.82763671875, -0.776947021484375, -0.72625732421875, -0.675567626953125, -0.6248779296875, -0.574188232421875, -0.52349853515625, -0.472808837890625, -0.422119140625, -0.371429443359375, -0.32073974609375, -0.270050048828125, -0.2193603515625, -0.168670654296875, -0.11798095703125, -0.067291259765625, -0.0166015625, 0.034088134765625, 0.08477783203125, 0.135467529296875, 0.1861572265625, 0.236846923828125, 0.28753662109375, 0.338226318359375, 0.388916015625, 0.439605712890625, 0.49029541015625, 0.540985107421875, 0.5916748046875, 0.642364501953125, 0.69305419921875, 0.743743896484375, 0.79443359375, 0.845123291015625, 0.89581298828125, 0.946502685546875, 0.9971923828125, 1.047882080078125, 1.09857177734375, 1.149261474609375, 1.199951171875, 1.250640869140625, 1.30133056640625, 1.352020263671875, 1.4027099609375, 1.453399658203125, 1.50408935546875, 1.554779052734375, 1.60546875]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 5.0, 6.0, 5.0, 9.0, 9.0, 14.0, 18.0, 24.0, 28.0, 36.0, 35.0, 48.0, 49.0, 49.0, 56.0, 53.0, 71.0, 64.0, 74.0, 59.0, 52.0, 34.0, 35.0, 31.0, 26.0, 22.0, 22.0, 19.0, 14.0, 9.0, 8.0, 7.0, 5.0, 3.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00016558170318603516, -0.00016101635992527008, -0.000156451016664505, -0.00015188567340373993, -0.00014732033014297485, -0.00014275498688220978, -0.0001381896436214447, -0.00013362430036067963, -0.00012905895709991455, -0.00012449361383914948, -0.0001199282705783844, -0.00011536292731761932, -0.00011079758405685425, -0.00010623224079608917, -0.0001016668975353241, -9.710155427455902e-05, -9.253621101379395e-05, -8.797086775302887e-05, -8.34055244922638e-05, -7.884018123149872e-05, -7.427483797073364e-05, -6.970949470996857e-05, -6.514415144920349e-05, -6.0578808188438416e-05, -5.601346492767334e-05, -5.1448121666908264e-05, -4.688277840614319e-05, -4.231743514537811e-05, -3.775209188461304e-05, -3.318674862384796e-05, -2.8621405363082886e-05, -2.405606210231781e-05, -1.9490718841552734e-05, -1.4925375580787659e-05, -1.0360032320022583e-05, -5.794689059257507e-06, -1.2293457984924316e-06, 3.335997462272644e-06, 7.90134072303772e-06, 1.2466683983802795e-05, 1.703202724456787e-05, 2.1597370505332947e-05, 2.6162713766098022e-05, 3.07280570268631e-05, 3.5293400287628174e-05, 3.985874354839325e-05, 4.4424086809158325e-05, 4.89894300699234e-05, 5.3554773330688477e-05, 5.812011659145355e-05, 6.268545985221863e-05, 6.72508031129837e-05, 7.181614637374878e-05, 7.638148963451385e-05, 8.094683289527893e-05, 8.5512176156044e-05, 9.007751941680908e-05, 9.464286267757416e-05, 9.920820593833923e-05, 0.00010377354919910431, 0.00010833889245986938, 0.00011290423572063446, 0.00011746957898139954, 0.00012203492224216461, 0.0001266002655029297]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 7.0, 14.0, 8.0, 17.0, 26.0, 32.0, 48.0, 74.0, 117.0, 200.0, 299.0, 457.0, 806.0, 1295.0, 2235.0, 3728.0, 6515.0, 11399.0, 20317.0, 36263.0, 62654.0, 106245.0, 161758.0, 195630.0, 167849.0, 113055.0, 67606.0, 38793.0, 21715.0, 12371.0, 7000.0, 3920.0, 2407.0, 1400.0, 862.0, 516.0, 336.0, 214.0, 132.0, 88.0, 55.0, 35.0, 14.0, 22.0, 12.0, 7.0, 6.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.052734375, -1.987701416015625, -1.92266845703125, -1.857635498046875, -1.7926025390625, -1.727569580078125, -1.66253662109375, -1.597503662109375, -1.532470703125, -1.467437744140625, -1.40240478515625, -1.337371826171875, -1.2723388671875, -1.207305908203125, -1.14227294921875, -1.077239990234375, -1.01220703125, -0.947174072265625, -0.88214111328125, -0.817108154296875, -0.7520751953125, -0.687042236328125, -0.62200927734375, -0.556976318359375, -0.491943359375, -0.426910400390625, -0.36187744140625, -0.296844482421875, -0.2318115234375, -0.166778564453125, -0.10174560546875, -0.036712646484375, 0.0283203125, 0.093353271484375, 0.15838623046875, 0.223419189453125, 0.2884521484375, 0.353485107421875, 0.41851806640625, 0.483551025390625, 0.548583984375, 0.613616943359375, 0.67864990234375, 0.743682861328125, 0.8087158203125, 0.873748779296875, 0.93878173828125, 1.003814697265625, 1.06884765625, 1.133880615234375, 1.19891357421875, 1.263946533203125, 1.3289794921875, 1.394012451171875, 1.45904541015625, 1.524078369140625, 1.589111328125, 1.654144287109375, 1.71917724609375, 1.784210205078125, 1.8492431640625, 1.914276123046875, 1.97930908203125, 2.044342041015625, 2.109375]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 8.0, 7.0, 4.0, 11.0, 10.0, 15.0, 29.0, 22.0, 29.0, 49.0, 41.0, 46.0, 58.0, 62.0, 60.0, 67.0, 60.0, 65.0, 73.0, 51.0, 55.0, 32.0, 35.0, 31.0, 17.0, 11.0, 8.0, 6.0, 12.0, 9.0, 5.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7939453125, -0.7631378173828125, -0.732330322265625, -0.7015228271484375, -0.67071533203125, -0.6399078369140625, -0.609100341796875, -0.5782928466796875, -0.5474853515625, -0.5166778564453125, -0.485870361328125, -0.4550628662109375, -0.42425537109375, -0.3934478759765625, -0.362640380859375, -0.3318328857421875, -0.301025390625, -0.2702178955078125, -0.239410400390625, -0.2086029052734375, -0.17779541015625, -0.1469879150390625, -0.116180419921875, -0.0853729248046875, -0.0545654296875, -0.0237579345703125, 0.007049560546875, 0.0378570556640625, 0.06866455078125, 0.0994720458984375, 0.130279541015625, 0.1610870361328125, 0.19189453125, 0.2227020263671875, 0.253509521484375, 0.2843170166015625, 0.31512451171875, 0.3459320068359375, 0.376739501953125, 0.4075469970703125, 0.4383544921875, 0.4691619873046875, 0.499969482421875, 0.5307769775390625, 0.56158447265625, 0.5923919677734375, 0.623199462890625, 0.6540069580078125, 0.684814453125, 0.7156219482421875, 0.746429443359375, 0.7772369384765625, 0.80804443359375, 0.8388519287109375, 0.869659423828125, 0.9004669189453125, 0.9312744140625, 0.9620819091796875, 0.992889404296875, 1.0236968994140625, 1.05450439453125, 1.0853118896484375, 1.116119384765625, 1.1469268798828125, 1.177734375]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 7.0, 9.0, 13.0, 20.0, 28.0, 38.0, 45.0, 40.0, 72.0, 72.0, 97.0, 108.0, 96.0, 70.0, 70.0, 59.0, 35.0, 30.0, 31.0, 13.0, 17.0, 6.0, 8.0, 9.0, 2.0, 3.0, 0.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.441414833068848, -9.121736526489258, -8.802057266235352, -8.482378959655762, -8.162699699401855, -7.843021392822266, -7.523342609405518, -7.2036638259887695, -6.8839850425720215, -6.564306259155273, -6.244627475738525, -5.924948692321777, -5.6052703857421875, -5.285591125488281, -4.965912818908691, -4.646234035491943, -4.326555252075195, -4.006876468658447, -3.687197685241699, -3.3675191402435303, -3.0478403568267822, -2.728161573410034, -2.4084830284118652, -2.088804244995117, -1.7691254615783691, -1.449446678161621, -1.1297680139541626, -0.8100892901420593, -0.49041056632995605, -0.170731782913208, 0.1489468812942505, 0.468625545501709, 0.788304328918457, 1.107983112335205, 1.4276617765426636, 1.747340440750122, 2.06701922416687, 2.386698007583618, 2.706376552581787, 3.026055335998535, 3.345734119415283, 3.6654129028320312, 3.9850916862487793, 4.304770469665527, 4.624448776245117, 4.944128036499023, 5.263806343078613, 5.583485126495361, 5.903163909912109, 6.222842693328857, 6.5425214767456055, 6.8622002601623535, 7.181879043579102, 7.501557350158691, 7.8212361335754395, 8.140914916992188, 8.460594177246094, 8.780272483825684, 9.09995174407959, 9.41963005065918, 9.739309310913086, 10.058987617492676, 10.378666877746582, 10.698345184326172, 11.018023490905762]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 5.0, 7.0, 4.0, 6.0, 4.0, 8.0, 10.0, 9.0, 11.0, 17.0, 19.0, 20.0, 16.0, 32.0, 40.0, 25.0, 33.0, 46.0, 25.0, 46.0, 46.0, 34.0, 59.0, 50.0, 36.0, 34.0, 40.0, 33.0, 27.0, 22.0, 29.0, 28.0, 34.0, 23.0, 21.0, 21.0, 20.0, 11.0, 11.0, 7.0, 10.0, 6.0, 3.0, 7.0, 2.0, 4.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-7.004836082458496, -6.7925920486450195, -6.580348491668701, -6.368104457855225, -6.155860900878906, -5.94361686706543, -5.731372833251953, -5.519128799438477, -5.306885242462158, -5.094641208648682, -4.882397651672363, -4.670153617858887, -4.45790958404541, -4.245666027069092, -4.033421993255615, -3.8211781978607178, -3.6089344024658203, -3.396690607070923, -3.1844468116760254, -2.972202777862549, -2.7599589824676514, -2.547715187072754, -2.3354711532592773, -2.12322735786438, -1.9109835624694824, -1.698739767074585, -1.486495852470398, -1.274251937866211, -1.0620081424713135, -0.849764347076416, -0.637520432472229, -0.425276517868042, -0.21303319931030273, -0.000789344310760498, 0.21145451068878174, 0.423698365688324, 0.6359422206878662, 0.8481860160827637, 1.0604299306869507, 1.2726738452911377, 1.4849176406860352, 1.6971614360809326, 1.9094053506851196, 2.1216492652893066, 2.333893060684204, 2.5461368560791016, 2.758380889892578, 2.9706246852874756, 3.182868480682373, 3.3951122760772705, 3.607356071472168, 3.8196001052856445, 4.031844139099121, 4.2440876960754395, 4.456331729888916, 4.668575286865234, 4.880819320678711, 5.0930633544921875, 5.305306911468506, 5.517550945281982, 5.729794502258301, 5.942038536071777, 6.154282569885254, 6.3665266036987305, 6.578770160675049]}, "gradients/decoder.bert.encoder.layer.11.output.dense.weight": {"_type": "histogram", "values": [3.0, 4.0, 6.0, 6.0, 8.0, 23.0, 19.0, 44.0, 41.0, 68.0, 99.0, 166.0, 219.0, 366.0, 545.0, 816.0, 1258.0, 1968.0, 2985.0, 4646.0, 7594.0, 12129.0, 20155.0, 33241.0, 58764.0, 104438.0, 191769.0, 356992.0, 635013.0, 886222.0, 788571.0, 486219.0, 264495.0, 143141.0, 78973.0, 44413.0, 26519.0, 15442.0, 9741.0, 6058.0, 3893.0, 2525.0, 1616.0, 1046.0, 701.0, 433.0, 297.0, 203.0, 132.0, 97.0, 72.0, 31.0, 21.0, 19.0, 12.0, 8.0, 3.0, 6.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-5.59375, -5.40582275390625, -5.2178955078125, -5.02996826171875, -4.842041015625, -4.65411376953125, -4.4661865234375, -4.27825927734375, -4.09033203125, -3.90240478515625, -3.7144775390625, -3.52655029296875, -3.338623046875, -3.15069580078125, -2.9627685546875, -2.77484130859375, -2.5869140625, -2.39898681640625, -2.2110595703125, -2.02313232421875, -1.835205078125, -1.64727783203125, -1.4593505859375, -1.27142333984375, -1.08349609375, -0.89556884765625, -0.7076416015625, -0.51971435546875, -0.331787109375, -0.14385986328125, 0.0440673828125, 0.23199462890625, 0.419921875, 0.60784912109375, 0.7957763671875, 0.98370361328125, 1.171630859375, 1.35955810546875, 1.5474853515625, 1.73541259765625, 1.92333984375, 2.11126708984375, 2.2991943359375, 2.48712158203125, 2.675048828125, 2.86297607421875, 3.0509033203125, 3.23883056640625, 3.4267578125, 3.61468505859375, 3.8026123046875, 3.99053955078125, 4.178466796875, 4.36639404296875, 4.5543212890625, 4.74224853515625, 4.93017578125, 5.11810302734375, 5.3060302734375, 5.49395751953125, 5.681884765625, 5.86981201171875, 6.0577392578125, 6.24566650390625, 6.43359375]}, "gradients/decoder.bert.encoder.layer.11.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 3.0, 6.0, 6.0, 7.0, 7.0, 8.0, 12.0, 9.0, 24.0, 18.0, 23.0, 20.0, 20.0, 37.0, 31.0, 44.0, 35.0, 38.0, 40.0, 38.0, 51.0, 38.0, 45.0, 44.0, 48.0, 26.0, 35.0, 37.0, 31.0, 31.0, 24.0, 22.0, 23.0, 29.0, 14.0, 15.0, 13.0, 10.0, 8.0, 9.0, 5.0, 2.0, 8.0, 0.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.47265625, -4.3275146484375, -4.182373046875, -4.0372314453125, -3.89208984375, -3.7469482421875, -3.601806640625, -3.4566650390625, -3.3115234375, -3.1663818359375, -3.021240234375, -2.8760986328125, -2.73095703125, -2.5858154296875, -2.440673828125, -2.2955322265625, -2.150390625, -2.0052490234375, -1.860107421875, -1.7149658203125, -1.56982421875, -1.4246826171875, -1.279541015625, -1.1343994140625, -0.9892578125, -0.8441162109375, -0.698974609375, -0.5538330078125, -0.40869140625, -0.2635498046875, -0.118408203125, 0.0267333984375, 0.171875, 0.3170166015625, 0.462158203125, 0.6072998046875, 0.75244140625, 0.8975830078125, 1.042724609375, 1.1878662109375, 1.3330078125, 1.4781494140625, 1.623291015625, 1.7684326171875, 1.91357421875, 2.0587158203125, 2.203857421875, 2.3489990234375, 2.494140625, 2.6392822265625, 2.784423828125, 2.9295654296875, 3.07470703125, 3.2198486328125, 3.364990234375, 3.5101318359375, 3.6552734375, 3.8004150390625, 3.945556640625, 4.0906982421875, 4.23583984375, 4.3809814453125, 4.526123046875, 4.6712646484375, 4.81640625]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 1.0, 12.0, 8.0, 16.0, 20.0, 48.0, 45.0, 93.0, 156.0, 243.0, 332.0, 603.0, 969.0, 1599.0, 2671.0, 4435.0, 7278.0, 12691.0, 22127.0, 39570.0, 71558.0, 130718.0, 242059.0, 433227.0, 688048.0, 836963.0, 700432.0, 444459.0, 249643.0, 135253.0, 73906.0, 40554.0, 22500.0, 12975.0, 7793.0, 4374.0, 2642.0, 1605.0, 951.0, 629.0, 392.0, 265.0, 160.0, 95.0, 59.0, 46.0, 24.0, 14.0, 13.0, 11.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.2578125, -5.073486328125, -4.88916015625, -4.704833984375, -4.5205078125, -4.336181640625, -4.15185546875, -3.967529296875, -3.783203125, -3.598876953125, -3.41455078125, -3.230224609375, -3.0458984375, -2.861572265625, -2.67724609375, -2.492919921875, -2.30859375, -2.124267578125, -1.93994140625, -1.755615234375, -1.5712890625, -1.386962890625, -1.20263671875, -1.018310546875, -0.833984375, -0.649658203125, -0.46533203125, -0.281005859375, -0.0966796875, 0.087646484375, 0.27197265625, 0.456298828125, 0.640625, 0.824951171875, 1.00927734375, 1.193603515625, 1.3779296875, 1.562255859375, 1.74658203125, 1.930908203125, 2.115234375, 2.299560546875, 2.48388671875, 2.668212890625, 2.8525390625, 3.036865234375, 3.22119140625, 3.405517578125, 3.58984375, 3.774169921875, 3.95849609375, 4.142822265625, 4.3271484375, 4.511474609375, 4.69580078125, 4.880126953125, 5.064453125, 5.248779296875, 5.43310546875, 5.617431640625, 5.8017578125, 5.986083984375, 6.17041015625, 6.354736328125, 6.5390625]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 3.0, 6.0, 4.0, 5.0, 5.0, 18.0, 14.0, 23.0, 34.0, 45.0, 55.0, 72.0, 76.0, 125.0, 121.0, 169.0, 181.0, 204.0, 252.0, 241.0, 265.0, 284.0, 238.0, 256.0, 197.0, 221.0, 180.0, 148.0, 121.0, 99.0, 85.0, 64.0, 64.0, 53.0, 30.0, 27.0, 19.0, 19.0, 9.0, 11.0, 15.0, 6.0, 9.0, 5.0, 3.0, 1.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.982421875, -1.9027099609375, -1.822998046875, -1.7432861328125, -1.66357421875, -1.5838623046875, -1.504150390625, -1.4244384765625, -1.3447265625, -1.2650146484375, -1.185302734375, -1.1055908203125, -1.02587890625, -0.9461669921875, -0.866455078125, -0.7867431640625, -0.70703125, -0.6273193359375, -0.547607421875, -0.4678955078125, -0.38818359375, -0.3084716796875, -0.228759765625, -0.1490478515625, -0.0693359375, 0.0103759765625, 0.090087890625, 0.1697998046875, 0.24951171875, 0.3292236328125, 0.408935546875, 0.4886474609375, 0.568359375, 0.6480712890625, 0.727783203125, 0.8074951171875, 0.88720703125, 0.9669189453125, 1.046630859375, 1.1263427734375, 1.2060546875, 1.2857666015625, 1.365478515625, 1.4451904296875, 1.52490234375, 1.6046142578125, 1.684326171875, 1.7640380859375, 1.84375, 1.9234619140625, 2.003173828125, 2.0828857421875, 2.16259765625, 2.2423095703125, 2.322021484375, 2.4017333984375, 2.4814453125, 2.5611572265625, 2.640869140625, 2.7205810546875, 2.80029296875, 2.8800048828125, 2.959716796875, 3.0394287109375, 3.119140625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 6.0, 8.0, 2.0, 7.0, 9.0, 16.0, 24.0, 30.0, 32.0, 45.0, 51.0, 70.0, 101.0, 88.0, 90.0, 88.0, 63.0, 66.0, 47.0, 35.0, 28.0, 21.0, 15.0, 11.0, 7.0, 15.0, 5.0, 6.0, 7.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.222775459289551, -6.947085380554199, -6.6713948249816895, -6.395704746246338, -6.120014190673828, -5.844324111938477, -5.568634033203125, -5.292943477630615, -5.0172529220581055, -4.741562843322754, -4.465872287750244, -4.190182209014893, -3.914491653442383, -3.6388015747070312, -3.3631112575531006, -3.08742094039917, -2.8117308616638184, -2.5360405445098877, -2.260350227355957, -1.984660029411316, -1.7089697122573853, -1.4332793951034546, -1.1575891971588135, -0.8818988800048828, -0.6062085628509521, -0.33051827549934387, -0.054827988147735596, 0.2208622694015503, 0.49655258655548096, 0.7722429037094116, 1.0479331016540527, 1.3236234188079834, 1.599313735961914, 1.8750040531158447, 2.1506943702697754, 2.426384449005127, 2.7020750045776367, 2.9777650833129883, 3.253455400466919, 3.5291457176208496, 3.8048360347747803, 4.080526351928711, 4.3562164306640625, 4.631906986236572, 4.907597064971924, 5.183287620544434, 5.458977699279785, 5.734667778015137, 6.0103583335876465, 6.286048412322998, 6.561738967895508, 6.837429046630859, 7.113119602203369, 7.388809680938721, 7.6645002365112305, 7.940190315246582, 8.215880393981934, 8.491570472717285, 8.767260551452637, 9.042951583862305, 9.318641662597656, 9.594331741333008, 9.87002182006836, 10.145711898803711, 10.421402931213379]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 6.0, 4.0, 7.0, 4.0, 7.0, 7.0, 13.0, 13.0, 14.0, 17.0, 18.0, 24.0, 14.0, 26.0, 23.0, 36.0, 28.0, 34.0, 48.0, 36.0, 35.0, 45.0, 40.0, 29.0, 32.0, 40.0, 49.0, 32.0, 29.0, 31.0, 29.0, 32.0, 33.0, 20.0, 19.0, 22.0, 15.0, 25.0, 11.0, 8.0, 4.0, 13.0, 7.0, 5.0, 10.0, 6.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0], "bins": [-5.9167046546936035, -5.733064651489258, -5.54942512512207, -5.365785121917725, -5.182145118713379, -4.998505592346191, -4.814865589141846, -4.6312255859375, -4.4475860595703125, -4.263946056365967, -4.080306529998779, -3.8966665267944336, -3.713026523590088, -3.5293867588043213, -3.3457469940185547, -3.162106990814209, -2.9784669876098633, -2.7948272228240967, -2.611187219619751, -2.4275474548339844, -2.2439074516296387, -2.060267686843872, -1.8766279220581055, -1.6929880380630493, -1.5093481540679932, -1.325708270072937, -1.1420683860778809, -0.9584286212921143, -0.7747887372970581, -0.591148853302002, -0.40750908851623535, -0.2238692045211792, -0.040228843688964844, 0.14341101050376892, 0.3270508646965027, 0.5106906890869141, 0.6943305730819702, 0.8779704570770264, 1.061610221862793, 1.2452501058578491, 1.4288899898529053, 1.6125298738479614, 1.7961697578430176, 1.9798095226287842, 2.163449287414551, 2.3470892906188965, 2.530729055404663, 2.7143688201904297, 2.8980088233947754, 3.081648588180542, 3.2652885913848877, 3.4489283561706543, 3.632568359375, 3.8162081241607666, 3.999847888946533, 4.183487892150879, 4.367127418518066, 4.550767421722412, 4.7344069480896, 4.918046951293945, 5.101686954498291, 5.285326957702637, 5.468966484069824, 5.65260648727417, 5.836246490478516]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 8.0, 12.0, 19.0, 21.0, 29.0, 56.0, 102.0, 133.0, 227.0, 328.0, 515.0, 768.0, 1291.0, 1904.0, 2775.0, 4354.0, 6534.0, 10545.0, 16333.0, 25607.0, 40087.0, 63366.0, 97170.0, 143923.0, 179220.0, 154075.0, 107084.0, 69320.0, 44143.0, 27965.0, 17768.0, 11578.0, 7401.0, 4862.0, 3162.0, 2074.0, 1319.0, 864.0, 577.0, 371.0, 247.0, 177.0, 92.0, 57.0, 40.0, 22.0, 16.0, 6.0, 9.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.78662109375, -0.7617340087890625, -0.736846923828125, -0.7119598388671875, -0.68707275390625, -0.6621856689453125, -0.637298583984375, -0.6124114990234375, -0.5875244140625, -0.5626373291015625, -0.537750244140625, -0.5128631591796875, -0.48797607421875, -0.4630889892578125, -0.438201904296875, -0.4133148193359375, -0.388427734375, -0.3635406494140625, -0.338653564453125, -0.3137664794921875, -0.28887939453125, -0.2639923095703125, -0.239105224609375, -0.2142181396484375, -0.1893310546875, -0.1644439697265625, -0.139556884765625, -0.1146697998046875, -0.08978271484375, -0.0648956298828125, -0.040008544921875, -0.0151214599609375, 0.009765625, 0.0346527099609375, 0.059539794921875, 0.0844268798828125, 0.10931396484375, 0.1342010498046875, 0.159088134765625, 0.1839752197265625, 0.2088623046875, 0.2337493896484375, 0.258636474609375, 0.2835235595703125, 0.30841064453125, 0.3332977294921875, 0.358184814453125, 0.3830718994140625, 0.407958984375, 0.4328460693359375, 0.457733154296875, 0.4826202392578125, 0.50750732421875, 0.5323944091796875, 0.557281494140625, 0.5821685791015625, 0.6070556640625, 0.6319427490234375, 0.656829833984375, 0.6817169189453125, 0.70660400390625, 0.7314910888671875, 0.756378173828125, 0.7812652587890625, 0.80615234375]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 3.0, 8.0, 5.0, 9.0, 4.0, 9.0, 13.0, 19.0, 13.0, 19.0, 16.0, 29.0, 22.0, 29.0, 30.0, 35.0, 49.0, 39.0, 44.0, 38.0, 39.0, 41.0, 42.0, 46.0, 37.0, 48.0, 28.0, 38.0, 33.0, 28.0, 29.0, 31.0, 23.0, 22.0, 15.0, 11.0, 14.0, 10.0, 8.0, 8.0, 8.0, 3.0, 5.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.87109375, -5.66607666015625, -5.4610595703125, -5.25604248046875, -5.051025390625, -4.84600830078125, -4.6409912109375, -4.43597412109375, -4.23095703125, -4.02593994140625, -3.8209228515625, -3.61590576171875, -3.410888671875, -3.20587158203125, -3.0008544921875, -2.79583740234375, -2.5908203125, -2.38580322265625, -2.1807861328125, -1.97576904296875, -1.770751953125, -1.56573486328125, -1.3607177734375, -1.15570068359375, -0.95068359375, -0.74566650390625, -0.5406494140625, -0.33563232421875, -0.130615234375, 0.07440185546875, 0.2794189453125, 0.48443603515625, 0.689453125, 0.89447021484375, 1.0994873046875, 1.30450439453125, 1.509521484375, 1.71453857421875, 1.9195556640625, 2.12457275390625, 2.32958984375, 2.53460693359375, 2.7396240234375, 2.94464111328125, 3.149658203125, 3.35467529296875, 3.5596923828125, 3.76470947265625, 3.9697265625, 4.17474365234375, 4.3797607421875, 4.58477783203125, 4.789794921875, 4.99481201171875, 5.1998291015625, 5.40484619140625, 5.60986328125, 5.81488037109375, 6.0198974609375, 6.22491455078125, 6.429931640625, 6.63494873046875, 6.8399658203125, 7.04498291015625, 7.25]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 6.0, 6.0, 7.0, 8.0, 15.0, 23.0, 26.0, 39.0, 68.0, 71.0, 140.0, 229.0, 302.0, 439.0, 762.0, 1178.0, 1824.0, 2906.0, 4750.0, 7615.0, 12487.0, 20252.0, 33347.0, 54630.0, 87453.0, 137498.0, 187027.0, 175289.0, 121717.0, 76265.0, 47158.0, 28824.0, 17703.0, 10872.0, 6660.0, 4101.0, 2566.0, 1565.0, 957.0, 605.0, 388.0, 259.0, 154.0, 114.0, 86.0, 47.0, 42.0, 20.0, 16.0, 18.0, 11.0, 8.0, 2.0, 5.0, 1.0, 3.0, 1.0, 3.0], "bins": [-0.9228515625, -0.8947601318359375, -0.866668701171875, -0.8385772705078125, -0.81048583984375, -0.7823944091796875, -0.754302978515625, -0.7262115478515625, -0.6981201171875, -0.6700286865234375, -0.641937255859375, -0.6138458251953125, -0.58575439453125, -0.5576629638671875, -0.529571533203125, -0.5014801025390625, -0.473388671875, -0.4452972412109375, -0.417205810546875, -0.3891143798828125, -0.36102294921875, -0.3329315185546875, -0.304840087890625, -0.2767486572265625, -0.2486572265625, -0.2205657958984375, -0.192474365234375, -0.1643829345703125, -0.13629150390625, -0.1082000732421875, -0.080108642578125, -0.0520172119140625, -0.02392578125, 0.0041656494140625, 0.032257080078125, 0.0603485107421875, 0.08843994140625, 0.1165313720703125, 0.144622802734375, 0.1727142333984375, 0.2008056640625, 0.2288970947265625, 0.256988525390625, 0.2850799560546875, 0.31317138671875, 0.3412628173828125, 0.369354248046875, 0.3974456787109375, 0.425537109375, 0.4536285400390625, 0.481719970703125, 0.5098114013671875, 0.53790283203125, 0.5659942626953125, 0.594085693359375, 0.6221771240234375, 0.6502685546875, 0.6783599853515625, 0.706451416015625, 0.7345428466796875, 0.76263427734375, 0.7907257080078125, 0.818817138671875, 0.8469085693359375, 0.875]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 7.0, 3.0, 6.0, 5.0, 13.0, 9.0, 21.0, 14.0, 11.0, 19.0, 23.0, 19.0, 21.0, 31.0, 29.0, 36.0, 29.0, 29.0, 53.0, 49.0, 38.0, 43.0, 38.0, 43.0, 43.0, 27.0, 46.0, 41.0, 32.0, 24.0, 26.0, 28.0, 20.0, 23.0, 21.0, 22.0, 9.0, 8.0, 9.0, 8.0, 5.0, 7.0, 4.0, 6.0, 4.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0], "bins": [-3.900390625, -3.7822265625, -3.6640625, -3.5458984375, -3.427734375, -3.3095703125, -3.19140625, -3.0732421875, -2.955078125, -2.8369140625, -2.71875, -2.6005859375, -2.482421875, -2.3642578125, -2.24609375, -2.1279296875, -2.009765625, -1.8916015625, -1.7734375, -1.6552734375, -1.537109375, -1.4189453125, -1.30078125, -1.1826171875, -1.064453125, -0.9462890625, -0.828125, -0.7099609375, -0.591796875, -0.4736328125, -0.35546875, -0.2373046875, -0.119140625, -0.0009765625, 0.1171875, 0.2353515625, 0.353515625, 0.4716796875, 0.58984375, 0.7080078125, 0.826171875, 0.9443359375, 1.0625, 1.1806640625, 1.298828125, 1.4169921875, 1.53515625, 1.6533203125, 1.771484375, 1.8896484375, 2.0078125, 2.1259765625, 2.244140625, 2.3623046875, 2.48046875, 2.5986328125, 2.716796875, 2.8349609375, 2.953125, 3.0712890625, 3.189453125, 3.3076171875, 3.42578125, 3.5439453125, 3.662109375]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 7.0, 10.0, 11.0, 18.0, 15.0, 26.0, 38.0, 39.0, 78.0, 108.0, 146.0, 220.0, 363.0, 514.0, 956.0, 1517.0, 2496.0, 4671.0, 8844.0, 18507.0, 41089.0, 100730.0, 283120.0, 356498.0, 131118.0, 51124.0, 22209.0, 10947.0, 5559.0, 2870.0, 1795.0, 1057.0, 659.0, 383.0, 283.0, 151.0, 110.0, 74.0, 55.0, 37.0, 30.0, 23.0, 18.0, 13.0, 8.0, 4.0, 6.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10546875, -0.10228538513183594, -0.09910202026367188, -0.09591865539550781, -0.09273529052734375, -0.08955192565917969, -0.08636856079101562, -0.08318519592285156, -0.0800018310546875, -0.07681846618652344, -0.07363510131835938, -0.07045173645019531, -0.06726837158203125, -0.06408500671386719, -0.060901641845703125, -0.05771827697753906, -0.054534912109375, -0.05135154724121094, -0.048168182373046875, -0.04498481750488281, -0.04180145263671875, -0.03861808776855469, -0.035434722900390625, -0.03225135803222656, -0.0290679931640625, -0.025884628295898438, -0.022701263427734375, -0.019517898559570312, -0.01633453369140625, -0.013151168823242188, -0.009967803955078125, -0.0067844390869140625, -0.00360107421875, -0.0004177093505859375, 0.002765655517578125, 0.0059490203857421875, 0.00913238525390625, 0.012315750122070312, 0.015499114990234375, 0.018682479858398438, 0.0218658447265625, 0.025049209594726562, 0.028232574462890625, 0.03141593933105469, 0.03459930419921875, 0.03778266906738281, 0.040966033935546875, 0.04414939880371094, 0.047332763671875, 0.05051612854003906, 0.053699493408203125, 0.05688285827636719, 0.06006622314453125, 0.06324958801269531, 0.06643295288085938, 0.06961631774902344, 0.0727996826171875, 0.07598304748535156, 0.07916641235351562, 0.08234977722167969, 0.08553314208984375, 0.08871650695800781, 0.09189987182617188, 0.09508323669433594, 0.0982666015625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 6.0, 7.0, 6.0, 6.0, 12.0, 6.0, 17.0, 17.0, 21.0, 40.0, 42.0, 56.0, 68.0, 100.0, 89.0, 71.0, 86.0, 76.0, 66.0, 40.0, 44.0, 21.0, 25.0, 22.0, 13.0, 8.0, 8.0, 6.0, 4.0, 3.0, 3.0, 3.0, 4.0, 2.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.6808509826660156e-05, -1.619383692741394e-05, -1.5579164028167725e-05, -1.4964491128921509e-05, -1.4349818229675293e-05, -1.3735145330429077e-05, -1.3120472431182861e-05, -1.2505799531936646e-05, -1.189112663269043e-05, -1.1276453733444214e-05, -1.0661780834197998e-05, -1.0047107934951782e-05, -9.432435035705566e-06, -8.81776213645935e-06, -8.203089237213135e-06, -7.588416337966919e-06, -6.973743438720703e-06, -6.359070539474487e-06, -5.7443976402282715e-06, -5.129724740982056e-06, -4.51505184173584e-06, -3.900378942489624e-06, -3.285706043243408e-06, -2.6710331439971924e-06, -2.0563602447509766e-06, -1.4416873455047607e-06, -8.270144462585449e-07, -2.123415470123291e-07, 4.023313522338867e-07, 1.0170042514801025e-06, 1.6316771507263184e-06, 2.246350049972534e-06, 2.86102294921875e-06, 3.475695848464966e-06, 4.090368747711182e-06, 4.7050416469573975e-06, 5.319714546203613e-06, 5.934387445449829e-06, 6.549060344696045e-06, 7.163733243942261e-06, 7.778406143188477e-06, 8.393079042434692e-06, 9.007751941680908e-06, 9.622424840927124e-06, 1.023709774017334e-05, 1.0851770639419556e-05, 1.1466443538665771e-05, 1.2081116437911987e-05, 1.2695789337158203e-05, 1.3310462236404419e-05, 1.3925135135650635e-05, 1.453980803489685e-05, 1.5154480934143066e-05, 1.5769153833389282e-05, 1.6383826732635498e-05, 1.6998499631881714e-05, 1.761317253112793e-05, 1.8227845430374146e-05, 1.884251832962036e-05, 1.9457191228866577e-05, 2.0071864128112793e-05, 2.068653702735901e-05, 2.1301209926605225e-05, 2.191588282585144e-05, 2.2530555725097656e-05]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 16.0, 12.0, 15.0, 25.0, 41.0, 61.0, 58.0, 78.0, 114.0, 150.0, 214.0, 330.0, 432.0, 594.0, 872.0, 1198.0, 1801.0, 2781.0, 4122.0, 6756.0, 11402.0, 20859.0, 42547.0, 99392.0, 260085.0, 339085.0, 136754.0, 55681.0, 26231.0, 13883.0, 8075.0, 4918.0, 3153.0, 2068.0, 1359.0, 1004.0, 693.0, 473.0, 315.0, 257.0, 198.0, 130.0, 93.0, 59.0, 39.0, 43.0, 33.0, 25.0, 12.0, 14.0, 6.0, 2.0, 6.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.11602783203125, -0.11242103576660156, -0.10881423950195312, -0.10520744323730469, -0.10160064697265625, -0.09799385070800781, -0.09438705444335938, -0.09078025817871094, -0.0871734619140625, -0.08356666564941406, -0.07995986938476562, -0.07635307312011719, -0.07274627685546875, -0.06913948059082031, -0.06553268432617188, -0.06192588806152344, -0.058319091796875, -0.05471229553222656, -0.051105499267578125, -0.04749870300292969, -0.04389190673828125, -0.04028511047363281, -0.036678314208984375, -0.03307151794433594, -0.0294647216796875, -0.025857925415039062, -0.022251129150390625, -0.018644332885742188, -0.01503753662109375, -0.011430740356445312, -0.007823944091796875, -0.0042171478271484375, -0.0006103515625, 0.0029964447021484375, 0.006603240966796875, 0.010210037231445312, 0.01381683349609375, 0.017423629760742188, 0.021030426025390625, 0.024637222290039062, 0.0282440185546875, 0.03185081481933594, 0.035457611083984375, 0.03906440734863281, 0.04267120361328125, 0.04627799987792969, 0.049884796142578125, 0.05349159240722656, 0.057098388671875, 0.06070518493652344, 0.06431198120117188, 0.06791877746582031, 0.07152557373046875, 0.07513236999511719, 0.07873916625976562, 0.08234596252441406, 0.0859527587890625, 0.08955955505371094, 0.09316635131835938, 0.09677314758300781, 0.10037994384765625, 0.10398674011230469, 0.10759353637695312, 0.11120033264160156, 0.11480712890625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 4.0, 6.0, 5.0, 2.0, 6.0, 11.0, 14.0, 11.0, 11.0, 7.0, 19.0, 18.0, 19.0, 30.0, 31.0, 38.0, 46.0, 52.0, 55.0, 54.0, 62.0, 51.0, 53.0, 56.0, 51.0, 41.0, 47.0, 33.0, 27.0, 16.0, 21.0, 21.0, 16.0, 15.0, 16.0, 6.0, 3.0, 6.0, 5.0, 5.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.0261688232421875, -0.025370121002197266, -0.02457141876220703, -0.023772716522216797, -0.022974014282226562, -0.022175312042236328, -0.021376609802246094, -0.02057790756225586, -0.019779205322265625, -0.01898050308227539, -0.018181800842285156, -0.017383098602294922, -0.016584396362304688, -0.015785694122314453, -0.014986991882324219, -0.014188289642333984, -0.01338958740234375, -0.012590885162353516, -0.011792182922363281, -0.010993480682373047, -0.010194778442382812, -0.009396076202392578, -0.008597373962402344, -0.007798671722412109, -0.006999969482421875, -0.006201267242431641, -0.005402565002441406, -0.004603862762451172, -0.0038051605224609375, -0.003006458282470703, -0.0022077560424804688, -0.0014090538024902344, -0.0006103515625, 0.00018835067749023438, 0.0009870529174804688, 0.0017857551574707031, 0.0025844573974609375, 0.003383159637451172, 0.004181861877441406, 0.004980564117431641, 0.005779266357421875, 0.006577968597412109, 0.007376670837402344, 0.008175373077392578, 0.008974075317382812, 0.009772777557373047, 0.010571479797363281, 0.011370182037353516, 0.01216888427734375, 0.012967586517333984, 0.013766288757324219, 0.014564990997314453, 0.015363693237304688, 0.016162395477294922, 0.016961097717285156, 0.01775979995727539, 0.018558502197265625, 0.01935720443725586, 0.020155906677246094, 0.020954608917236328, 0.021753311157226562, 0.022552013397216797, 0.02335071563720703, 0.024149417877197266, 0.0249481201171875]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 5.0, 5.0, 9.0, 2.0, 6.0, 13.0, 20.0, 21.0, 35.0, 36.0, 44.0, 56.0, 90.0, 86.0, 98.0, 82.0, 87.0, 66.0, 55.0, 46.0, 30.0, 25.0, 20.0, 12.0, 11.0, 8.0, 12.0, 4.0, 8.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 6.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.105227470397949, -6.830519676208496, -6.555811882019043, -6.28110408782959, -6.006396293640137, -5.731688499450684, -5.4569807052612305, -5.182272911071777, -4.907565116882324, -4.632857322692871, -4.358149528503418, -4.083441734313965, -3.8087339401245117, -3.5340261459350586, -3.2593183517456055, -2.9846105575561523, -2.709902763366699, -2.435194969177246, -2.160487174987793, -1.8857793807983398, -1.6110715866088867, -1.3363637924194336, -1.0616559982299805, -0.7869482040405273, -0.5122404098510742, -0.2375326156616211, 0.03717517852783203, 0.31188297271728516, 0.5865907669067383, 0.8612985610961914, 1.1360063552856445, 1.4107141494750977, 1.6854228973388672, 1.9601306915283203, 2.2348384857177734, 2.5095462799072266, 2.7842540740966797, 3.058961868286133, 3.333669662475586, 3.608377456665039, 3.883085250854492, 4.157793045043945, 4.432500839233398, 4.707208633422852, 4.981916427612305, 5.256624221801758, 5.531332015991211, 5.806039810180664, 6.080747604370117, 6.35545539855957, 6.630163192749023, 6.904870986938477, 7.17957878112793, 7.454286575317383, 7.728994369506836, 8.003702163696289, 8.278409957885742, 8.553117752075195, 8.827825546264648, 9.102533340454102, 9.377241134643555, 9.651948928833008, 9.926656723022461, 10.201364517211914, 10.476072311401367]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 6.0, 5.0, 6.0, 4.0, 6.0, 8.0, 13.0, 12.0, 16.0, 17.0, 17.0, 23.0, 15.0, 23.0, 27.0, 33.0, 30.0, 36.0, 45.0, 36.0, 37.0, 45.0, 38.0, 30.0, 33.0, 38.0, 50.0, 32.0, 30.0, 33.0, 26.0, 31.0, 36.0, 18.0, 21.0, 20.0, 16.0, 24.0, 12.0, 7.0, 4.0, 13.0, 8.0, 4.0, 10.0, 6.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 4.0, 0.0, 1.0], "bins": [-5.915374755859375, -5.7318434715271, -5.548312187194824, -5.364780426025391, -5.181249141693115, -4.99771785736084, -4.8141865730285645, -4.630655288696289, -4.4471235275268555, -4.26359224319458, -4.080060958862305, -3.89652943611145, -3.7129979133605957, -3.5294666290283203, -3.345935344696045, -3.1624040603637695, -2.978872776031494, -2.7953414916992188, -2.6118099689483643, -2.428278684616089, -2.2447471618652344, -2.061215877532959, -1.8776845932006836, -1.6941531896591187, -1.5106217861175537, -1.3270903825759888, -1.1435589790344238, -0.9600276947021484, -0.7764962911605835, -0.5929648876190186, -0.40943360328674316, -0.22590219974517822, -0.04237079620361328, 0.14116057753562927, 0.3246919512748718, 0.508223295211792, 0.6917546987533569, 0.8752861022949219, 1.0588173866271973, 1.2423487901687622, 1.4258801937103271, 1.609411597251892, 1.792943000793457, 1.9764742851257324, 2.160005569458008, 2.3435370922088623, 2.5270683765411377, 2.710599899291992, 2.8941311836242676, 3.077662467956543, 3.2611939907073975, 3.444725275039673, 3.6282567977905273, 3.8117880821228027, 3.995319366455078, 4.1788506507873535, 4.362381935119629, 4.545913219451904, 4.72944450378418, 4.912976264953613, 5.096507549285889, 5.280038833618164, 5.4635701179504395, 5.647101402282715, 5.830633163452148]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 5.0, 12.0, 12.0, 26.0, 33.0, 52.0, 82.0, 158.0, 252.0, 453.0, 696.0, 1294.0, 2324.0, 4292.0, 7657.0, 14018.0, 25950.0, 47416.0, 82903.0, 132855.0, 179591.0, 185627.0, 146822.0, 94111.0, 54756.0, 30360.0, 16458.0, 8993.0, 4967.0, 2736.0, 1562.0, 810.0, 520.0, 278.0, 169.0, 116.0, 80.0, 34.0, 28.0, 13.0, 14.0, 8.0, 6.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-6.39453125, -6.217529296875, -6.04052734375, -5.863525390625, -5.6865234375, -5.509521484375, -5.33251953125, -5.155517578125, -4.978515625, -4.801513671875, -4.62451171875, -4.447509765625, -4.2705078125, -4.093505859375, -3.91650390625, -3.739501953125, -3.5625, -3.385498046875, -3.20849609375, -3.031494140625, -2.8544921875, -2.677490234375, -2.50048828125, -2.323486328125, -2.146484375, -1.969482421875, -1.79248046875, -1.615478515625, -1.4384765625, -1.261474609375, -1.08447265625, -0.907470703125, -0.73046875, -0.553466796875, -0.37646484375, -0.199462890625, -0.0224609375, 0.154541015625, 0.33154296875, 0.508544921875, 0.685546875, 0.862548828125, 1.03955078125, 1.216552734375, 1.3935546875, 1.570556640625, 1.74755859375, 1.924560546875, 2.1015625, 2.278564453125, 2.45556640625, 2.632568359375, 2.8095703125, 2.986572265625, 3.16357421875, 3.340576171875, 3.517578125, 3.694580078125, 3.87158203125, 4.048583984375, 4.2255859375, 4.402587890625, 4.57958984375, 4.756591796875, 4.93359375]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 3.0, 8.0, 7.0, 11.0, 11.0, 12.0, 17.0, 18.0, 18.0, 22.0, 30.0, 33.0, 28.0, 40.0, 46.0, 42.0, 55.0, 46.0, 34.0, 38.0, 44.0, 42.0, 54.0, 40.0, 46.0, 33.0, 28.0, 31.0, 24.0, 22.0, 26.0, 14.0, 16.0, 12.0, 13.0, 9.0, 5.0, 9.0, 4.0, 3.0, 7.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.9765625, -6.7603759765625, -6.544189453125, -6.3280029296875, -6.11181640625, -5.8956298828125, -5.679443359375, -5.4632568359375, -5.2470703125, -5.0308837890625, -4.814697265625, -4.5985107421875, -4.38232421875, -4.1661376953125, -3.949951171875, -3.7337646484375, -3.517578125, -3.3013916015625, -3.085205078125, -2.8690185546875, -2.65283203125, -2.4366455078125, -2.220458984375, -2.0042724609375, -1.7880859375, -1.5718994140625, -1.355712890625, -1.1395263671875, -0.92333984375, -0.7071533203125, -0.490966796875, -0.2747802734375, -0.05859375, 0.1575927734375, 0.373779296875, 0.5899658203125, 0.80615234375, 1.0223388671875, 1.238525390625, 1.4547119140625, 1.6708984375, 1.8870849609375, 2.103271484375, 2.3194580078125, 2.53564453125, 2.7518310546875, 2.968017578125, 3.1842041015625, 3.400390625, 3.6165771484375, 3.832763671875, 4.0489501953125, 4.26513671875, 4.4813232421875, 4.697509765625, 4.9136962890625, 5.1298828125, 5.3460693359375, 5.562255859375, 5.7784423828125, 5.99462890625, 6.2108154296875, 6.427001953125, 6.6431884765625, 6.859375]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.weight": {"_type": "histogram", "values": [4.0, 2.0, 0.0, 4.0, 5.0, 5.0, 8.0, 17.0, 22.0, 26.0, 56.0, 96.0, 123.0, 201.0, 287.0, 453.0, 667.0, 967.0, 1522.0, 2325.0, 3639.0, 5479.0, 8316.0, 12701.0, 19893.0, 30923.0, 46584.0, 68164.0, 95014.0, 119973.0, 135203.0, 130590.0, 111051.0, 82971.0, 58478.0, 39251.0, 25812.0, 16645.0, 10758.0, 7001.0, 4643.0, 2915.0, 2061.0, 1254.0, 826.0, 563.0, 348.0, 253.0, 173.0, 97.0, 75.0, 57.0, 25.0, 15.0, 6.0, 15.0, 5.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.912109375, -3.785064697265625, -3.65802001953125, -3.530975341796875, -3.4039306640625, -3.276885986328125, -3.14984130859375, -3.022796630859375, -2.895751953125, -2.768707275390625, -2.64166259765625, -2.514617919921875, -2.3875732421875, -2.260528564453125, -2.13348388671875, -2.006439208984375, -1.87939453125, -1.752349853515625, -1.62530517578125, -1.498260498046875, -1.3712158203125, -1.244171142578125, -1.11712646484375, -0.990081787109375, -0.863037109375, -0.735992431640625, -0.60894775390625, -0.481903076171875, -0.3548583984375, -0.227813720703125, -0.10076904296875, 0.026275634765625, 0.1533203125, 0.280364990234375, 0.40740966796875, 0.534454345703125, 0.6614990234375, 0.788543701171875, 0.91558837890625, 1.042633056640625, 1.169677734375, 1.296722412109375, 1.42376708984375, 1.550811767578125, 1.6778564453125, 1.804901123046875, 1.93194580078125, 2.058990478515625, 2.18603515625, 2.313079833984375, 2.44012451171875, 2.567169189453125, 2.6942138671875, 2.821258544921875, 2.94830322265625, 3.075347900390625, 3.202392578125, 3.329437255859375, 3.45648193359375, 3.583526611328125, 3.7105712890625, 3.837615966796875, 3.96466064453125, 4.091705322265625, 4.21875]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 8.0, 6.0, 7.0, 6.0, 7.0, 8.0, 14.0, 16.0, 14.0, 21.0, 22.0, 29.0, 34.0, 30.0, 31.0, 31.0, 35.0, 34.0, 32.0, 50.0, 48.0, 45.0, 43.0, 41.0, 39.0, 35.0, 35.0, 29.0, 39.0, 23.0, 41.0, 26.0, 22.0, 16.0, 18.0, 8.0, 12.0, 10.0, 9.0, 8.0, 5.0, 6.0, 4.0, 2.0, 1.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.53515625, -3.419342041015625, -3.30352783203125, -3.187713623046875, -3.0718994140625, -2.956085205078125, -2.84027099609375, -2.724456787109375, -2.608642578125, -2.492828369140625, -2.37701416015625, -2.261199951171875, -2.1453857421875, -2.029571533203125, -1.91375732421875, -1.797943115234375, -1.68212890625, -1.566314697265625, -1.45050048828125, -1.334686279296875, -1.2188720703125, -1.103057861328125, -0.98724365234375, -0.871429443359375, -0.755615234375, -0.639801025390625, -0.52398681640625, -0.408172607421875, -0.2923583984375, -0.176544189453125, -0.06072998046875, 0.055084228515625, 0.1708984375, 0.286712646484375, 0.40252685546875, 0.518341064453125, 0.6341552734375, 0.749969482421875, 0.86578369140625, 0.981597900390625, 1.097412109375, 1.213226318359375, 1.32904052734375, 1.444854736328125, 1.5606689453125, 1.676483154296875, 1.79229736328125, 1.908111572265625, 2.02392578125, 2.139739990234375, 2.25555419921875, 2.371368408203125, 2.4871826171875, 2.602996826171875, 2.71881103515625, 2.834625244140625, 2.950439453125, 3.066253662109375, 3.18206787109375, 3.297882080078125, 3.4136962890625, 3.529510498046875, 3.64532470703125, 3.761138916015625, 3.876953125]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 9.0, 11.0, 10.0, 9.0, 25.0, 32.0, 41.0, 63.0, 62.0, 109.0, 158.0, 257.0, 408.0, 617.0, 1036.0, 1699.0, 3081.0, 5758.0, 11008.0, 22869.0, 50452.0, 109847.0, 213446.0, 270423.0, 184870.0, 91084.0, 41261.0, 19073.0, 9354.0, 4813.0, 2612.0, 1536.0, 894.0, 552.0, 349.0, 226.0, 151.0, 103.0, 79.0, 49.0, 27.0, 33.0, 22.0, 11.0, 9.0, 10.0, 8.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.697265625, -2.611297607421875, -2.52532958984375, -2.439361572265625, -2.3533935546875, -2.267425537109375, -2.18145751953125, -2.095489501953125, -2.009521484375, -1.923553466796875, -1.83758544921875, -1.751617431640625, -1.6656494140625, -1.579681396484375, -1.49371337890625, -1.407745361328125, -1.32177734375, -1.235809326171875, -1.14984130859375, -1.063873291015625, -0.9779052734375, -0.891937255859375, -0.80596923828125, -0.720001220703125, -0.634033203125, -0.548065185546875, -0.46209716796875, -0.376129150390625, -0.2901611328125, -0.204193115234375, -0.11822509765625, -0.032257080078125, 0.0537109375, 0.139678955078125, 0.22564697265625, 0.311614990234375, 0.3975830078125, 0.483551025390625, 0.56951904296875, 0.655487060546875, 0.741455078125, 0.827423095703125, 0.91339111328125, 0.999359130859375, 1.0853271484375, 1.171295166015625, 1.25726318359375, 1.343231201171875, 1.42919921875, 1.515167236328125, 1.60113525390625, 1.687103271484375, 1.7730712890625, 1.859039306640625, 1.94500732421875, 2.030975341796875, 2.116943359375, 2.202911376953125, 2.28887939453125, 2.374847412109375, 2.4608154296875, 2.546783447265625, 2.63275146484375, 2.718719482421875, 2.8046875]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 5.0, 7.0, 3.0, 9.0, 8.0, 12.0, 16.0, 12.0, 28.0, 32.0, 29.0, 50.0, 38.0, 34.0, 55.0, 59.0, 68.0, 60.0, 52.0, 59.0, 57.0, 59.0, 52.0, 30.0, 30.0, 30.0, 19.0, 15.0, 15.0, 8.0, 9.0, 7.0, 7.0, 5.0, 8.0, 4.0, 4.0, 3.0, 0.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.00014901161193847656, -0.00014443323016166687, -0.00013985484838485718, -0.00013527646660804749, -0.0001306980848312378, -0.0001261197030544281, -0.00012154132127761841, -0.00011696293950080872, -0.00011238455772399902, -0.00010780617594718933, -0.00010322779417037964, -9.864941239356995e-05, -9.407103061676025e-05, -8.949264883995056e-05, -8.491426706314087e-05, -8.033588528633118e-05, -7.575750350952148e-05, -7.117912173271179e-05, -6.66007399559021e-05, -6.202235817909241e-05, -5.7443976402282715e-05, -5.286559462547302e-05, -4.828721284866333e-05, -4.370883107185364e-05, -3.9130449295043945e-05, -3.455206751823425e-05, -2.997368574142456e-05, -2.5395303964614868e-05, -2.0816922187805176e-05, -1.6238540410995483e-05, -1.1660158634185791e-05, -7.081776857376099e-06, -2.5033950805664062e-06, 2.074986696243286e-06, 6.6533684730529785e-06, 1.1231750249862671e-05, 1.5810132026672363e-05, 2.0388513803482056e-05, 2.4966895580291748e-05, 2.954527735710144e-05, 3.412365913391113e-05, 3.8702040910720825e-05, 4.328042268753052e-05, 4.785880446434021e-05, 5.24371862411499e-05, 5.7015568017959595e-05, 6.159394979476929e-05, 6.617233157157898e-05, 7.075071334838867e-05, 7.532909512519836e-05, 7.990747690200806e-05, 8.448585867881775e-05, 8.906424045562744e-05, 9.364262223243713e-05, 9.822100400924683e-05, 0.00010279938578605652, 0.00010737776756286621, 0.0001119561493396759, 0.0001165345311164856, 0.00012111291289329529, 0.00012569129467010498, 0.00013026967644691467, 0.00013484805822372437, 0.00013942644000053406, 0.00014400482177734375]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.weight": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 1.0, 1.0, 5.0, 4.0, 6.0, 10.0, 12.0, 22.0, 19.0, 28.0, 41.0, 45.0, 55.0, 85.0, 125.0, 194.0, 328.0, 554.0, 911.0, 1819.0, 3220.0, 6416.0, 12537.0, 25815.0, 54345.0, 116424.0, 218122.0, 263629.0, 176087.0, 87378.0, 40447.0, 19421.0, 9631.0, 4918.0, 2519.0, 1382.0, 749.0, 451.0, 247.0, 166.0, 106.0, 80.0, 55.0, 41.0, 26.0, 18.0, 19.0, 10.0, 11.0, 6.0, 5.0, 10.0, 5.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.548828125, -2.4647216796875, -2.380615234375, -2.2965087890625, -2.21240234375, -2.1282958984375, -2.044189453125, -1.9600830078125, -1.8759765625, -1.7918701171875, -1.707763671875, -1.6236572265625, -1.53955078125, -1.4554443359375, -1.371337890625, -1.2872314453125, -1.203125, -1.1190185546875, -1.034912109375, -0.9508056640625, -0.86669921875, -0.7825927734375, -0.698486328125, -0.6143798828125, -0.5302734375, -0.4461669921875, -0.362060546875, -0.2779541015625, -0.19384765625, -0.1097412109375, -0.025634765625, 0.0584716796875, 0.142578125, 0.2266845703125, 0.310791015625, 0.3948974609375, 0.47900390625, 0.5631103515625, 0.647216796875, 0.7313232421875, 0.8154296875, 0.8995361328125, 0.983642578125, 1.0677490234375, 1.15185546875, 1.2359619140625, 1.320068359375, 1.4041748046875, 1.48828125, 1.5723876953125, 1.656494140625, 1.7406005859375, 1.82470703125, 1.9088134765625, 1.992919921875, 2.0770263671875, 2.1611328125, 2.2452392578125, 2.329345703125, 2.4134521484375, 2.49755859375, 2.5816650390625, 2.665771484375, 2.7498779296875, 2.833984375]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 6.0, 2.0, 5.0, 4.0, 5.0, 8.0, 10.0, 14.0, 14.0, 17.0, 10.0, 26.0, 22.0, 36.0, 38.0, 37.0, 51.0, 57.0, 58.0, 77.0, 61.0, 70.0, 51.0, 53.0, 51.0, 44.0, 22.0, 33.0, 26.0, 12.0, 15.0, 16.0, 9.0, 6.0, 10.0, 2.0, 8.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0], "bins": [-0.767578125, -0.743927001953125, -0.72027587890625, -0.696624755859375, -0.6729736328125, -0.649322509765625, -0.62567138671875, -0.602020263671875, -0.578369140625, -0.554718017578125, -0.53106689453125, -0.507415771484375, -0.4837646484375, -0.460113525390625, -0.43646240234375, -0.412811279296875, -0.38916015625, -0.365509033203125, -0.34185791015625, -0.318206787109375, -0.2945556640625, -0.270904541015625, -0.24725341796875, -0.223602294921875, -0.199951171875, -0.176300048828125, -0.15264892578125, -0.128997802734375, -0.1053466796875, -0.081695556640625, -0.05804443359375, -0.034393310546875, -0.0107421875, 0.012908935546875, 0.03656005859375, 0.060211181640625, 0.0838623046875, 0.107513427734375, 0.13116455078125, 0.154815673828125, 0.178466796875, 0.202117919921875, 0.22576904296875, 0.249420166015625, 0.2730712890625, 0.296722412109375, 0.32037353515625, 0.344024658203125, 0.36767578125, 0.391326904296875, 0.41497802734375, 0.438629150390625, 0.4622802734375, 0.485931396484375, 0.50958251953125, 0.533233642578125, 0.556884765625, 0.580535888671875, 0.60418701171875, 0.627838134765625, 0.6514892578125, 0.675140380859375, 0.69879150390625, 0.722442626953125, 0.74609375]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 2.0, 6.0, 5.0, 8.0, 8.0, 10.0, 12.0, 19.0, 30.0, 29.0, 31.0, 38.0, 46.0, 68.0, 72.0, 83.0, 66.0, 75.0, 56.0, 63.0, 52.0, 38.0, 32.0, 28.0, 22.0, 22.0, 14.0, 10.0, 7.0, 8.0, 5.0, 5.0, 10.0, 3.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.405219078063965, -6.180782318115234, -5.956345558166504, -5.731909275054932, -5.507472515106201, -5.283035755157471, -5.058599472045898, -4.834162712097168, -4.6097259521484375, -4.385289192199707, -4.160852432250977, -3.9364161491394043, -3.711979389190674, -3.4875426292419434, -3.263106107711792, -3.0386695861816406, -2.81423282623291, -2.5897960662841797, -2.3653595447540283, -2.140923023223877, -1.9164862632751465, -1.6920496225357056, -1.4676129817962646, -1.2431763410568237, -1.0187397003173828, -0.7943030595779419, -0.569866418838501, -0.34542977809906006, -0.12099313735961914, 0.10344350337982178, 0.3278801441192627, 0.5523167848587036, 0.7767529487609863, 1.0011895895004272, 1.2256262302398682, 1.450062870979309, 1.67449951171875, 1.898936152458191, 2.123372793197632, 2.347809314727783, 2.5722460746765137, 2.796682834625244, 3.0211193561553955, 3.245555877685547, 3.4699926376342773, 3.694429397583008, 3.918865919113159, 4.1433024406433105, 4.367739200592041, 4.5921759605407715, 4.816612243652344, 5.041049003601074, 5.265485763549805, 5.489922523498535, 5.714359283447266, 5.938795566558838, 6.163232326507568, 6.387669086456299, 6.612105369567871, 6.836542129516602, 7.060978889465332, 7.2854156494140625, 7.509852409362793, 7.734288692474365, 7.958725452423096]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 6.0, 2.0, 4.0, 2.0, 9.0, 2.0, 6.0, 8.0, 7.0, 10.0, 13.0, 16.0, 23.0, 17.0, 19.0, 24.0, 26.0, 25.0, 53.0, 42.0, 31.0, 46.0, 36.0, 42.0, 47.0, 30.0, 38.0, 39.0, 35.0, 43.0, 32.0, 34.0, 32.0, 24.0, 24.0, 21.0, 23.0, 18.0, 24.0, 12.0, 13.0, 12.0, 5.0, 9.0, 7.0, 4.0, 2.0, 1.0, 4.0, 5.0, 3.0, 1.0, 0.0, 2.0, 3.0], "bins": [-6.5223188400268555, -6.3299736976623535, -6.13762903213501, -5.945283889770508, -5.752938747406006, -5.560593605041504, -5.36824893951416, -5.175903797149658, -4.983558654785156, -4.791213512420654, -4.5988688468933105, -4.406523704528809, -4.214178562164307, -4.021833419799805, -3.829488754272461, -3.637143611907959, -3.4447989463806152, -3.2524540424346924, -3.0601089000701904, -2.8677639961242676, -2.6754188537597656, -2.4830739498138428, -2.29072904586792, -2.098383903503418, -1.9060389995574951, -1.7136939764022827, -1.5213489532470703, -1.3290040493011475, -1.136659026145935, -0.9443140029907227, -0.7519690990447998, -0.5596240758895874, -0.3672785758972168, -0.17493358254432678, 0.017411410808563232, 0.20975637435913086, 0.40210139751434326, 0.5944464206695557, 0.7867913246154785, 0.9791363477706909, 1.1714813709259033, 1.3638263940811157, 1.5561714172363281, 1.748516321182251, 1.9408613443374634, 2.133206367492676, 2.3255512714385986, 2.5178961753845215, 2.7102413177490234, 2.9025862216949463, 3.0949313640594482, 3.287276268005371, 3.479621410369873, 3.671966314315796, 3.8643112182617188, 4.056656360626221, 4.249001502990723, 4.441346645355225, 4.633691310882568, 4.82603645324707, 5.018381595611572, 5.210726737976074, 5.403071403503418, 5.59541654586792, 5.787761211395264]}, "gradients/decoder.bert.encoder.layer.10.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 3.0, 11.0, 11.0, 29.0, 40.0, 47.0, 83.0, 124.0, 196.0, 320.0, 463.0, 756.0, 1153.0, 1882.0, 3101.0, 4954.0, 8006.0, 13414.0, 22619.0, 39142.0, 70404.0, 129816.0, 245963.0, 466331.0, 789353.0, 922504.0, 667048.0, 370254.0, 193875.0, 103272.0, 56873.0, 32539.0, 19141.0, 11802.0, 6935.0, 4272.0, 2796.0, 1684.0, 1088.0, 729.0, 458.0, 281.0, 196.0, 108.0, 80.0, 51.0, 33.0, 16.0, 13.0, 10.0, 6.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.5546875, -5.365234375, -5.17578125, -4.986328125, -4.796875, -4.607421875, -4.41796875, -4.228515625, -4.0390625, -3.849609375, -3.66015625, -3.470703125, -3.28125, -3.091796875, -2.90234375, -2.712890625, -2.5234375, -2.333984375, -2.14453125, -1.955078125, -1.765625, -1.576171875, -1.38671875, -1.197265625, -1.0078125, -0.818359375, -0.62890625, -0.439453125, -0.25, -0.060546875, 0.12890625, 0.318359375, 0.5078125, 0.697265625, 0.88671875, 1.076171875, 1.265625, 1.455078125, 1.64453125, 1.833984375, 2.0234375, 2.212890625, 2.40234375, 2.591796875, 2.78125, 2.970703125, 3.16015625, 3.349609375, 3.5390625, 3.728515625, 3.91796875, 4.107421875, 4.296875, 4.486328125, 4.67578125, 4.865234375, 5.0546875, 5.244140625, 5.43359375, 5.623046875, 5.8125, 6.001953125, 6.19140625, 6.380859375, 6.5703125]}, "gradients/decoder.bert.encoder.layer.10.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 8.0, 2.0, 6.0, 3.0, 8.0, 8.0, 10.0, 12.0, 12.0, 15.0, 26.0, 19.0, 27.0, 34.0, 24.0, 34.0, 41.0, 53.0, 49.0, 40.0, 34.0, 38.0, 41.0, 46.0, 33.0, 41.0, 48.0, 28.0, 41.0, 26.0, 29.0, 22.0, 21.0, 19.0, 21.0, 15.0, 14.0, 9.0, 10.0, 8.0, 9.0, 4.0, 4.0, 3.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0], "bins": [-4.7421875, -4.60333251953125, -4.4644775390625, -4.32562255859375, -4.186767578125, -4.04791259765625, -3.9090576171875, -3.77020263671875, -3.63134765625, -3.49249267578125, -3.3536376953125, -3.21478271484375, -3.075927734375, -2.93707275390625, -2.7982177734375, -2.65936279296875, -2.5205078125, -2.38165283203125, -2.2427978515625, -2.10394287109375, -1.965087890625, -1.82623291015625, -1.6873779296875, -1.54852294921875, -1.40966796875, -1.27081298828125, -1.1319580078125, -0.99310302734375, -0.854248046875, -0.71539306640625, -0.5765380859375, -0.43768310546875, -0.298828125, -0.15997314453125, -0.0211181640625, 0.11773681640625, 0.256591796875, 0.39544677734375, 0.5343017578125, 0.67315673828125, 0.81201171875, 0.95086669921875, 1.0897216796875, 1.22857666015625, 1.367431640625, 1.50628662109375, 1.6451416015625, 1.78399658203125, 1.9228515625, 2.06170654296875, 2.2005615234375, 2.33941650390625, 2.478271484375, 2.61712646484375, 2.7559814453125, 2.89483642578125, 3.03369140625, 3.17254638671875, 3.3114013671875, 3.45025634765625, 3.589111328125, 3.72796630859375, 3.8668212890625, 4.00567626953125, 4.14453125]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 4.0, 5.0, 6.0, 7.0, 14.0, 33.0, 35.0, 52.0, 88.0, 139.0, 224.0, 346.0, 539.0, 907.0, 1497.0, 2353.0, 3916.0, 6634.0, 11185.0, 19418.0, 34106.0, 60337.0, 108674.0, 195990.0, 345404.0, 563394.0, 768608.0, 758177.0, 549062.0, 332787.0, 187659.0, 105035.0, 58616.0, 32569.0, 18984.0, 11006.0, 6612.0, 3857.0, 2295.0, 1362.0, 892.0, 518.0, 327.0, 231.0, 142.0, 98.0, 53.0, 35.0, 27.0, 11.0, 5.0, 7.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-5.453125, -5.27703857421875, -5.1009521484375, -4.92486572265625, -4.748779296875, -4.57269287109375, -4.3966064453125, -4.22052001953125, -4.04443359375, -3.86834716796875, -3.6922607421875, -3.51617431640625, -3.340087890625, -3.16400146484375, -2.9879150390625, -2.81182861328125, -2.6357421875, -2.45965576171875, -2.2835693359375, -2.10748291015625, -1.931396484375, -1.75531005859375, -1.5792236328125, -1.40313720703125, -1.22705078125, -1.05096435546875, -0.8748779296875, -0.69879150390625, -0.522705078125, -0.34661865234375, -0.1705322265625, 0.00555419921875, 0.181640625, 0.35772705078125, 0.5338134765625, 0.70989990234375, 0.885986328125, 1.06207275390625, 1.2381591796875, 1.41424560546875, 1.59033203125, 1.76641845703125, 1.9425048828125, 2.11859130859375, 2.294677734375, 2.47076416015625, 2.6468505859375, 2.82293701171875, 2.9990234375, 3.17510986328125, 3.3511962890625, 3.52728271484375, 3.703369140625, 3.87945556640625, 4.0555419921875, 4.23162841796875, 4.40771484375, 4.58380126953125, 4.7598876953125, 4.93597412109375, 5.112060546875, 5.28814697265625, 5.4642333984375, 5.64031982421875, 5.81640625]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 7.0, 7.0, 8.0, 8.0, 15.0, 19.0, 29.0, 35.0, 43.0, 64.0, 68.0, 98.0, 107.0, 132.0, 148.0, 173.0, 184.0, 199.0, 229.0, 254.0, 276.0, 215.0, 217.0, 239.0, 199.0, 191.0, 154.0, 126.0, 128.0, 96.0, 70.0, 65.0, 48.0, 50.0, 34.0, 31.0, 26.0, 19.0, 12.0, 6.0, 7.0, 9.0, 10.0, 7.0, 8.0, 7.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.21875, -2.1453857421875, -2.072021484375, -1.9986572265625, -1.92529296875, -1.8519287109375, -1.778564453125, -1.7052001953125, -1.6318359375, -1.5584716796875, -1.485107421875, -1.4117431640625, -1.33837890625, -1.2650146484375, -1.191650390625, -1.1182861328125, -1.044921875, -0.9715576171875, -0.898193359375, -0.8248291015625, -0.75146484375, -0.6781005859375, -0.604736328125, -0.5313720703125, -0.4580078125, -0.3846435546875, -0.311279296875, -0.2379150390625, -0.16455078125, -0.0911865234375, -0.017822265625, 0.0555419921875, 0.12890625, 0.2022705078125, 0.275634765625, 0.3489990234375, 0.42236328125, 0.4957275390625, 0.569091796875, 0.6424560546875, 0.7158203125, 0.7891845703125, 0.862548828125, 0.9359130859375, 1.00927734375, 1.0826416015625, 1.156005859375, 1.2293701171875, 1.302734375, 1.3760986328125, 1.449462890625, 1.5228271484375, 1.59619140625, 1.6695556640625, 1.742919921875, 1.8162841796875, 1.8896484375, 1.9630126953125, 2.036376953125, 2.1097412109375, 2.18310546875, 2.2564697265625, 2.329833984375, 2.4031982421875, 2.4765625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 4.0, 3.0, 6.0, 2.0, 5.0, 4.0, 11.0, 12.0, 21.0, 17.0, 19.0, 26.0, 30.0, 38.0, 45.0, 60.0, 66.0, 72.0, 77.0, 70.0, 76.0, 47.0, 61.0, 38.0, 44.0, 33.0, 17.0, 17.0, 15.0, 15.0, 10.0, 9.0, 9.0, 4.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0], "bins": [-6.891319274902344, -6.666637897491455, -6.441956043243408, -6.2172746658325195, -5.992592811584473, -5.767911434173584, -5.543230056762695, -5.318548202514648, -5.09386682510376, -4.869185447692871, -4.644503593444824, -4.4198222160339355, -4.195140361785889, -3.970458984375, -3.7457773685455322, -3.5210957527160645, -3.2964141368865967, -3.071732521057129, -2.847050905227661, -2.6223692893981934, -2.3976879119873047, -2.173006296157837, -1.9483246803283691, -1.723643183708191, -1.4989615678787231, -1.2742799520492554, -1.0495984554290771, -0.8249168395996094, -0.6002352833747864, -0.3755537271499634, -0.1508721113204956, 0.07380938529968262, 0.2984910011291504, 0.5231725573539734, 0.7478541135787964, 0.9725357294082642, 1.1972172260284424, 1.4218988418579102, 1.646580457687378, 1.8712619543075562, 2.0959434509277344, 2.320625066757202, 2.54530668258667, 2.7699880599975586, 2.9946696758270264, 3.219351291656494, 3.444032907485962, 3.6687145233154297, 3.8933961391448975, 4.118077754974365, 4.342759132385254, 4.567440986633301, 4.7921223640441895, 5.016803741455078, 5.241485595703125, 5.466166973114014, 5.6908488273620605, 5.915530204772949, 6.140212059020996, 6.364893436431885, 6.589575290679932, 6.81425666809082, 7.038938522338867, 7.263619899749756, 7.4883012771606445]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 4.0, 4.0, 7.0, 5.0, 4.0, 6.0, 10.0, 7.0, 10.0, 12.0, 12.0, 13.0, 14.0, 21.0, 26.0, 28.0, 27.0, 45.0, 31.0, 35.0, 35.0, 47.0, 50.0, 33.0, 46.0, 46.0, 45.0, 36.0, 37.0, 41.0, 31.0, 27.0, 31.0, 25.0, 20.0, 24.0, 15.0, 12.0, 19.0, 12.0, 7.0, 6.0, 5.0, 6.0, 7.0, 7.0, 4.0, 1.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.0724358558654785, -5.884020805358887, -5.695605754852295, -5.507190704345703, -5.318775653839111, -5.1303606033325195, -4.941945552825928, -4.753530502319336, -4.565115451812744, -4.376700401306152, -4.1882853507995605, -3.9998703002929688, -3.811455249786377, -3.623040199279785, -3.4346251487731934, -3.2462100982666016, -3.0577948093414307, -2.869379758834839, -2.680964708328247, -2.4925496578216553, -2.3041346073150635, -2.1157195568084717, -1.9273043870925903, -1.7388893365859985, -1.5504742860794067, -1.362059235572815, -1.1736441850662231, -0.9852290749549866, -0.7968140244483948, -0.608398973941803, -0.4199838638305664, -0.2315688133239746, -0.04315376281738281, 0.14526130259037018, 0.33367636799812317, 0.5220914483070374, 0.7105064988136292, 0.898921549320221, 1.0873366594314575, 1.2757517099380493, 1.4641667604446411, 1.652581810951233, 1.8409968614578247, 2.029412031173706, 2.217827081680298, 2.4062421321868896, 2.5946571826934814, 2.7830722332000732, 2.971487283706665, 3.159902334213257, 3.3483173847198486, 3.5367324352264404, 3.7251474857330322, 3.913562536239624, 4.101977825164795, 4.290392875671387, 4.4788079261779785, 4.66722297668457, 4.855638027191162, 5.044053077697754, 5.232468128204346, 5.4208831787109375, 5.609298229217529, 5.797713279724121, 5.986128330230713]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 4.0, 14.0, 21.0, 29.0, 63.0, 94.0, 114.0, 177.0, 291.0, 426.0, 653.0, 1030.0, 1589.0, 2439.0, 3695.0, 5740.0, 9087.0, 14471.0, 22841.0, 36692.0, 59203.0, 95540.0, 148129.0, 195991.0, 164220.0, 106912.0, 67397.0, 41340.0, 25741.0, 16077.0, 10104.0, 6412.0, 4242.0, 2748.0, 1791.0, 1136.0, 713.0, 477.0, 327.0, 208.0, 140.0, 87.0, 68.0, 31.0, 22.0, 13.0, 15.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.78369140625, -0.7589111328125, -0.734130859375, -0.7093505859375, -0.6845703125, -0.6597900390625, -0.635009765625, -0.6102294921875, -0.58544921875, -0.5606689453125, -0.535888671875, -0.5111083984375, -0.486328125, -0.4615478515625, -0.436767578125, -0.4119873046875, -0.38720703125, -0.3624267578125, -0.337646484375, -0.3128662109375, -0.2880859375, -0.2633056640625, -0.238525390625, -0.2137451171875, -0.18896484375, -0.1641845703125, -0.139404296875, -0.1146240234375, -0.08984375, -0.0650634765625, -0.040283203125, -0.0155029296875, 0.00927734375, 0.0340576171875, 0.058837890625, 0.0836181640625, 0.1083984375, 0.1331787109375, 0.157958984375, 0.1827392578125, 0.20751953125, 0.2322998046875, 0.257080078125, 0.2818603515625, 0.306640625, 0.3314208984375, 0.356201171875, 0.3809814453125, 0.40576171875, 0.4305419921875, 0.455322265625, 0.4801025390625, 0.5048828125, 0.5296630859375, 0.554443359375, 0.5792236328125, 0.60400390625, 0.6287841796875, 0.653564453125, 0.6783447265625, 0.703125, 0.7279052734375, 0.752685546875, 0.7774658203125, 0.80224609375]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 6.0, 2.0, 10.0, 6.0, 8.0, 10.0, 5.0, 13.0, 12.0, 14.0, 18.0, 24.0, 30.0, 34.0, 33.0, 36.0, 43.0, 37.0, 48.0, 52.0, 37.0, 61.0, 46.0, 42.0, 46.0, 50.0, 25.0, 40.0, 29.0, 34.0, 15.0, 27.0, 12.0, 17.0, 19.0, 13.0, 9.0, 6.0, 10.0, 5.0, 3.0, 5.0, 2.0, 2.0, 5.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.91796875, -6.70361328125, -6.4892578125, -6.27490234375, -6.060546875, -5.84619140625, -5.6318359375, -5.41748046875, -5.203125, -4.98876953125, -4.7744140625, -4.56005859375, -4.345703125, -4.13134765625, -3.9169921875, -3.70263671875, -3.48828125, -3.27392578125, -3.0595703125, -2.84521484375, -2.630859375, -2.41650390625, -2.2021484375, -1.98779296875, -1.7734375, -1.55908203125, -1.3447265625, -1.13037109375, -0.916015625, -0.70166015625, -0.4873046875, -0.27294921875, -0.05859375, 0.15576171875, 0.3701171875, 0.58447265625, 0.798828125, 1.01318359375, 1.2275390625, 1.44189453125, 1.65625, 1.87060546875, 2.0849609375, 2.29931640625, 2.513671875, 2.72802734375, 2.9423828125, 3.15673828125, 3.37109375, 3.58544921875, 3.7998046875, 4.01416015625, 4.228515625, 4.44287109375, 4.6572265625, 4.87158203125, 5.0859375, 5.30029296875, 5.5146484375, 5.72900390625, 5.943359375, 6.15771484375, 6.3720703125, 6.58642578125, 6.80078125]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 2.0, 5.0, 9.0, 11.0, 16.0, 23.0, 41.0, 68.0, 93.0, 165.0, 242.0, 373.0, 621.0, 973.0, 1609.0, 2524.0, 4040.0, 6410.0, 10460.0, 17079.0, 28070.0, 44843.0, 71503.0, 109403.0, 159674.0, 186326.0, 143862.0, 96367.0, 61773.0, 38859.0, 24103.0, 14880.0, 9250.0, 5536.0, 3475.0, 2165.0, 1346.0, 833.0, 538.0, 371.0, 227.0, 156.0, 78.0, 62.0, 30.0, 28.0, 17.0, 10.0, 3.0, 5.0, 3.0, 2.0, 4.0, 0.0, 1.0], "bins": [-0.89306640625, -0.8670654296875, -0.841064453125, -0.8150634765625, -0.7890625, -0.7630615234375, -0.737060546875, -0.7110595703125, -0.68505859375, -0.6590576171875, -0.633056640625, -0.6070556640625, -0.5810546875, -0.5550537109375, -0.529052734375, -0.5030517578125, -0.47705078125, -0.4510498046875, -0.425048828125, -0.3990478515625, -0.373046875, -0.3470458984375, -0.321044921875, -0.2950439453125, -0.26904296875, -0.2430419921875, -0.217041015625, -0.1910400390625, -0.1650390625, -0.1390380859375, -0.113037109375, -0.0870361328125, -0.06103515625, -0.0350341796875, -0.009033203125, 0.0169677734375, 0.04296875, 0.0689697265625, 0.094970703125, 0.1209716796875, 0.14697265625, 0.1729736328125, 0.198974609375, 0.2249755859375, 0.2509765625, 0.2769775390625, 0.302978515625, 0.3289794921875, 0.35498046875, 0.3809814453125, 0.406982421875, 0.4329833984375, 0.458984375, 0.4849853515625, 0.510986328125, 0.5369873046875, 0.56298828125, 0.5889892578125, 0.614990234375, 0.6409912109375, 0.6669921875, 0.6929931640625, 0.718994140625, 0.7449951171875, 0.77099609375]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 9.0, 6.0, 14.0, 13.0, 8.0, 14.0, 16.0, 21.0, 17.0, 25.0, 33.0, 30.0, 36.0, 28.0, 34.0, 42.0, 48.0, 49.0, 46.0, 46.0, 54.0, 35.0, 33.0, 38.0, 30.0, 41.0, 32.0, 33.0, 28.0, 28.0, 15.0, 19.0, 17.0, 16.0, 8.0, 15.0, 8.0, 4.0, 4.0, 2.0, 6.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.80078125, -3.67510986328125, -3.5494384765625, -3.42376708984375, -3.298095703125, -3.17242431640625, -3.0467529296875, -2.92108154296875, -2.79541015625, -2.66973876953125, -2.5440673828125, -2.41839599609375, -2.292724609375, -2.16705322265625, -2.0413818359375, -1.91571044921875, -1.7900390625, -1.66436767578125, -1.5386962890625, -1.41302490234375, -1.287353515625, -1.16168212890625, -1.0360107421875, -0.91033935546875, -0.78466796875, -0.65899658203125, -0.5333251953125, -0.40765380859375, -0.281982421875, -0.15631103515625, -0.0306396484375, 0.09503173828125, 0.220703125, 0.34637451171875, 0.4720458984375, 0.59771728515625, 0.723388671875, 0.84906005859375, 0.9747314453125, 1.10040283203125, 1.22607421875, 1.35174560546875, 1.4774169921875, 1.60308837890625, 1.728759765625, 1.85443115234375, 1.9801025390625, 2.10577392578125, 2.2314453125, 2.35711669921875, 2.4827880859375, 2.60845947265625, 2.734130859375, 2.85980224609375, 2.9854736328125, 3.11114501953125, 3.23681640625, 3.36248779296875, 3.4881591796875, 3.61383056640625, 3.739501953125, 3.86517333984375, 3.9908447265625, 4.11651611328125, 4.2421875]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 8.0, 7.0, 21.0, 14.0, 27.0, 44.0, 69.0, 72.0, 128.0, 230.0, 370.0, 584.0, 992.0, 1682.0, 2961.0, 5756.0, 11166.0, 24004.0, 57232.0, 157806.0, 397681.0, 239310.0, 83854.0, 33190.0, 14887.0, 7380.0, 3859.0, 2087.0, 1239.0, 720.0, 428.0, 264.0, 154.0, 119.0, 72.0, 42.0, 32.0, 25.0, 17.0, 5.0, 7.0, 5.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07379150390625, -0.07112693786621094, -0.06846237182617188, -0.06579780578613281, -0.06313323974609375, -0.06046867370605469, -0.057804107666015625, -0.05513954162597656, -0.0524749755859375, -0.04981040954589844, -0.047145843505859375, -0.04448127746582031, -0.04181671142578125, -0.03915214538574219, -0.036487579345703125, -0.03382301330566406, -0.031158447265625, -0.028493881225585938, -0.025829315185546875, -0.023164749145507812, -0.02050018310546875, -0.017835617065429688, -0.015171051025390625, -0.012506484985351562, -0.0098419189453125, -0.0071773529052734375, -0.004512786865234375, -0.0018482208251953125, 0.00081634521484375, 0.0034809112548828125, 0.006145477294921875, 0.008810043334960938, 0.011474609375, 0.014139175415039062, 0.016803741455078125, 0.019468307495117188, 0.02213287353515625, 0.024797439575195312, 0.027462005615234375, 0.030126571655273438, 0.0327911376953125, 0.03545570373535156, 0.038120269775390625, 0.04078483581542969, 0.04344940185546875, 0.04611396789550781, 0.048778533935546875, 0.05144309997558594, 0.054107666015625, 0.05677223205566406, 0.059436798095703125, 0.06210136413574219, 0.06476593017578125, 0.06743049621582031, 0.07009506225585938, 0.07275962829589844, 0.0754241943359375, 0.07808876037597656, 0.08075332641601562, 0.08341789245605469, 0.08608245849609375, 0.08874702453613281, 0.09141159057617188, 0.09407615661621094, 0.09674072265625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 6.0, 6.0, 6.0, 12.0, 8.0, 9.0, 8.0, 11.0, 10.0, 18.0, 19.0, 26.0, 34.0, 28.0, 30.0, 43.0, 44.0, 56.0, 66.0, 37.0, 44.0, 53.0, 42.0, 55.0, 45.0, 40.0, 38.0, 35.0, 31.0, 20.0, 23.0, 19.0, 11.0, 20.0, 9.0, 10.0, 6.0, 5.0, 2.0, 8.0, 6.0, 5.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.894371032714844e-06, -9.597279131412506e-06, -9.300187230110168e-06, -9.00309532880783e-06, -8.706003427505493e-06, -8.408911526203156e-06, -8.111819624900818e-06, -7.81472772359848e-06, -7.517635822296143e-06, -7.220543920993805e-06, -6.923452019691467e-06, -6.62636011838913e-06, -6.329268217086792e-06, -6.032176315784454e-06, -5.735084414482117e-06, -5.437992513179779e-06, -5.140900611877441e-06, -4.843808710575104e-06, -4.546716809272766e-06, -4.2496249079704285e-06, -3.952533006668091e-06, -3.655441105365753e-06, -3.3583492040634155e-06, -3.061257302761078e-06, -2.7641654014587402e-06, -2.4670735001564026e-06, -2.169981598854065e-06, -1.8728896975517273e-06, -1.5757977962493896e-06, -1.278705894947052e-06, -9.816139936447144e-07, -6.845220923423767e-07, -3.8743019104003906e-07, -9.033828973770142e-08, 2.0675361156463623e-07, 5.038455128669739e-07, 8.009374141693115e-07, 1.0980293154716492e-06, 1.3951212167739868e-06, 1.6922131180763245e-06, 1.989305019378662e-06, 2.2863969206809998e-06, 2.5834888219833374e-06, 2.880580723285675e-06, 3.1776726245880127e-06, 3.4747645258903503e-06, 3.771856427192688e-06, 4.068948328495026e-06, 4.366040229797363e-06, 4.663132131099701e-06, 4.9602240324020386e-06, 5.257315933704376e-06, 5.554407835006714e-06, 5.8514997363090515e-06, 6.148591637611389e-06, 6.445683538913727e-06, 6.7427754402160645e-06, 7.039867341518402e-06, 7.33695924282074e-06, 7.634051144123077e-06, 7.931143045425415e-06, 8.228234946727753e-06, 8.52532684803009e-06, 8.822418749332428e-06, 9.119510650634766e-06]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 6.0, 9.0, 9.0, 12.0, 25.0, 31.0, 62.0, 72.0, 99.0, 161.0, 204.0, 322.0, 485.0, 693.0, 1125.0, 1651.0, 2654.0, 4305.0, 7151.0, 12304.0, 23722.0, 49269.0, 115464.0, 306858.0, 303486.0, 114603.0, 48768.0, 23559.0, 12306.0, 7253.0, 4227.0, 2666.0, 1705.0, 1081.0, 749.0, 483.0, 295.0, 220.0, 150.0, 95.0, 80.0, 34.0, 36.0, 20.0, 10.0, 11.0, 11.0, 6.0, 4.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0941162109375, -0.0910797119140625, -0.088043212890625, -0.0850067138671875, -0.08197021484375, -0.0789337158203125, -0.075897216796875, -0.0728607177734375, -0.06982421875, -0.0667877197265625, -0.063751220703125, -0.0607147216796875, -0.05767822265625, -0.0546417236328125, -0.051605224609375, -0.0485687255859375, -0.0455322265625, -0.0424957275390625, -0.039459228515625, -0.0364227294921875, -0.03338623046875, -0.0303497314453125, -0.027313232421875, -0.0242767333984375, -0.021240234375, -0.0182037353515625, -0.015167236328125, -0.0121307373046875, -0.00909423828125, -0.0060577392578125, -0.003021240234375, 1.52587890625e-05, 0.0030517578125, 0.0060882568359375, 0.009124755859375, 0.0121612548828125, 0.01519775390625, 0.0182342529296875, 0.021270751953125, 0.0243072509765625, 0.02734375, 0.0303802490234375, 0.033416748046875, 0.0364532470703125, 0.03948974609375, 0.0425262451171875, 0.045562744140625, 0.0485992431640625, 0.0516357421875, 0.0546722412109375, 0.057708740234375, 0.0607452392578125, 0.06378173828125, 0.0668182373046875, 0.069854736328125, 0.0728912353515625, 0.075927734375, 0.0789642333984375, 0.082000732421875, 0.0850372314453125, 0.08807373046875, 0.0911102294921875, 0.094146728515625, 0.0971832275390625, 0.1002197265625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 6.0, 3.0, 6.0, 5.0, 6.0, 8.0, 20.0, 8.0, 13.0, 27.0, 34.0, 37.0, 45.0, 61.0, 77.0, 81.0, 93.0, 97.0, 83.0, 58.0, 54.0, 56.0, 32.0, 29.0, 16.0, 11.0, 14.0, 9.0, 4.0, 6.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.036224365234375, -0.03507232666015625, -0.0339202880859375, -0.03276824951171875, -0.0316162109375, -0.03046417236328125, -0.0293121337890625, -0.02816009521484375, -0.027008056640625, -0.02585601806640625, -0.0247039794921875, -0.02355194091796875, -0.02239990234375, -0.02124786376953125, -0.0200958251953125, -0.01894378662109375, -0.017791748046875, -0.01663970947265625, -0.0154876708984375, -0.01433563232421875, -0.01318359375, -0.01203155517578125, -0.0108795166015625, -0.00972747802734375, -0.008575439453125, -0.00742340087890625, -0.0062713623046875, -0.00511932373046875, -0.00396728515625, -0.00281524658203125, -0.0016632080078125, -0.00051116943359375, 0.000640869140625, 0.00179290771484375, 0.0029449462890625, 0.00409698486328125, 0.0052490234375, 0.00640106201171875, 0.0075531005859375, 0.00870513916015625, 0.009857177734375, 0.01100921630859375, 0.0121612548828125, 0.01331329345703125, 0.01446533203125, 0.01561737060546875, 0.0167694091796875, 0.01792144775390625, 0.019073486328125, 0.02022552490234375, 0.0213775634765625, 0.02252960205078125, 0.023681640625, 0.02483367919921875, 0.0259857177734375, 0.02713775634765625, 0.028289794921875, 0.02944183349609375, 0.0305938720703125, 0.03174591064453125, 0.03289794921875, 0.03404998779296875, 0.0352020263671875, 0.03635406494140625, 0.037506103515625]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 4.0, 4.0, 4.0, 4.0, 4.0, 5.0, 5.0, 14.0, 19.0, 15.0, 19.0, 23.0, 34.0, 27.0, 47.0, 49.0, 68.0, 68.0, 72.0, 78.0, 76.0, 60.0, 52.0, 47.0, 40.0, 36.0, 27.0, 18.0, 14.0, 13.0, 13.0, 10.0, 8.0, 7.0, 1.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-6.7645955085754395, -6.539731979370117, -6.314868927001953, -6.090005397796631, -5.865141868591309, -5.6402788162231445, -5.415415287017822, -5.1905517578125, -4.965688705444336, -4.740825176239014, -4.51596212387085, -4.291098594665527, -4.066235065460205, -3.841372013092041, -3.6165084838867188, -3.3916451930999756, -3.1667816638946533, -2.94191837310791, -2.717054843902588, -2.4921915531158447, -2.2673282623291016, -2.0424647331237793, -1.8176014423370361, -1.592738151550293, -1.3678747415542603, -1.1430113315582275, -0.9181480407714844, -0.6932846307754517, -0.4684212803840637, -0.24355792999267578, -0.018694519996643066, 0.2061687707901001, 0.4310321807861328, 0.6558955311775208, 0.8807588815689087, 1.1056222915649414, 1.3304855823516846, 1.5553489923477173, 1.78021240234375, 2.005075693130493, 2.2299389839172363, 2.4548022747039795, 2.6796658039093018, 2.904529094696045, 3.129392385482788, 3.3542556762695312, 3.5791192054748535, 3.8039824962615967, 4.02884578704834, 4.253709316253662, 4.478572368621826, 4.703435897827148, 4.928299427032471, 5.153162479400635, 5.378026008605957, 5.602889060974121, 5.827753067016602, 6.052616596221924, 6.277479648590088, 6.50234317779541, 6.727206707000732, 6.9520697593688965, 7.176933288574219, 7.401796340942383, 7.626659870147705]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 4.0, 5.0, 6.0, 5.0, 5.0, 5.0, 10.0, 6.0, 12.0, 11.0, 12.0, 14.0, 12.0, 22.0, 27.0, 28.0, 28.0, 44.0, 32.0, 36.0, 32.0, 47.0, 51.0, 32.0, 47.0, 49.0, 39.0, 38.0, 42.0, 36.0, 30.0, 28.0, 30.0, 26.0, 20.0, 24.0, 16.0, 10.0, 20.0, 12.0, 7.0, 6.0, 5.0, 6.0, 9.0, 5.0, 4.0, 1.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.0192670822143555, -5.831381797790527, -5.643496036529541, -5.455610752105713, -5.267724990844727, -5.079839706420898, -4.89195442199707, -4.704069137573242, -4.516183376312256, -4.328298091888428, -4.140412330627441, -3.9525270462036133, -3.764641523361206, -3.576756000518799, -3.3888707160949707, -3.2009851932525635, -3.0130996704101562, -2.825214147567749, -2.637328624725342, -2.4494433403015137, -2.2615578174591064, -2.073672294616699, -1.8857868909835815, -1.6979014873504639, -1.5100159645080566, -1.3221304416656494, -1.1342450380325317, -0.9463595747947693, -0.7584741115570068, -0.5705886483192444, -0.38270318508148193, -0.19481778144836426, -0.006931781768798828, 0.18095368146896362, 0.3688391447067261, 0.5567246079444885, 0.744610071182251, 0.9324955344200134, 1.1203809976577759, 1.3082664012908936, 1.4961519241333008, 1.684037446975708, 1.8719228506088257, 2.0598082542419434, 2.2476937770843506, 2.435579299926758, 2.623464584350586, 2.811350107192993, 2.9992356300354004, 3.1871211528778076, 3.375006675720215, 3.562891960144043, 3.75077748298645, 3.9386630058288574, 4.1265482902526855, 4.314434051513672, 4.5023193359375, 4.690204620361328, 4.8780903816223145, 5.065975666046143, 5.253861427307129, 5.441746711730957, 5.629631996154785, 5.817517280578613, 6.0054030418396]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 4.0, 6.0, 10.0, 10.0, 16.0, 36.0, 46.0, 81.0, 112.0, 178.0, 284.0, 438.0, 674.0, 1143.0, 1746.0, 2877.0, 4862.0, 8060.0, 13966.0, 24035.0, 42005.0, 72488.0, 117166.0, 166119.0, 184880.0, 154133.0, 104349.0, 62186.0, 36168.0, 20633.0, 11900.0, 7103.0, 4003.0, 2454.0, 1586.0, 1008.0, 658.0, 378.0, 269.0, 172.0, 116.0, 62.0, 53.0, 36.0, 15.0, 10.0, 7.0, 8.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-5.88671875, -5.71026611328125, -5.5338134765625, -5.35736083984375, -5.180908203125, -5.00445556640625, -4.8280029296875, -4.65155029296875, -4.47509765625, -4.29864501953125, -4.1221923828125, -3.94573974609375, -3.769287109375, -3.59283447265625, -3.4163818359375, -3.23992919921875, -3.0634765625, -2.88702392578125, -2.7105712890625, -2.53411865234375, -2.357666015625, -2.18121337890625, -2.0047607421875, -1.82830810546875, -1.65185546875, -1.47540283203125, -1.2989501953125, -1.12249755859375, -0.946044921875, -0.76959228515625, -0.5931396484375, -0.41668701171875, -0.240234375, -0.06378173828125, 0.1126708984375, 0.28912353515625, 0.465576171875, 0.64202880859375, 0.8184814453125, 0.99493408203125, 1.17138671875, 1.34783935546875, 1.5242919921875, 1.70074462890625, 1.877197265625, 2.05364990234375, 2.2301025390625, 2.40655517578125, 2.5830078125, 2.75946044921875, 2.9359130859375, 3.11236572265625, 3.288818359375, 3.46527099609375, 3.6417236328125, 3.81817626953125, 3.99462890625, 4.17108154296875, 4.3475341796875, 4.52398681640625, 4.700439453125, 4.87689208984375, 5.0533447265625, 5.22979736328125, 5.40625]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 2.0, 8.0, 3.0, 5.0, 4.0, 6.0, 4.0, 9.0, 9.0, 10.0, 8.0, 11.0, 18.0, 13.0, 19.0, 20.0, 29.0, 32.0, 40.0, 28.0, 49.0, 42.0, 51.0, 43.0, 52.0, 49.0, 51.0, 41.0, 40.0, 39.0, 35.0, 28.0, 33.0, 27.0, 26.0, 21.0, 18.0, 14.0, 19.0, 6.0, 10.0, 8.0, 9.0, 4.0, 2.0, 4.0, 1.0, 2.0, 5.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.48046875, -6.2762451171875, -6.072021484375, -5.8677978515625, -5.66357421875, -5.4593505859375, -5.255126953125, -5.0509033203125, -4.8466796875, -4.6424560546875, -4.438232421875, -4.2340087890625, -4.02978515625, -3.8255615234375, -3.621337890625, -3.4171142578125, -3.212890625, -3.0086669921875, -2.804443359375, -2.6002197265625, -2.39599609375, -2.1917724609375, -1.987548828125, -1.7833251953125, -1.5791015625, -1.3748779296875, -1.170654296875, -0.9664306640625, -0.76220703125, -0.5579833984375, -0.353759765625, -0.1495361328125, 0.0546875, 0.2589111328125, 0.463134765625, 0.6673583984375, 0.87158203125, 1.0758056640625, 1.280029296875, 1.4842529296875, 1.6884765625, 1.8927001953125, 2.096923828125, 2.3011474609375, 2.50537109375, 2.7095947265625, 2.913818359375, 3.1180419921875, 3.322265625, 3.5264892578125, 3.730712890625, 3.9349365234375, 4.13916015625, 4.3433837890625, 4.547607421875, 4.7518310546875, 4.9560546875, 5.1602783203125, 5.364501953125, 5.5687255859375, 5.77294921875, 5.9771728515625, 6.181396484375, 6.3856201171875, 6.58984375]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 3.0, 6.0, 8.0, 11.0, 19.0, 38.0, 61.0, 113.0, 126.0, 220.0, 343.0, 526.0, 918.0, 1411.0, 2338.0, 3987.0, 6693.0, 10912.0, 18701.0, 31519.0, 52230.0, 83363.0, 123434.0, 158283.0, 164265.0, 137488.0, 97026.0, 61693.0, 37246.0, 22289.0, 13161.0, 7984.0, 4676.0, 2899.0, 1767.0, 1027.0, 652.0, 428.0, 255.0, 163.0, 96.0, 52.0, 46.0, 33.0, 20.0, 14.0, 6.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0], "bins": [-5.46875, -5.3087158203125, -5.148681640625, -4.9886474609375, -4.82861328125, -4.6685791015625, -4.508544921875, -4.3485107421875, -4.1884765625, -4.0284423828125, -3.868408203125, -3.7083740234375, -3.54833984375, -3.3883056640625, -3.228271484375, -3.0682373046875, -2.908203125, -2.7481689453125, -2.588134765625, -2.4281005859375, -2.26806640625, -2.1080322265625, -1.947998046875, -1.7879638671875, -1.6279296875, -1.4678955078125, -1.307861328125, -1.1478271484375, -0.98779296875, -0.8277587890625, -0.667724609375, -0.5076904296875, -0.34765625, -0.1876220703125, -0.027587890625, 0.1324462890625, 0.29248046875, 0.4525146484375, 0.612548828125, 0.7725830078125, 0.9326171875, 1.0926513671875, 1.252685546875, 1.4127197265625, 1.57275390625, 1.7327880859375, 1.892822265625, 2.0528564453125, 2.212890625, 2.3729248046875, 2.532958984375, 2.6929931640625, 2.85302734375, 3.0130615234375, 3.173095703125, 3.3331298828125, 3.4931640625, 3.6531982421875, 3.813232421875, 3.9732666015625, 4.13330078125, 4.2933349609375, 4.453369140625, 4.6134033203125, 4.7734375]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 5.0, 10.0, 9.0, 6.0, 10.0, 12.0, 16.0, 19.0, 12.0, 22.0, 28.0, 26.0, 43.0, 37.0, 32.0, 45.0, 40.0, 26.0, 43.0, 29.0, 46.0, 47.0, 42.0, 39.0, 35.0, 35.0, 46.0, 44.0, 26.0, 22.0, 27.0, 13.0, 17.0, 25.0, 17.0, 5.0, 10.0, 10.0, 4.0, 6.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0], "bins": [-4.078125, -3.96002197265625, -3.8419189453125, -3.72381591796875, -3.605712890625, -3.48760986328125, -3.3695068359375, -3.25140380859375, -3.13330078125, -3.01519775390625, -2.8970947265625, -2.77899169921875, -2.660888671875, -2.54278564453125, -2.4246826171875, -2.30657958984375, -2.1884765625, -2.07037353515625, -1.9522705078125, -1.83416748046875, -1.716064453125, -1.59796142578125, -1.4798583984375, -1.36175537109375, -1.24365234375, -1.12554931640625, -1.0074462890625, -0.88934326171875, -0.771240234375, -0.65313720703125, -0.5350341796875, -0.41693115234375, -0.298828125, -0.18072509765625, -0.0626220703125, 0.05548095703125, 0.173583984375, 0.29168701171875, 0.4097900390625, 0.52789306640625, 0.64599609375, 0.76409912109375, 0.8822021484375, 1.00030517578125, 1.118408203125, 1.23651123046875, 1.3546142578125, 1.47271728515625, 1.5908203125, 1.70892333984375, 1.8270263671875, 1.94512939453125, 2.063232421875, 2.18133544921875, 2.2994384765625, 2.41754150390625, 2.53564453125, 2.65374755859375, 2.7718505859375, 2.88995361328125, 3.008056640625, 3.12615966796875, 3.2442626953125, 3.36236572265625, 3.48046875]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 3.0, 7.0, 6.0, 15.0, 9.0, 18.0, 23.0, 31.0, 54.0, 62.0, 91.0, 166.0, 218.0, 333.0, 478.0, 806.0, 1183.0, 1726.0, 2688.0, 4181.0, 6528.0, 10246.0, 16032.0, 25429.0, 40178.0, 63291.0, 95046.0, 133282.0, 157160.0, 149951.0, 116104.0, 80395.0, 52011.0, 33004.0, 20808.0, 13177.0, 8463.0, 5369.0, 3401.0, 2228.0, 1421.0, 954.0, 671.0, 410.0, 299.0, 175.0, 126.0, 90.0, 65.0, 44.0, 39.0, 16.0, 14.0, 17.0, 7.0, 9.0, 5.0, 1.0, 4.0, 2.0], "bins": [-1.4951171875, -1.4495086669921875, -1.403900146484375, -1.3582916259765625, -1.31268310546875, -1.2670745849609375, -1.221466064453125, -1.1758575439453125, -1.1302490234375, -1.0846405029296875, -1.039031982421875, -0.9934234619140625, -0.94781494140625, -0.9022064208984375, -0.856597900390625, -0.8109893798828125, -0.765380859375, -0.7197723388671875, -0.674163818359375, -0.6285552978515625, -0.58294677734375, -0.5373382568359375, -0.491729736328125, -0.4461212158203125, -0.4005126953125, -0.3549041748046875, -0.309295654296875, -0.2636871337890625, -0.21807861328125, -0.1724700927734375, -0.126861572265625, -0.0812530517578125, -0.03564453125, 0.0099639892578125, 0.055572509765625, 0.1011810302734375, 0.14678955078125, 0.1923980712890625, 0.238006591796875, 0.2836151123046875, 0.3292236328125, 0.3748321533203125, 0.420440673828125, 0.4660491943359375, 0.51165771484375, 0.5572662353515625, 0.602874755859375, 0.6484832763671875, 0.694091796875, 0.7397003173828125, 0.785308837890625, 0.8309173583984375, 0.87652587890625, 0.9221343994140625, 0.967742919921875, 1.0133514404296875, 1.0589599609375, 1.1045684814453125, 1.150177001953125, 1.1957855224609375, 1.24139404296875, 1.2870025634765625, 1.332611083984375, 1.3782196044921875, 1.423828125]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 3.0, 10.0, 8.0, 7.0, 13.0, 14.0, 19.0, 23.0, 33.0, 37.0, 41.0, 68.0, 59.0, 64.0, 65.0, 73.0, 79.0, 69.0, 67.0, 49.0, 50.0, 40.0, 24.0, 13.0, 23.0, 13.0, 9.0, 5.0, 6.0, 1.0, 5.0, 2.0, 2.0, 2.0, 6.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00017595291137695312, -0.00017096847295761108, -0.00016598403453826904, -0.000160999596118927, -0.00015601515769958496, -0.00015103071928024292, -0.00014604628086090088, -0.00014106184244155884, -0.0001360774040222168, -0.00013109296560287476, -0.00012610852718353271, -0.00012112408876419067, -0.00011613965034484863, -0.00011115521192550659, -0.00010617077350616455, -0.00010118633508682251, -9.620189666748047e-05, -9.121745824813843e-05, -8.623301982879639e-05, -8.124858140945435e-05, -7.62641429901123e-05, -7.127970457077026e-05, -6.629526615142822e-05, -6.131082773208618e-05, -5.632638931274414e-05, -5.13419508934021e-05, -4.635751247406006e-05, -4.137307405471802e-05, -3.6388635635375977e-05, -3.1404197216033936e-05, -2.6419758796691895e-05, -2.1435320377349854e-05, -1.6450881958007812e-05, -1.1466443538665771e-05, -6.4820051193237305e-06, -1.4975666999816895e-06, 3.4868717193603516e-06, 8.471310138702393e-06, 1.3455748558044434e-05, 1.8440186977386475e-05, 2.3424625396728516e-05, 2.8409063816070557e-05, 3.33935022354126e-05, 3.837794065475464e-05, 4.336237907409668e-05, 4.834681749343872e-05, 5.333125591278076e-05, 5.83156943321228e-05, 6.330013275146484e-05, 6.828457117080688e-05, 7.326900959014893e-05, 7.825344800949097e-05, 8.323788642883301e-05, 8.822232484817505e-05, 9.320676326751709e-05, 9.819120168685913e-05, 0.00010317564010620117, 0.00010816007852554321, 0.00011314451694488525, 0.0001181289553642273, 0.00012311339378356934, 0.00012809783220291138, 0.00013308227062225342, 0.00013806670904159546, 0.0001430511474609375]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 2.0, 9.0, 8.0, 9.0, 27.0, 20.0, 30.0, 57.0, 68.0, 99.0, 147.0, 224.0, 345.0, 490.0, 760.0, 1127.0, 1728.0, 2687.0, 4329.0, 6694.0, 10823.0, 17209.0, 28213.0, 45593.0, 71677.0, 108284.0, 147516.0, 164234.0, 145080.0, 104974.0, 69035.0, 43728.0, 27428.0, 16994.0, 10600.0, 6472.0, 4205.0, 2646.0, 1727.0, 1090.0, 753.0, 442.0, 316.0, 214.0, 149.0, 117.0, 64.0, 31.0, 38.0, 18.0, 8.0, 7.0, 9.0, 4.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-1.490234375, -1.44287109375, -1.3955078125, -1.34814453125, -1.30078125, -1.25341796875, -1.2060546875, -1.15869140625, -1.111328125, -1.06396484375, -1.0166015625, -0.96923828125, -0.921875, -0.87451171875, -0.8271484375, -0.77978515625, -0.732421875, -0.68505859375, -0.6376953125, -0.59033203125, -0.54296875, -0.49560546875, -0.4482421875, -0.40087890625, -0.353515625, -0.30615234375, -0.2587890625, -0.21142578125, -0.1640625, -0.11669921875, -0.0693359375, -0.02197265625, 0.025390625, 0.07275390625, 0.1201171875, 0.16748046875, 0.21484375, 0.26220703125, 0.3095703125, 0.35693359375, 0.404296875, 0.45166015625, 0.4990234375, 0.54638671875, 0.59375, 0.64111328125, 0.6884765625, 0.73583984375, 0.783203125, 0.83056640625, 0.8779296875, 0.92529296875, 0.97265625, 1.02001953125, 1.0673828125, 1.11474609375, 1.162109375, 1.20947265625, 1.2568359375, 1.30419921875, 1.3515625, 1.39892578125, 1.4462890625, 1.49365234375, 1.541015625]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 6.0, 7.0, 13.0, 7.0, 9.0, 17.0, 20.0, 21.0, 24.0, 33.0, 25.0, 38.0, 53.0, 52.0, 61.0, 56.0, 44.0, 60.0, 61.0, 51.0, 48.0, 53.0, 28.0, 40.0, 31.0, 27.0, 18.0, 17.0, 22.0, 7.0, 6.0, 9.0, 8.0, 10.0, 2.0, 5.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.76123046875, -0.7399444580078125, -0.718658447265625, -0.6973724365234375, -0.67608642578125, -0.6548004150390625, -0.633514404296875, -0.6122283935546875, -0.5909423828125, -0.5696563720703125, -0.548370361328125, -0.5270843505859375, -0.50579833984375, -0.4845123291015625, -0.463226318359375, -0.4419403076171875, -0.420654296875, -0.3993682861328125, -0.378082275390625, -0.3567962646484375, -0.33551025390625, -0.3142242431640625, -0.292938232421875, -0.2716522216796875, -0.2503662109375, -0.2290802001953125, -0.207794189453125, -0.1865081787109375, -0.16522216796875, -0.1439361572265625, -0.122650146484375, -0.1013641357421875, -0.080078125, -0.0587921142578125, -0.037506103515625, -0.0162200927734375, 0.00506591796875, 0.0263519287109375, 0.047637939453125, 0.0689239501953125, 0.0902099609375, 0.1114959716796875, 0.132781982421875, 0.1540679931640625, 0.17535400390625, 0.1966400146484375, 0.217926025390625, 0.2392120361328125, 0.260498046875, 0.2817840576171875, 0.303070068359375, 0.3243560791015625, 0.34564208984375, 0.3669281005859375, 0.388214111328125, 0.4095001220703125, 0.4307861328125, 0.4520721435546875, 0.473358154296875, 0.4946441650390625, 0.51593017578125, 0.5372161865234375, 0.558502197265625, 0.5797882080078125, 0.60107421875]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 4.0, 1.0, 1.0, 6.0, 6.0, 6.0, 11.0, 10.0, 19.0, 20.0, 25.0, 26.0, 37.0, 65.0, 56.0, 72.0, 79.0, 82.0, 85.0, 65.0, 75.0, 47.0, 36.0, 32.0, 33.0, 25.0, 17.0, 18.0, 9.0, 9.0, 2.0, 7.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.7593913078308105, -6.506035327911377, -6.252678871154785, -5.999322891235352, -5.745966911315918, -5.492610931396484, -5.239254474639893, -4.985898494720459, -4.732542037963867, -4.479186058044434, -4.225829601287842, -3.972473621368408, -3.7191176414489746, -3.465761423110962, -3.212405204772949, -2.9590492248535156, -2.705693244934082, -2.4523370265960693, -2.1989810466766357, -1.945624828338623, -1.6922687292099, -1.4389126300811768, -1.185556411743164, -0.9322003126144409, -0.6788442134857178, -0.42548808455467224, -0.1721319556236267, 0.08122420310974121, 0.33458030223846436, 0.5879364013671875, 0.8412926197052002, 1.0946487188339233, 1.3480052947998047, 1.6013613939285278, 1.854717493057251, 2.1080737113952637, 2.3614296913146973, 2.61478590965271, 2.8681421279907227, 3.1214981079101562, 3.374854326248169, 3.6282105445861816, 3.8815665245056152, 4.134922981262207, 4.388278961181641, 4.641634941101074, 4.894990921020508, 5.1483473777771, 5.401703357696533, 5.655059337615967, 5.908415794372559, 6.161771774291992, 6.415127754211426, 6.668483734130859, 6.921840190887451, 7.175196170806885, 7.428552627563477, 7.68190860748291, 7.935265064239502, 8.188621520996094, 8.441977500915527, 8.695333480834961, 8.948689460754395, 9.202045440673828, 9.455401420593262]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 5.0, 3.0, 2.0, 9.0, 12.0, 4.0, 11.0, 8.0, 18.0, 19.0, 16.0, 29.0, 34.0, 21.0, 38.0, 42.0, 37.0, 47.0, 43.0, 36.0, 61.0, 36.0, 46.0, 39.0, 34.0, 43.0, 36.0, 38.0, 33.0, 37.0, 27.0, 20.0, 21.0, 21.0, 9.0, 16.0, 11.0, 12.0, 8.0, 3.0, 7.0, 4.0, 2.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.229199409484863, -6.02313756942749, -5.817075729370117, -5.611013889312744, -5.404952049255371, -5.198890686035156, -4.992828369140625, -4.78676700592041, -4.580705165863037, -4.374643325805664, -4.168581485748291, -3.962519645690918, -3.756458044052124, -3.550396203994751, -3.344334363937378, -3.138272762298584, -2.932210683822632, -2.726148843765259, -2.5200870037078857, -2.314025402069092, -2.1079635620117188, -1.9019017219543457, -1.6958398818969727, -1.4897781610488892, -1.2837163209915161, -1.077654480934143, -0.8715927600860596, -0.6655309200286865, -0.45946913957595825, -0.25340735912323, -0.047345519065856934, 0.15871620178222656, 0.3647780418395996, 0.5708398222923279, 0.7769016027450562, 0.9829634428024292, 1.1890251636505127, 1.3950870037078857, 1.6011488437652588, 1.8072105646133423, 2.013272285461426, 2.219334125518799, 2.425395965576172, 2.631457805633545, 2.837519407272339, 3.043581247329712, 3.249643087387085, 3.455704689025879, 3.661766767501831, 3.867828607559204, 4.073890209197998, 4.279952049255371, 4.486013889312744, 4.692075729370117, 4.89813756942749, 5.104199409484863, 5.310261249542236, 5.516323089599609, 5.722384929656982, 5.9284467697143555, 6.1345086097717285, 6.340570449829102, 6.546631813049316, 6.7526936531066895, 6.9587554931640625]}, "gradients/decoder.bert.encoder.layer.9.output.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 4.0, 8.0, 6.0, 26.0, 25.0, 35.0, 72.0, 115.0, 183.0, 251.0, 379.0, 585.0, 889.0, 1355.0, 1983.0, 3029.0, 4540.0, 7040.0, 11178.0, 17533.0, 28381.0, 47868.0, 82955.0, 148181.0, 268813.0, 478774.0, 747412.0, 836751.0, 630833.0, 377315.0, 209767.0, 116887.0, 66739.0, 39135.0, 23894.0, 14580.0, 9316.0, 6037.0, 3794.0, 2543.0, 1691.0, 1100.0, 770.0, 534.0, 319.0, 219.0, 138.0, 107.0, 73.0, 47.0, 32.0, 16.0, 16.0, 11.0, 6.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0], "bins": [-5.1796875, -5.0086669921875, -4.837646484375, -4.6666259765625, -4.49560546875, -4.3245849609375, -4.153564453125, -3.9825439453125, -3.8115234375, -3.6405029296875, -3.469482421875, -3.2984619140625, -3.12744140625, -2.9564208984375, -2.785400390625, -2.6143798828125, -2.443359375, -2.2723388671875, -2.101318359375, -1.9302978515625, -1.75927734375, -1.5882568359375, -1.417236328125, -1.2462158203125, -1.0751953125, -0.9041748046875, -0.733154296875, -0.5621337890625, -0.39111328125, -0.2200927734375, -0.049072265625, 0.1219482421875, 0.29296875, 0.4639892578125, 0.635009765625, 0.8060302734375, 0.97705078125, 1.1480712890625, 1.319091796875, 1.4901123046875, 1.6611328125, 1.8321533203125, 2.003173828125, 2.1741943359375, 2.34521484375, 2.5162353515625, 2.687255859375, 2.8582763671875, 3.029296875, 3.2003173828125, 3.371337890625, 3.5423583984375, 3.71337890625, 3.8843994140625, 4.055419921875, 4.2264404296875, 4.3974609375, 4.5684814453125, 4.739501953125, 4.9105224609375, 5.08154296875, 5.2525634765625, 5.423583984375, 5.5946044921875, 5.765625]}, "gradients/decoder.bert.encoder.layer.9.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 4.0, 4.0, 10.0, 9.0, 6.0, 16.0, 10.0, 17.0, 17.0, 21.0, 29.0, 34.0, 40.0, 39.0, 39.0, 44.0, 43.0, 44.0, 51.0, 55.0, 41.0, 49.0, 43.0, 46.0, 49.0, 34.0, 33.0, 26.0, 23.0, 25.0, 22.0, 17.0, 15.0, 11.0, 10.0, 6.0, 4.0, 4.0, 4.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.515625, -4.36102294921875, -4.2064208984375, -4.05181884765625, -3.897216796875, -3.74261474609375, -3.5880126953125, -3.43341064453125, -3.27880859375, -3.12420654296875, -2.9696044921875, -2.81500244140625, -2.660400390625, -2.50579833984375, -2.3511962890625, -2.19659423828125, -2.0419921875, -1.88739013671875, -1.7327880859375, -1.57818603515625, -1.423583984375, -1.26898193359375, -1.1143798828125, -0.95977783203125, -0.80517578125, -0.65057373046875, -0.4959716796875, -0.34136962890625, -0.186767578125, -0.03216552734375, 0.1224365234375, 0.27703857421875, 0.431640625, 0.58624267578125, 0.7408447265625, 0.89544677734375, 1.050048828125, 1.20465087890625, 1.3592529296875, 1.51385498046875, 1.66845703125, 1.82305908203125, 1.9776611328125, 2.13226318359375, 2.286865234375, 2.44146728515625, 2.5960693359375, 2.75067138671875, 2.9052734375, 3.05987548828125, 3.2144775390625, 3.36907958984375, 3.523681640625, 3.67828369140625, 3.8328857421875, 3.98748779296875, 4.14208984375, 4.29669189453125, 4.4512939453125, 4.60589599609375, 4.760498046875, 4.91510009765625, 5.0697021484375, 5.22430419921875, 5.37890625]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 2.0, 7.0, 5.0, 13.0, 12.0, 33.0, 23.0, 57.0, 72.0, 145.0, 206.0, 309.0, 505.0, 793.0, 1349.0, 2223.0, 3624.0, 6175.0, 10468.0, 18666.0, 33048.0, 60139.0, 110117.0, 202438.0, 365177.0, 602586.0, 807134.0, 760932.0, 526721.0, 307726.0, 168059.0, 90976.0, 49725.0, 27258.0, 15471.0, 8891.0, 5114.0, 3102.0, 1903.0, 1146.0, 712.0, 432.0, 319.0, 177.0, 106.0, 60.0, 37.0, 33.0, 33.0, 14.0, 5.0, 8.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0], "bins": [-5.63671875, -5.4539794921875, -5.271240234375, -5.0885009765625, -4.90576171875, -4.7230224609375, -4.540283203125, -4.3575439453125, -4.1748046875, -3.9920654296875, -3.809326171875, -3.6265869140625, -3.44384765625, -3.2611083984375, -3.078369140625, -2.8956298828125, -2.712890625, -2.5301513671875, -2.347412109375, -2.1646728515625, -1.98193359375, -1.7991943359375, -1.616455078125, -1.4337158203125, -1.2509765625, -1.0682373046875, -0.885498046875, -0.7027587890625, -0.52001953125, -0.3372802734375, -0.154541015625, 0.0281982421875, 0.2109375, 0.3936767578125, 0.576416015625, 0.7591552734375, 0.94189453125, 1.1246337890625, 1.307373046875, 1.4901123046875, 1.6728515625, 1.8555908203125, 2.038330078125, 2.2210693359375, 2.40380859375, 2.5865478515625, 2.769287109375, 2.9520263671875, 3.134765625, 3.3175048828125, 3.500244140625, 3.6829833984375, 3.86572265625, 4.0484619140625, 4.231201171875, 4.4139404296875, 4.5966796875, 4.7794189453125, 4.962158203125, 5.1448974609375, 5.32763671875, 5.5103759765625, 5.693115234375, 5.8758544921875, 6.05859375]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 4.0, 3.0, 4.0, 5.0, 7.0, 6.0, 22.0, 22.0, 24.0, 46.0, 61.0, 86.0, 91.0, 113.0, 148.0, 147.0, 174.0, 263.0, 240.0, 262.0, 261.0, 275.0, 291.0, 238.0, 222.0, 178.0, 180.0, 125.0, 122.0, 81.0, 63.0, 67.0, 53.0, 48.0, 25.0, 22.0, 21.0, 16.0, 12.0, 14.0, 8.0, 6.0, 4.0, 7.0, 2.0, 4.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.240234375, -2.161590576171875, -2.08294677734375, -2.004302978515625, -1.9256591796875, -1.847015380859375, -1.76837158203125, -1.689727783203125, -1.611083984375, -1.532440185546875, -1.45379638671875, -1.375152587890625, -1.2965087890625, -1.217864990234375, -1.13922119140625, -1.060577392578125, -0.98193359375, -0.903289794921875, -0.82464599609375, -0.746002197265625, -0.6673583984375, -0.588714599609375, -0.51007080078125, -0.431427001953125, -0.352783203125, -0.274139404296875, -0.19549560546875, -0.116851806640625, -0.0382080078125, 0.040435791015625, 0.11907958984375, 0.197723388671875, 0.2763671875, 0.355010986328125, 0.43365478515625, 0.512298583984375, 0.5909423828125, 0.669586181640625, 0.74822998046875, 0.826873779296875, 0.905517578125, 0.984161376953125, 1.06280517578125, 1.141448974609375, 1.2200927734375, 1.298736572265625, 1.37738037109375, 1.456024169921875, 1.53466796875, 1.613311767578125, 1.69195556640625, 1.770599365234375, 1.8492431640625, 1.927886962890625, 2.00653076171875, 2.085174560546875, 2.163818359375, 2.242462158203125, 2.32110595703125, 2.399749755859375, 2.4783935546875, 2.557037353515625, 2.63568115234375, 2.714324951171875, 2.79296875]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 7.0, 3.0, 7.0, 8.0, 11.0, 11.0, 28.0, 36.0, 36.0, 41.0, 48.0, 60.0, 83.0, 70.0, 82.0, 83.0, 74.0, 53.0, 68.0, 38.0, 28.0, 28.0, 23.0, 16.0, 10.0, 12.0, 6.0, 7.0, 4.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-7.344273567199707, -7.0862016677856445, -6.828129768371582, -6.5700578689575195, -6.311985969543457, -6.0539140701293945, -5.79584264755249, -5.537770748138428, -5.279698848724365, -5.021626949310303, -4.76355504989624, -4.505483150482178, -4.247411727905273, -3.989339590072632, -3.7312679290771484, -3.473196029663086, -3.2151241302490234, -2.957052230834961, -2.6989803314208984, -2.440908670425415, -2.1828367710113525, -1.92476487159729, -1.666693091392517, -1.4086213111877441, -1.1505494117736816, -0.8924775719642639, -0.6344057321548462, -0.37633389234542847, -0.11826205253601074, 0.13980984687805176, 0.3978816270828247, 0.6559534072875977, 0.9140253067016602, 1.1720972061157227, 1.4301689863204956, 1.6882407665252686, 1.946312665939331, 2.2043845653533936, 2.462456226348877, 2.7205281257629395, 2.978600025177002, 3.2366719245910645, 3.494743824005127, 3.7528154850006104, 4.010887145996094, 4.268959045410156, 4.527030944824219, 4.785102844238281, 5.043174743652344, 5.301246643066406, 5.559318542480469, 5.817390441894531, 6.075462341308594, 6.333534240722656, 6.5916056632995605, 6.849677562713623, 7.1077494621276855, 7.365821361541748, 7.6238932609558105, 7.881965160369873, 8.140036582946777, 8.39810848236084, 8.656180381774902, 8.914252281188965, 9.172324180603027]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 6.0, 5.0, 4.0, 8.0, 9.0, 12.0, 17.0, 8.0, 18.0, 24.0, 28.0, 27.0, 30.0, 34.0, 27.0, 35.0, 40.0, 49.0, 38.0, 38.0, 40.0, 43.0, 38.0, 40.0, 39.0, 39.0, 35.0, 33.0, 31.0, 36.0, 23.0, 24.0, 23.0, 17.0, 18.0, 12.0, 11.0, 9.0, 10.0, 7.0, 7.0, 4.0, 5.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-6.433184623718262, -6.238821983337402, -6.044459342956543, -5.850096702575684, -5.655734062194824, -5.461371421813965, -5.2670087814331055, -5.072646141052246, -4.878283500671387, -4.683920860290527, -4.489558219909668, -4.295195579528809, -4.100832939147949, -3.90647029876709, -3.7121076583862305, -3.517745018005371, -3.3233823776245117, -3.1290197372436523, -2.934657096862793, -2.7402944564819336, -2.545931816101074, -2.351569175720215, -2.1572065353393555, -1.962843894958496, -1.7684812545776367, -1.5741186141967773, -1.379755973815918, -1.1853933334350586, -0.9910306930541992, -0.7966680526733398, -0.6023054122924805, -0.4079427719116211, -0.21358060836791992, -0.019217967987060547, 0.17514467239379883, 0.3695073127746582, 0.5638699531555176, 0.758232593536377, 0.9525952339172363, 1.1469578742980957, 1.341320514678955, 1.5356831550598145, 1.7300457954406738, 1.9244084358215332, 2.1187710762023926, 2.313133716583252, 2.5074963569641113, 2.7018589973449707, 2.89622163772583, 3.0905842781066895, 3.284946918487549, 3.479309558868408, 3.6736721992492676, 3.868034839630127, 4.062397480010986, 4.256760120391846, 4.451122760772705, 4.6454854011535645, 4.839848041534424, 5.034210681915283, 5.228573322296143, 5.422935962677002, 5.617298603057861, 5.811661243438721, 6.00602388381958]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 10.0, 20.0, 16.0, 39.0, 43.0, 71.0, 114.0, 216.0, 290.0, 551.0, 892.0, 1344.0, 2182.0, 3541.0, 5931.0, 9606.0, 15954.0, 26471.0, 44191.0, 73672.0, 123272.0, 190442.0, 201535.0, 138772.0, 83679.0, 50048.0, 29566.0, 17856.0, 10978.0, 6724.0, 4080.0, 2435.0, 1516.0, 928.0, 606.0, 357.0, 231.0, 148.0, 73.0, 57.0, 32.0, 21.0, 15.0, 9.0, 8.0, 4.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.7900390625, -0.7638092041015625, -0.737579345703125, -0.7113494873046875, -0.68511962890625, -0.6588897705078125, -0.632659912109375, -0.6064300537109375, -0.5802001953125, -0.5539703369140625, -0.527740478515625, -0.5015106201171875, -0.47528076171875, -0.4490509033203125, -0.422821044921875, -0.3965911865234375, -0.370361328125, -0.3441314697265625, -0.317901611328125, -0.2916717529296875, -0.26544189453125, -0.2392120361328125, -0.212982177734375, -0.1867523193359375, -0.1605224609375, -0.1342926025390625, -0.108062744140625, -0.0818328857421875, -0.05560302734375, -0.0293731689453125, -0.003143310546875, 0.0230865478515625, 0.04931640625, 0.0755462646484375, 0.101776123046875, 0.1280059814453125, 0.15423583984375, 0.1804656982421875, 0.206695556640625, 0.2329254150390625, 0.2591552734375, 0.2853851318359375, 0.311614990234375, 0.3378448486328125, 0.36407470703125, 0.3903045654296875, 0.416534423828125, 0.4427642822265625, 0.468994140625, 0.4952239990234375, 0.521453857421875, 0.5476837158203125, 0.57391357421875, 0.6001434326171875, 0.626373291015625, 0.6526031494140625, 0.6788330078125, 0.7050628662109375, 0.731292724609375, 0.7575225830078125, 0.78375244140625, 0.8099822998046875, 0.836212158203125, 0.8624420166015625, 0.888671875]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 4.0, 5.0, 3.0, 13.0, 10.0, 15.0, 12.0, 27.0, 15.0, 18.0, 30.0, 33.0, 40.0, 37.0, 34.0, 40.0, 30.0, 38.0, 53.0, 47.0, 34.0, 42.0, 37.0, 41.0, 34.0, 33.0, 35.0, 32.0, 34.0, 36.0, 18.0, 18.0, 23.0, 12.0, 12.0, 10.0, 11.0, 8.0, 6.0, 6.0, 5.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-7.109375, -6.90667724609375, -6.7039794921875, -6.50128173828125, -6.298583984375, -6.09588623046875, -5.8931884765625, -5.69049072265625, -5.48779296875, -5.28509521484375, -5.0823974609375, -4.87969970703125, -4.677001953125, -4.47430419921875, -4.2716064453125, -4.06890869140625, -3.8662109375, -3.66351318359375, -3.4608154296875, -3.25811767578125, -3.055419921875, -2.85272216796875, -2.6500244140625, -2.44732666015625, -2.24462890625, -2.04193115234375, -1.8392333984375, -1.63653564453125, -1.433837890625, -1.23114013671875, -1.0284423828125, -0.82574462890625, -0.623046875, -0.42034912109375, -0.2176513671875, -0.01495361328125, 0.187744140625, 0.39044189453125, 0.5931396484375, 0.79583740234375, 0.99853515625, 1.20123291015625, 1.4039306640625, 1.60662841796875, 1.809326171875, 2.01202392578125, 2.2147216796875, 2.41741943359375, 2.6201171875, 2.82281494140625, 3.0255126953125, 3.22821044921875, 3.430908203125, 3.63360595703125, 3.8363037109375, 4.03900146484375, 4.24169921875, 4.44439697265625, 4.6470947265625, 4.84979248046875, 5.052490234375, 5.25518798828125, 5.4578857421875, 5.66058349609375, 5.86328125]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 2.0, 4.0, 5.0, 11.0, 16.0, 19.0, 37.0, 48.0, 74.0, 106.0, 154.0, 221.0, 291.0, 476.0, 650.0, 944.0, 1491.0, 2182.0, 3094.0, 4563.0, 6956.0, 10342.0, 15376.0, 23442.0, 35315.0, 52524.0, 78418.0, 113678.0, 153288.0, 159650.0, 124529.0, 86058.0, 57991.0, 38882.0, 25896.0, 17071.0, 11497.0, 7549.0, 4996.0, 3389.0, 2311.0, 1569.0, 1090.0, 724.0, 498.0, 352.0, 262.0, 172.0, 106.0, 80.0, 58.0, 32.0, 34.0, 17.0, 12.0, 5.0, 7.0, 4.0, 1.0, 0.0, 1.0], "bins": [-0.7001953125, -0.6783981323242188, -0.6566009521484375, -0.6348037719726562, -0.613006591796875, -0.5912094116210938, -0.5694122314453125, -0.5476150512695312, -0.52581787109375, -0.5040206909179688, -0.4822235107421875, -0.46042633056640625, -0.438629150390625, -0.41683197021484375, -0.3950347900390625, -0.37323760986328125, -0.3514404296875, -0.32964324951171875, -0.3078460693359375, -0.28604888916015625, -0.264251708984375, -0.24245452880859375, -0.2206573486328125, -0.19886016845703125, -0.17706298828125, -0.15526580810546875, -0.1334686279296875, -0.11167144775390625, -0.089874267578125, -0.06807708740234375, -0.0462799072265625, -0.02448272705078125, -0.002685546875, 0.01911163330078125, 0.0409088134765625, 0.06270599365234375, 0.084503173828125, 0.10630035400390625, 0.1280975341796875, 0.14989471435546875, 0.17169189453125, 0.19348907470703125, 0.2152862548828125, 0.23708343505859375, 0.258880615234375, 0.28067779541015625, 0.3024749755859375, 0.32427215576171875, 0.3460693359375, 0.36786651611328125, 0.3896636962890625, 0.41146087646484375, 0.433258056640625, 0.45505523681640625, 0.4768524169921875, 0.49864959716796875, 0.52044677734375, 0.5422439575195312, 0.5640411376953125, 0.5858383178710938, 0.607635498046875, 0.6294326782226562, 0.6512298583984375, 0.6730270385742188, 0.69482421875]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 3.0, 4.0, 5.0, 5.0, 10.0, 12.0, 8.0, 15.0, 15.0, 21.0, 22.0, 22.0, 23.0, 31.0, 23.0, 23.0, 35.0, 47.0, 40.0, 42.0, 46.0, 46.0, 38.0, 43.0, 34.0, 47.0, 27.0, 46.0, 35.0, 28.0, 26.0, 29.0, 29.0, 23.0, 14.0, 18.0, 12.0, 9.0, 11.0, 13.0, 6.0, 6.0, 7.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.529296875, -3.408416748046875, -3.28753662109375, -3.166656494140625, -3.0457763671875, -2.924896240234375, -2.80401611328125, -2.683135986328125, -2.562255859375, -2.441375732421875, -2.32049560546875, -2.199615478515625, -2.0787353515625, -1.957855224609375, -1.83697509765625, -1.716094970703125, -1.59521484375, -1.474334716796875, -1.35345458984375, -1.232574462890625, -1.1116943359375, -0.990814208984375, -0.86993408203125, -0.749053955078125, -0.628173828125, -0.507293701171875, -0.38641357421875, -0.265533447265625, -0.1446533203125, -0.023773193359375, 0.09710693359375, 0.217987060546875, 0.3388671875, 0.459747314453125, 0.58062744140625, 0.701507568359375, 0.8223876953125, 0.943267822265625, 1.06414794921875, 1.185028076171875, 1.305908203125, 1.426788330078125, 1.54766845703125, 1.668548583984375, 1.7894287109375, 1.910308837890625, 2.03118896484375, 2.152069091796875, 2.27294921875, 2.393829345703125, 2.51470947265625, 2.635589599609375, 2.7564697265625, 2.877349853515625, 2.99822998046875, 3.119110107421875, 3.239990234375, 3.360870361328125, 3.48175048828125, 3.602630615234375, 3.7235107421875, 3.844390869140625, 3.96527099609375, 4.086151123046875, 4.20703125]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 6.0, 8.0, 8.0, 16.0, 18.0, 50.0, 67.0, 129.0, 200.0, 359.0, 703.0, 1346.0, 2886.0, 6185.0, 14793.0, 38250.0, 108596.0, 313986.0, 359015.0, 127214.0, 44328.0, 16836.0, 7182.0, 3171.0, 1473.0, 742.0, 427.0, 247.0, 130.0, 77.0, 44.0, 21.0, 14.0, 11.0, 8.0, 6.0, 7.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08642578125, -0.08323383331298828, -0.08004188537597656, -0.07684993743896484, -0.07365798950195312, -0.0704660415649414, -0.06727409362792969, -0.06408214569091797, -0.06089019775390625, -0.05769824981689453, -0.05450630187988281, -0.051314353942871094, -0.048122406005859375, -0.044930458068847656, -0.04173851013183594, -0.03854656219482422, -0.0353546142578125, -0.03216266632080078, -0.028970718383789062, -0.025778770446777344, -0.022586822509765625, -0.019394874572753906, -0.016202926635742188, -0.013010978698730469, -0.00981903076171875, -0.006627082824707031, -0.0034351348876953125, -0.00024318695068359375, 0.002948760986328125, 0.006140708923339844, 0.009332656860351562, 0.012524604797363281, 0.015716552734375, 0.01890850067138672, 0.022100448608398438, 0.025292396545410156, 0.028484344482421875, 0.031676292419433594, 0.03486824035644531, 0.03806018829345703, 0.04125213623046875, 0.04444408416748047, 0.04763603210449219, 0.050827980041503906, 0.054019927978515625, 0.057211875915527344, 0.06040382385253906, 0.06359577178955078, 0.0667877197265625, 0.06997966766357422, 0.07317161560058594, 0.07636356353759766, 0.07955551147460938, 0.0827474594116211, 0.08593940734863281, 0.08913135528564453, 0.09232330322265625, 0.09551525115966797, 0.09870719909667969, 0.1018991470336914, 0.10509109497070312, 0.10828304290771484, 0.11147499084472656, 0.11466693878173828, 0.11785888671875]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 2.0, 6.0, 1.0, 4.0, 6.0, 6.0, 9.0, 8.0, 11.0, 16.0, 13.0, 14.0, 46.0, 28.0, 35.0, 51.0, 51.0, 46.0, 52.0, 43.0, 51.0, 59.0, 59.0, 37.0, 44.0, 46.0, 34.0, 33.0, 35.0, 33.0, 23.0, 14.0, 19.0, 10.0, 10.0, 8.0, 11.0, 10.0, 4.0, 3.0, 3.0, 4.0, 0.0, 2.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.119510650634766e-06, -8.818693459033966e-06, -8.517876267433167e-06, -8.217059075832367e-06, -7.916241884231567e-06, -7.615424692630768e-06, -7.314607501029968e-06, -7.013790309429169e-06, -6.712973117828369e-06, -6.41215592622757e-06, -6.11133873462677e-06, -5.8105215430259705e-06, -5.509704351425171e-06, -5.208887159824371e-06, -4.908069968223572e-06, -4.607252776622772e-06, -4.306435585021973e-06, -4.005618393421173e-06, -3.7048012018203735e-06, -3.403984010219574e-06, -3.1031668186187744e-06, -2.802349627017975e-06, -2.5015324354171753e-06, -2.2007152438163757e-06, -1.8998980522155762e-06, -1.5990808606147766e-06, -1.298263669013977e-06, -9.974464774131775e-07, -6.966292858123779e-07, -3.9581209421157837e-07, -9.499490261077881e-08, 2.0582228899002075e-07, 5.066394805908203e-07, 8.074566721916199e-07, 1.1082738637924194e-06, 1.409091055393219e-06, 1.7099082469940186e-06, 2.010725438594818e-06, 2.3115426301956177e-06, 2.6123598217964172e-06, 2.913177013397217e-06, 3.2139942049980164e-06, 3.514811396598816e-06, 3.8156285881996155e-06, 4.116445779800415e-06, 4.417262971401215e-06, 4.718080163002014e-06, 5.018897354602814e-06, 5.319714546203613e-06, 5.620531737804413e-06, 5.921348929405212e-06, 6.222166121006012e-06, 6.5229833126068115e-06, 6.823800504207611e-06, 7.124617695808411e-06, 7.42543488740921e-06, 7.72625207901001e-06, 8.02706927061081e-06, 8.327886462211609e-06, 8.628703653812408e-06, 8.929520845413208e-06, 9.230338037014008e-06, 9.531155228614807e-06, 9.831972420215607e-06, 1.0132789611816406e-05]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 9.0, 11.0, 25.0, 26.0, 36.0, 51.0, 80.0, 126.0, 184.0, 250.0, 391.0, 621.0, 873.0, 1329.0, 2069.0, 3205.0, 5101.0, 8216.0, 13434.0, 22852.0, 41302.0, 76651.0, 147000.0, 263399.0, 212942.0, 110727.0, 58496.0, 31545.0, 18264.0, 10807.0, 6651.0, 4089.0, 2603.0, 1743.0, 1147.0, 754.0, 495.0, 345.0, 228.0, 158.0, 104.0, 70.0, 45.0, 33.0, 29.0, 15.0, 7.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0], "bins": [-0.0718994140625, -0.06963729858398438, -0.06737518310546875, -0.06511306762695312, -0.0628509521484375, -0.060588836669921875, -0.05832672119140625, -0.056064605712890625, -0.053802490234375, -0.051540374755859375, -0.04927825927734375, -0.047016143798828125, -0.0447540283203125, -0.042491912841796875, -0.04022979736328125, -0.037967681884765625, -0.03570556640625, -0.033443450927734375, -0.03118133544921875, -0.028919219970703125, -0.0266571044921875, -0.024394989013671875, -0.02213287353515625, -0.019870758056640625, -0.017608642578125, -0.015346527099609375, -0.01308441162109375, -0.010822296142578125, -0.0085601806640625, -0.006298065185546875, -0.00403594970703125, -0.001773834228515625, 0.00048828125, 0.002750396728515625, 0.00501251220703125, 0.007274627685546875, 0.0095367431640625, 0.011798858642578125, 0.01406097412109375, 0.016323089599609375, 0.018585205078125, 0.020847320556640625, 0.02310943603515625, 0.025371551513671875, 0.0276336669921875, 0.029895782470703125, 0.03215789794921875, 0.034420013427734375, 0.03668212890625, 0.038944244384765625, 0.04120635986328125, 0.043468475341796875, 0.0457305908203125, 0.047992706298828125, 0.05025482177734375, 0.052516937255859375, 0.054779052734375, 0.057041168212890625, 0.05930328369140625, 0.061565399169921875, 0.0638275146484375, 0.06608963012695312, 0.06835174560546875, 0.07061386108398438, 0.0728759765625]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 5.0, 6.0, 8.0, 6.0, 17.0, 10.0, 12.0, 19.0, 15.0, 25.0, 38.0, 38.0, 31.0, 55.0, 36.0, 57.0, 64.0, 61.0, 77.0, 75.0, 62.0, 45.0, 21.0, 42.0, 36.0, 18.0, 16.0, 16.0, 15.0, 12.0, 13.0, 13.0, 10.0, 6.0, 9.0, 0.0, 3.0, 5.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0241241455078125, -0.023389577865600586, -0.022655010223388672, -0.021920442581176758, -0.021185874938964844, -0.02045130729675293, -0.019716739654541016, -0.0189821720123291, -0.018247604370117188, -0.017513036727905273, -0.01677846908569336, -0.016043901443481445, -0.015309333801269531, -0.014574766159057617, -0.013840198516845703, -0.013105630874633789, -0.012371063232421875, -0.011636495590209961, -0.010901927947998047, -0.010167360305786133, -0.009432792663574219, -0.008698225021362305, -0.00796365737915039, -0.0072290897369384766, -0.0064945220947265625, -0.0057599544525146484, -0.005025386810302734, -0.00429081916809082, -0.0035562515258789062, -0.002821683883666992, -0.002087116241455078, -0.001352548599243164, -0.00061798095703125, 0.00011658668518066406, 0.0008511543273925781, 0.0015857219696044922, 0.0023202896118164062, 0.0030548572540283203, 0.0037894248962402344, 0.0045239925384521484, 0.0052585601806640625, 0.0059931278228759766, 0.006727695465087891, 0.007462263107299805, 0.008196830749511719, 0.008931398391723633, 0.009665966033935547, 0.010400533676147461, 0.011135101318359375, 0.011869668960571289, 0.012604236602783203, 0.013338804244995117, 0.014073371887207031, 0.014807939529418945, 0.01554250717163086, 0.016277074813842773, 0.017011642456054688, 0.0177462100982666, 0.018480777740478516, 0.01921534538269043, 0.019949913024902344, 0.020684480667114258, 0.021419048309326172, 0.022153615951538086, 0.02288818359375]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 9.0, 3.0, 6.0, 10.0, 5.0, 11.0, 20.0, 40.0, 37.0, 33.0, 48.0, 60.0, 78.0, 63.0, 83.0, 75.0, 87.0, 63.0, 62.0, 38.0, 40.0, 24.0, 20.0, 27.0, 10.0, 9.0, 10.0, 5.0, 4.0, 9.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-7.416112899780273, -7.15893030166626, -6.901747703552246, -6.644565105438232, -6.387382507324219, -6.130199909210205, -5.873017311096191, -5.615835189819336, -5.358652114868164, -5.10146951675415, -4.844286918640137, -4.587104320526123, -4.329921722412109, -4.072739124298096, -3.815556764602661, -3.5583741664886475, -3.301191806793213, -3.044009208679199, -2.7868266105651855, -2.529644012451172, -2.272461414337158, -2.0152788162231445, -1.75809645652771, -1.5009138584136963, -1.2437312602996826, -0.986548662185669, -0.7293661236763, -0.47218358516693115, -0.21500098705291748, 0.04218161106109619, 0.2993640899658203, 0.556546688079834, 0.8137292861938477, 1.0709118843078613, 1.328094482421875, 1.5852769613265991, 1.8424595594406128, 2.099642276763916, 2.3568246364593506, 2.6140072345733643, 2.871189832687378, 3.1283724308013916, 3.3855550289154053, 3.64273738861084, 3.8999199867248535, 4.157102584838867, 4.414285182952881, 4.6714677810668945, 4.928650379180908, 5.185832977294922, 5.4430155754089355, 5.700198173522949, 5.957380771636963, 6.214563369750977, 6.471745491027832, 6.728928565979004, 6.986110687255859, 7.243293285369873, 7.500475883483887, 7.7576584815979, 8.014841079711914, 8.27202320098877, 8.529206275939941, 8.786388397216797, 9.043571472167969]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 6.0, 4.0, 5.0, 8.0, 9.0, 11.0, 18.0, 8.0, 16.0, 26.0, 26.0, 26.0, 31.0, 36.0, 25.0, 36.0, 38.0, 52.0, 38.0, 38.0, 39.0, 44.0, 36.0, 41.0, 40.0, 38.0, 35.0, 34.0, 29.0, 36.0, 25.0, 23.0, 23.0, 17.0, 19.0, 12.0, 11.0, 9.0, 10.0, 7.0, 7.0, 4.0, 5.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-6.437732696533203, -6.243539333343506, -6.049345970153809, -5.855152606964111, -5.660959243774414, -5.466766357421875, -5.272572994232178, -5.0783796310424805, -4.884186267852783, -4.689992904663086, -4.495799541473389, -4.301606178283691, -4.107413291931152, -3.913219690322876, -3.719026565551758, -3.5248332023620605, -3.3306398391723633, -3.136446475982666, -2.9422531127929688, -2.7480599880218506, -2.5538666248321533, -2.359673261642456, -2.165480136871338, -1.9712867736816406, -1.7770934104919434, -1.582900047302246, -1.3887068033218384, -1.1945135593414307, -1.0003201961517334, -0.8061268925666809, -0.6119335889816284, -0.4177403450012207, -0.22354745864868164, -0.02935415506362915, 0.16483914852142334, 0.35903245210647583, 0.5532257556915283, 0.7474190592765808, 0.9416123628616333, 1.135805606842041, 1.3299989700317383, 1.5241923332214355, 1.7183855772018433, 1.912578821182251, 2.1067721843719482, 2.3009655475616455, 2.4951586723327637, 2.689352035522461, 2.883545398712158, 3.0777387619018555, 3.2719321250915527, 3.466125249862671, 3.660318613052368, 3.8545119762420654, 4.048705101013184, 4.242898464202881, 4.437091827392578, 4.631285190582275, 4.825478553771973, 5.01967191696167, 5.213865280151367, 5.408058166503906, 5.6022515296936035, 5.796444892883301, 5.990638256072998]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 8.0, 10.0, 22.0, 32.0, 49.0, 63.0, 127.0, 177.0, 275.0, 437.0, 665.0, 1093.0, 1676.0, 2577.0, 4135.0, 6356.0, 10066.0, 16021.0, 25163.0, 39593.0, 60449.0, 89406.0, 121685.0, 143438.0, 144146.0, 121278.0, 89227.0, 61153.0, 39854.0, 25264.0, 16096.0, 10163.0, 6524.0, 4062.0, 2560.0, 1640.0, 1056.0, 697.0, 442.0, 289.0, 204.0, 137.0, 80.0, 47.0, 41.0, 31.0, 16.0, 11.0, 8.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.33203125, -4.19232177734375, -4.0526123046875, -3.91290283203125, -3.773193359375, -3.63348388671875, -3.4937744140625, -3.35406494140625, -3.21435546875, -3.07464599609375, -2.9349365234375, -2.79522705078125, -2.655517578125, -2.51580810546875, -2.3760986328125, -2.23638916015625, -2.0966796875, -1.95697021484375, -1.8172607421875, -1.67755126953125, -1.537841796875, -1.39813232421875, -1.2584228515625, -1.11871337890625, -0.97900390625, -0.83929443359375, -0.6995849609375, -0.55987548828125, -0.420166015625, -0.28045654296875, -0.1407470703125, -0.00103759765625, 0.138671875, 0.27838134765625, 0.4180908203125, 0.55780029296875, 0.697509765625, 0.83721923828125, 0.9769287109375, 1.11663818359375, 1.25634765625, 1.39605712890625, 1.5357666015625, 1.67547607421875, 1.815185546875, 1.95489501953125, 2.0946044921875, 2.23431396484375, 2.3740234375, 2.51373291015625, 2.6534423828125, 2.79315185546875, 2.932861328125, 3.07257080078125, 3.2122802734375, 3.35198974609375, 3.49169921875, 3.63140869140625, 3.7711181640625, 3.91082763671875, 4.050537109375, 4.19024658203125, 4.3299560546875, 4.46966552734375, 4.609375]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 6.0, 3.0, 1.0, 2.0, 0.0, 7.0, 10.0, 7.0, 10.0, 13.0, 18.0, 20.0, 37.0, 19.0, 28.0, 31.0, 36.0, 42.0, 41.0, 52.0, 50.0, 43.0, 34.0, 51.0, 38.0, 40.0, 43.0, 43.0, 35.0, 32.0, 37.0, 30.0, 26.0, 21.0, 12.0, 18.0, 17.0, 14.0, 13.0, 7.0, 10.0, 7.0, 3.0, 0.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.47265625, -7.25872802734375, -7.0447998046875, -6.83087158203125, -6.616943359375, -6.40301513671875, -6.1890869140625, -5.97515869140625, -5.76123046875, -5.54730224609375, -5.3333740234375, -5.11944580078125, -4.905517578125, -4.69158935546875, -4.4776611328125, -4.26373291015625, -4.0498046875, -3.83587646484375, -3.6219482421875, -3.40802001953125, -3.194091796875, -2.98016357421875, -2.7662353515625, -2.55230712890625, -2.33837890625, -2.12445068359375, -1.9105224609375, -1.69659423828125, -1.482666015625, -1.26873779296875, -1.0548095703125, -0.84088134765625, -0.626953125, -0.41302490234375, -0.1990966796875, 0.01483154296875, 0.228759765625, 0.44268798828125, 0.6566162109375, 0.87054443359375, 1.08447265625, 1.29840087890625, 1.5123291015625, 1.72625732421875, 1.940185546875, 2.15411376953125, 2.3680419921875, 2.58197021484375, 2.7958984375, 3.00982666015625, 3.2237548828125, 3.43768310546875, 3.651611328125, 3.86553955078125, 4.0794677734375, 4.29339599609375, 4.50732421875, 4.72125244140625, 4.9351806640625, 5.14910888671875, 5.363037109375, 5.57696533203125, 5.7908935546875, 6.00482177734375, 6.21875]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 10.0, 19.0, 12.0, 22.0, 39.0, 61.0, 82.0, 101.0, 186.0, 278.0, 438.0, 601.0, 958.0, 1581.0, 2358.0, 3716.0, 5925.0, 9184.0, 14675.0, 23055.0, 36347.0, 56246.0, 83333.0, 115425.0, 141442.0, 145281.0, 127041.0, 95759.0, 65875.0, 42895.0, 27713.0, 17491.0, 10934.0, 7013.0, 4473.0, 2818.0, 1834.0, 1149.0, 770.0, 519.0, 317.0, 223.0, 116.0, 81.0, 51.0, 42.0, 18.0, 17.0, 9.0, 10.0, 8.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0], "bins": [-4.58984375, -4.447265625, -4.3046875, -4.162109375, -4.01953125, -3.876953125, -3.734375, -3.591796875, -3.44921875, -3.306640625, -3.1640625, -3.021484375, -2.87890625, -2.736328125, -2.59375, -2.451171875, -2.30859375, -2.166015625, -2.0234375, -1.880859375, -1.73828125, -1.595703125, -1.453125, -1.310546875, -1.16796875, -1.025390625, -0.8828125, -0.740234375, -0.59765625, -0.455078125, -0.3125, -0.169921875, -0.02734375, 0.115234375, 0.2578125, 0.400390625, 0.54296875, 0.685546875, 0.828125, 0.970703125, 1.11328125, 1.255859375, 1.3984375, 1.541015625, 1.68359375, 1.826171875, 1.96875, 2.111328125, 2.25390625, 2.396484375, 2.5390625, 2.681640625, 2.82421875, 2.966796875, 3.109375, 3.251953125, 3.39453125, 3.537109375, 3.6796875, 3.822265625, 3.96484375, 4.107421875, 4.25, 4.392578125, 4.53515625]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 7.0, 6.0, 10.0, 12.0, 7.0, 14.0, 18.0, 16.0, 20.0, 30.0, 24.0, 28.0, 23.0, 40.0, 41.0, 39.0, 51.0, 39.0, 47.0, 54.0, 48.0, 53.0, 42.0, 42.0, 40.0, 26.0, 31.0, 43.0, 21.0, 27.0, 17.0, 23.0, 7.0, 9.0, 15.0, 11.0, 9.0, 7.0, 4.0, 5.0, 3.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.67578125, -4.5389404296875, -4.402099609375, -4.2652587890625, -4.12841796875, -3.9915771484375, -3.854736328125, -3.7178955078125, -3.5810546875, -3.4442138671875, -3.307373046875, -3.1705322265625, -3.03369140625, -2.8968505859375, -2.760009765625, -2.6231689453125, -2.486328125, -2.3494873046875, -2.212646484375, -2.0758056640625, -1.93896484375, -1.8021240234375, -1.665283203125, -1.5284423828125, -1.3916015625, -1.2547607421875, -1.117919921875, -0.9810791015625, -0.84423828125, -0.7073974609375, -0.570556640625, -0.4337158203125, -0.296875, -0.1600341796875, -0.023193359375, 0.1136474609375, 0.25048828125, 0.3873291015625, 0.524169921875, 0.6610107421875, 0.7978515625, 0.9346923828125, 1.071533203125, 1.2083740234375, 1.34521484375, 1.4820556640625, 1.618896484375, 1.7557373046875, 1.892578125, 2.0294189453125, 2.166259765625, 2.3031005859375, 2.43994140625, 2.5767822265625, 2.713623046875, 2.8504638671875, 2.9873046875, 3.1241455078125, 3.260986328125, 3.3978271484375, 3.53466796875, 3.6715087890625, 3.808349609375, 3.9451904296875, 4.08203125]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 9.0, 6.0, 9.0, 11.0, 22.0, 25.0, 21.0, 40.0, 64.0, 84.0, 119.0, 144.0, 211.0, 296.0, 411.0, 558.0, 834.0, 1259.0, 1910.0, 2965.0, 4968.0, 8524.0, 14724.0, 26733.0, 50907.0, 96005.0, 167086.0, 223449.0, 191289.0, 116202.0, 62571.0, 32584.0, 17948.0, 10111.0, 5844.0, 3592.0, 2284.0, 1429.0, 1001.0, 649.0, 484.0, 325.0, 233.0, 172.0, 130.0, 73.0, 66.0, 59.0, 50.0, 27.0, 13.0, 9.0, 10.0, 8.0, 6.0, 1.0, 1.0, 2.0], "bins": [-2.392578125, -2.321502685546875, -2.25042724609375, -2.179351806640625, -2.1082763671875, -2.037200927734375, -1.96612548828125, -1.895050048828125, -1.823974609375, -1.752899169921875, -1.68182373046875, -1.610748291015625, -1.5396728515625, -1.468597412109375, -1.39752197265625, -1.326446533203125, -1.25537109375, -1.184295654296875, -1.11322021484375, -1.042144775390625, -0.9710693359375, -0.899993896484375, -0.82891845703125, -0.757843017578125, -0.686767578125, -0.615692138671875, -0.54461669921875, -0.473541259765625, -0.4024658203125, -0.331390380859375, -0.26031494140625, -0.189239501953125, -0.1181640625, -0.047088623046875, 0.02398681640625, 0.095062255859375, 0.1661376953125, 0.237213134765625, 0.30828857421875, 0.379364013671875, 0.450439453125, 0.521514892578125, 0.59259033203125, 0.663665771484375, 0.7347412109375, 0.805816650390625, 0.87689208984375, 0.947967529296875, 1.01904296875, 1.090118408203125, 1.16119384765625, 1.232269287109375, 1.3033447265625, 1.374420166015625, 1.44549560546875, 1.516571044921875, 1.587646484375, 1.658721923828125, 1.72979736328125, 1.800872802734375, 1.8719482421875, 1.943023681640625, 2.01409912109375, 2.085174560546875, 2.15625]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 6.0, 10.0, 6.0, 7.0, 8.0, 14.0, 21.0, 24.0, 46.0, 43.0, 62.0, 81.0, 95.0, 89.0, 93.0, 86.0, 75.0, 52.0, 41.0, 28.0, 31.0, 18.0, 30.0, 10.0, 6.0, 11.0, 2.0, 6.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0002903938293457031, -0.00028291717171669006, -0.000275440514087677, -0.00026796385645866394, -0.0002604871988296509, -0.0002530105412006378, -0.00024553388357162476, -0.0002380572259426117, -0.00023058056831359863, -0.00022310391068458557, -0.0002156272530555725, -0.00020815059542655945, -0.0002006739377975464, -0.00019319728016853333, -0.00018572062253952026, -0.0001782439649105072, -0.00017076730728149414, -0.00016329064965248108, -0.00015581399202346802, -0.00014833733439445496, -0.0001408606767654419, -0.00013338401913642883, -0.00012590736150741577, -0.00011843070387840271, -0.00011095404624938965, -0.00010347738862037659, -9.600073099136353e-05, -8.852407336235046e-05, -8.10474157333374e-05, -7.357075810432434e-05, -6.609410047531128e-05, -5.861744284629822e-05, -5.1140785217285156e-05, -4.3664127588272095e-05, -3.618746995925903e-05, -2.871081233024597e-05, -2.123415470123291e-05, -1.3757497072219849e-05, -6.280839443206787e-06, 1.1958181858062744e-06, 8.672475814819336e-06, 1.6149133443832397e-05, 2.362579107284546e-05, 3.110244870185852e-05, 3.857910633087158e-05, 4.6055763959884644e-05, 5.3532421588897705e-05, 6.1009079217910767e-05, 6.848573684692383e-05, 7.596239447593689e-05, 8.343905210494995e-05, 9.091570973396301e-05, 9.839236736297607e-05, 0.00010586902499198914, 0.0001133456826210022, 0.00012082234025001526, 0.00012829899787902832, 0.00013577565550804138, 0.00014325231313705444, 0.0001507289707660675, 0.00015820562839508057, 0.00016568228602409363, 0.0001731589436531067, 0.00018063560128211975, 0.0001881122589111328]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 1.0, 4.0, 6.0, 3.0, 9.0, 16.0, 21.0, 40.0, 66.0, 105.0, 144.0, 225.0, 335.0, 573.0, 863.0, 1406.0, 2408.0, 4019.0, 7248.0, 13330.0, 25797.0, 50868.0, 98948.0, 176237.0, 235169.0, 194238.0, 113414.0, 58471.0, 29907.0, 15266.0, 8086.0, 4440.0, 2550.0, 1600.0, 1027.0, 598.0, 403.0, 269.0, 163.0, 99.0, 69.0, 48.0, 29.0, 13.0, 15.0, 2.0, 6.0, 4.0, 1.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1640625, -2.088409423828125, -2.01275634765625, -1.937103271484375, -1.8614501953125, -1.785797119140625, -1.71014404296875, -1.634490966796875, -1.558837890625, -1.483184814453125, -1.40753173828125, -1.331878662109375, -1.2562255859375, -1.180572509765625, -1.10491943359375, -1.029266357421875, -0.95361328125, -0.877960205078125, -0.80230712890625, -0.726654052734375, -0.6510009765625, -0.575347900390625, -0.49969482421875, -0.424041748046875, -0.348388671875, -0.272735595703125, -0.19708251953125, -0.121429443359375, -0.0457763671875, 0.029876708984375, 0.10552978515625, 0.181182861328125, 0.2568359375, 0.332489013671875, 0.40814208984375, 0.483795166015625, 0.5594482421875, 0.635101318359375, 0.71075439453125, 0.786407470703125, 0.862060546875, 0.937713623046875, 1.01336669921875, 1.089019775390625, 1.1646728515625, 1.240325927734375, 1.31597900390625, 1.391632080078125, 1.46728515625, 1.542938232421875, 1.61859130859375, 1.694244384765625, 1.7698974609375, 1.845550537109375, 1.92120361328125, 1.996856689453125, 2.072509765625, 2.148162841796875, 2.22381591796875, 2.299468994140625, 2.3751220703125, 2.450775146484375, 2.52642822265625, 2.602081298828125, 2.677734375]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 7.0, 3.0, 10.0, 11.0, 18.0, 19.0, 23.0, 20.0, 29.0, 42.0, 49.0, 54.0, 51.0, 77.0, 59.0, 86.0, 58.0, 72.0, 51.0, 44.0, 35.0, 45.0, 28.0, 30.0, 16.0, 21.0, 12.0, 7.0, 10.0, 4.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.646484375, -0.6176910400390625, -0.588897705078125, -0.5601043701171875, -0.53131103515625, -0.5025177001953125, -0.473724365234375, -0.4449310302734375, -0.4161376953125, -0.3873443603515625, -0.358551025390625, -0.3297576904296875, -0.30096435546875, -0.2721710205078125, -0.243377685546875, -0.2145843505859375, -0.185791015625, -0.1569976806640625, -0.128204345703125, -0.0994110107421875, -0.07061767578125, -0.0418243408203125, -0.013031005859375, 0.0157623291015625, 0.0445556640625, 0.0733489990234375, 0.102142333984375, 0.1309356689453125, 0.15972900390625, 0.1885223388671875, 0.217315673828125, 0.2461090087890625, 0.27490234375, 0.3036956787109375, 0.332489013671875, 0.3612823486328125, 0.39007568359375, 0.4188690185546875, 0.447662353515625, 0.4764556884765625, 0.5052490234375, 0.5340423583984375, 0.562835693359375, 0.5916290283203125, 0.62042236328125, 0.6492156982421875, 0.678009033203125, 0.7068023681640625, 0.735595703125, 0.7643890380859375, 0.793182373046875, 0.8219757080078125, 0.85076904296875, 0.8795623779296875, 0.908355712890625, 0.9371490478515625, 0.9659423828125, 0.9947357177734375, 1.023529052734375, 1.0523223876953125, 1.08111572265625, 1.1099090576171875, 1.138702392578125, 1.1674957275390625, 1.1962890625]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 6.0, 3.0, 4.0, 5.0, 6.0, 9.0, 14.0, 21.0, 29.0, 39.0, 48.0, 58.0, 61.0, 80.0, 81.0, 86.0, 70.0, 65.0, 67.0, 64.0, 47.0, 30.0, 26.0, 22.0, 11.0, 12.0, 8.0, 6.0, 6.0, 3.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.717831134796143, -7.445763111114502, -7.173694610595703, -6.9016265869140625, -6.629558563232422, -6.357490539550781, -6.085422515869141, -5.813354015350342, -5.541285991668701, -5.2692179679870605, -4.997149467468262, -4.725081443786621, -4.4530134201049805, -4.18094539642334, -3.90887713432312, -3.6368088722229004, -3.3647408485412598, -3.092672824859619, -2.8206045627593994, -2.5485363006591797, -2.276468276977539, -2.0044002532958984, -1.7323319911956787, -1.4602638483047485, -1.1881957054138184, -0.9161275625228882, -0.644059419631958, -0.37199127674102783, -0.09992313385009766, 0.17214500904083252, 0.4442131519317627, 0.7162812948226929, 0.9883489608764648, 1.260417103767395, 1.5324852466583252, 1.8045533895492554, 2.0766215324401855, 2.348689556121826, 2.620757818222046, 2.8928260803222656, 3.1648941040039062, 3.436962127685547, 3.7090303897857666, 3.9810986518859863, 4.253166675567627, 4.525234699249268, 4.797303199768066, 5.069371223449707, 5.341439247131348, 5.613507270812988, 5.885575294494629, 6.157643795013428, 6.429711818695068, 6.701779842376709, 6.973848342895508, 7.245916366577148, 7.517984390258789, 7.79005241394043, 8.06212043762207, 8.334188461303711, 8.606256484985352, 8.878325462341309, 9.15039348602295, 9.42246150970459, 9.69452953338623]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 5.0, 4.0, 2.0, 6.0, 6.0, 6.0, 8.0, 12.0, 16.0, 9.0, 21.0, 20.0, 28.0, 32.0, 28.0, 35.0, 31.0, 22.0, 35.0, 35.0, 39.0, 54.0, 44.0, 37.0, 35.0, 32.0, 27.0, 39.0, 43.0, 44.0, 34.0, 30.0, 31.0, 31.0, 16.0, 13.0, 8.0, 15.0, 14.0, 11.0, 9.0, 8.0, 7.0, 8.0, 7.0, 4.0, 4.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.051273345947266, -5.852762222290039, -5.6542510986328125, -5.455739974975586, -5.257228851318359, -5.058718204498291, -4.8602070808410645, -4.661695957183838, -4.463184833526611, -4.264673709869385, -4.066162586212158, -3.8676517009735107, -3.669140577316284, -3.4706294536590576, -3.27211856842041, -3.0736074447631836, -2.875096321105957, -2.6765851974487305, -2.478074073791504, -2.2795631885528564, -2.08105206489563, -1.8825409412384033, -1.6840299367904663, -1.4855189323425293, -1.2870078086853027, -1.0884966850280762, -0.8899856805801392, -0.6914746165275574, -0.4929635524749756, -0.2944524884223938, -0.09594142436981201, 0.102569580078125, 0.30108070373535156, 0.49959176778793335, 0.6981028318405151, 0.8966138958930969, 1.0951249599456787, 1.2936360836029053, 1.4921470880508423, 1.6906580924987793, 1.8891692161560059, 2.0876803398132324, 2.286191463470459, 2.4847023487091064, 2.683213472366333, 2.8817245960235596, 3.080235481262207, 3.2787466049194336, 3.47725772857666, 3.6757688522338867, 3.8742799758911133, 4.07279109954834, 4.271302223205566, 4.469812870025635, 4.668323993682861, 4.866835117340088, 5.0653462409973145, 5.263857364654541, 5.462368488311768, 5.660879611968994, 5.8593902587890625, 6.057901382446289, 6.256412506103516, 6.454923629760742, 6.653434753417969]}, "gradients/decoder.bert.encoder.layer.8.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 7.0, 6.0, 5.0, 8.0, 17.0, 20.0, 23.0, 55.0, 98.0, 136.0, 202.0, 366.0, 597.0, 1051.0, 1692.0, 2910.0, 5206.0, 9292.0, 16707.0, 31463.0, 60920.0, 124381.0, 263669.0, 551567.0, 960850.0, 992261.0, 593703.0, 287872.0, 138526.0, 68889.0, 36046.0, 19617.0, 10651.0, 6241.0, 3676.0, 2159.0, 1328.0, 784.0, 535.0, 307.0, 170.0, 113.0, 69.0, 41.0, 24.0, 18.0, 2.0, 8.0, 5.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-7.65234375, -7.427734375, -7.203125, -6.978515625, -6.75390625, -6.529296875, -6.3046875, -6.080078125, -5.85546875, -5.630859375, -5.40625, -5.181640625, -4.95703125, -4.732421875, -4.5078125, -4.283203125, -4.05859375, -3.833984375, -3.609375, -3.384765625, -3.16015625, -2.935546875, -2.7109375, -2.486328125, -2.26171875, -2.037109375, -1.8125, -1.587890625, -1.36328125, -1.138671875, -0.9140625, -0.689453125, -0.46484375, -0.240234375, -0.015625, 0.208984375, 0.43359375, 0.658203125, 0.8828125, 1.107421875, 1.33203125, 1.556640625, 1.78125, 2.005859375, 2.23046875, 2.455078125, 2.6796875, 2.904296875, 3.12890625, 3.353515625, 3.578125, 3.802734375, 4.02734375, 4.251953125, 4.4765625, 4.701171875, 4.92578125, 5.150390625, 5.375, 5.599609375, 5.82421875, 6.048828125, 6.2734375, 6.498046875, 6.72265625]}, "gradients/decoder.bert.encoder.layer.8.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 3.0, 4.0, 5.0, 4.0, 5.0, 5.0, 7.0, 9.0, 11.0, 14.0, 19.0, 24.0, 21.0, 22.0, 35.0, 31.0, 36.0, 37.0, 33.0, 45.0, 42.0, 43.0, 41.0, 29.0, 36.0, 36.0, 47.0, 35.0, 34.0, 44.0, 28.0, 27.0, 40.0, 25.0, 22.0, 19.0, 10.0, 17.0, 13.0, 7.0, 9.0, 2.0, 15.0, 4.0, 4.0, 1.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.09765625, -3.9586181640625, -3.819580078125, -3.6805419921875, -3.54150390625, -3.4024658203125, -3.263427734375, -3.1243896484375, -2.9853515625, -2.8463134765625, -2.707275390625, -2.5682373046875, -2.42919921875, -2.2901611328125, -2.151123046875, -2.0120849609375, -1.873046875, -1.7340087890625, -1.594970703125, -1.4559326171875, -1.31689453125, -1.1778564453125, -1.038818359375, -0.8997802734375, -0.7607421875, -0.6217041015625, -0.482666015625, -0.3436279296875, -0.20458984375, -0.0655517578125, 0.073486328125, 0.2125244140625, 0.3515625, 0.4906005859375, 0.629638671875, 0.7686767578125, 0.90771484375, 1.0467529296875, 1.185791015625, 1.3248291015625, 1.4638671875, 1.6029052734375, 1.741943359375, 1.8809814453125, 2.02001953125, 2.1590576171875, 2.298095703125, 2.4371337890625, 2.576171875, 2.7152099609375, 2.854248046875, 2.9932861328125, 3.13232421875, 3.2713623046875, 3.410400390625, 3.5494384765625, 3.6884765625, 3.8275146484375, 3.966552734375, 4.1055908203125, 4.24462890625, 4.3836669921875, 4.522705078125, 4.6617431640625, 4.80078125]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 7.0, 12.0, 13.0, 19.0, 44.0, 67.0, 115.0, 152.0, 275.0, 410.0, 623.0, 937.0, 1601.0, 2492.0, 4133.0, 6840.0, 11144.0, 19366.0, 33481.0, 59050.0, 103426.0, 182297.0, 314475.0, 509274.0, 707126.0, 747845.0, 589168.0, 379345.0, 223074.0, 126732.0, 71687.0, 40847.0, 23305.0, 13785.0, 8136.0, 4953.0, 3024.0, 1828.0, 1133.0, 726.0, 489.0, 293.0, 200.0, 97.0, 102.0, 48.0, 26.0, 24.0, 18.0, 8.0, 6.0, 6.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.59375, -5.419921875, -5.24609375, -5.072265625, -4.8984375, -4.724609375, -4.55078125, -4.376953125, -4.203125, -4.029296875, -3.85546875, -3.681640625, -3.5078125, -3.333984375, -3.16015625, -2.986328125, -2.8125, -2.638671875, -2.46484375, -2.291015625, -2.1171875, -1.943359375, -1.76953125, -1.595703125, -1.421875, -1.248046875, -1.07421875, -0.900390625, -0.7265625, -0.552734375, -0.37890625, -0.205078125, -0.03125, 0.142578125, 0.31640625, 0.490234375, 0.6640625, 0.837890625, 1.01171875, 1.185546875, 1.359375, 1.533203125, 1.70703125, 1.880859375, 2.0546875, 2.228515625, 2.40234375, 2.576171875, 2.75, 2.923828125, 3.09765625, 3.271484375, 3.4453125, 3.619140625, 3.79296875, 3.966796875, 4.140625, 4.314453125, 4.48828125, 4.662109375, 4.8359375, 5.009765625, 5.18359375, 5.357421875, 5.53125]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 4.0, 3.0, 5.0, 4.0, 3.0, 4.0, 5.0, 8.0, 17.0, 12.0, 27.0, 32.0, 39.0, 44.0, 64.0, 73.0, 100.0, 108.0, 133.0, 169.0, 198.0, 221.0, 218.0, 266.0, 242.0, 247.0, 215.0, 233.0, 204.0, 184.0, 147.0, 157.0, 132.0, 84.0, 88.0, 71.0, 62.0, 48.0, 43.0, 37.0, 30.0, 19.0, 26.0, 14.0, 12.0, 5.0, 10.0, 1.0, 3.0, 1.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.169921875, -2.097137451171875, -2.02435302734375, -1.951568603515625, -1.8787841796875, -1.805999755859375, -1.73321533203125, -1.660430908203125, -1.587646484375, -1.514862060546875, -1.44207763671875, -1.369293212890625, -1.2965087890625, -1.223724365234375, -1.15093994140625, -1.078155517578125, -1.00537109375, -0.932586669921875, -0.85980224609375, -0.787017822265625, -0.7142333984375, -0.641448974609375, -0.56866455078125, -0.495880126953125, -0.423095703125, -0.350311279296875, -0.27752685546875, -0.204742431640625, -0.1319580078125, -0.059173583984375, 0.01361083984375, 0.086395263671875, 0.1591796875, 0.231964111328125, 0.30474853515625, 0.377532958984375, 0.4503173828125, 0.523101806640625, 0.59588623046875, 0.668670654296875, 0.741455078125, 0.814239501953125, 0.88702392578125, 0.959808349609375, 1.0325927734375, 1.105377197265625, 1.17816162109375, 1.250946044921875, 1.32373046875, 1.396514892578125, 1.46929931640625, 1.542083740234375, 1.6148681640625, 1.687652587890625, 1.76043701171875, 1.833221435546875, 1.906005859375, 1.978790283203125, 2.05157470703125, 2.124359130859375, 2.1971435546875, 2.269927978515625, 2.34271240234375, 2.415496826171875, 2.48828125]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 3.0, 8.0, 8.0, 10.0, 15.0, 18.0, 22.0, 38.0, 51.0, 56.0, 93.0, 94.0, 103.0, 111.0, 85.0, 66.0, 52.0, 38.0, 38.0, 26.0, 24.0, 13.0, 6.0, 10.0, 3.0, 7.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.555540561676025, -6.2271342277526855, -5.898727893829346, -5.570322036743164, -5.241915702819824, -4.913509368896484, -4.5851030349731445, -4.256696701049805, -3.928290605545044, -3.599884271621704, -3.2714781761169434, -2.9430718421936035, -2.6146655082702637, -2.286259412765503, -1.957853078842163, -1.6294469833374023, -1.3010406494140625, -0.9726344347000122, -0.6442281603813171, -0.31582188606262207, 0.012584328651428223, 0.3409905433654785, 0.6693968772888184, 0.9978029727935791, 1.326209306716919, 1.6546155214309692, 1.9830217361450195, 2.3114280700683594, 2.639834403991699, 2.96824049949646, 3.2966468334198, 3.6250529289245605, 3.953458786010742, 4.281865119934082, 4.610271453857422, 4.938677787780762, 5.267083644866943, 5.595489978790283, 5.923896312713623, 6.252302169799805, 6.5807085037231445, 6.909114837646484, 7.237521171569824, 7.565927505493164, 7.894333362579346, 8.222740173339844, 8.551145553588867, 8.879551887512207, 9.207958221435547, 9.536364555358887, 9.864770889282227, 10.193177223205566, 10.521583557128906, 10.84998893737793, 11.178396224975586, 11.50680160522461, 11.835208892822266, 12.163615226745605, 12.492021560668945, 12.820427894592285, 13.148834228515625, 13.477239608764648, 13.805646896362305, 14.134052276611328, 14.462458610534668]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 8.0, 2.0, 3.0, 10.0, 9.0, 16.0, 11.0, 13.0, 25.0, 28.0, 25.0, 42.0, 38.0, 36.0, 48.0, 62.0, 48.0, 33.0, 52.0, 48.0, 54.0, 52.0, 61.0, 38.0, 46.0, 34.0, 29.0, 16.0, 35.0, 21.0, 7.0, 14.0, 13.0, 12.0, 10.0, 3.0, 2.0, 4.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.35279655456543, -8.111002922058105, -7.8692097663879395, -7.627416133880615, -7.385622501373291, -7.143829345703125, -6.902035713195801, -6.660242080688477, -6.418448448181152, -6.176654815673828, -5.934861660003662, -5.693068027496338, -5.451274394989014, -5.209481239318848, -4.967687606811523, -4.725893974304199, -4.484100818634033, -4.242307186126709, -4.000514030456543, -3.7587203979492188, -3.5169267654418945, -3.2751333713531494, -3.0333399772644043, -2.79154634475708, -2.549752950668335, -2.30795955657959, -2.0661659240722656, -1.8243725299835205, -1.5825790166854858, -1.3407855033874512, -1.098992109298706, -0.8571985960006714, -0.6154046058654785, -0.37361112236976624, -0.13181763887405396, 0.10997581481933594, 0.3517693281173706, 0.5935628414154053, 0.8353562355041504, 1.077149748802185, 1.3189432621002197, 1.5607367753982544, 1.802530288696289, 2.044323682785034, 2.2861170768737793, 2.5279107093811035, 2.7697041034698486, 3.0114974975585938, 3.253291130065918, 3.495084524154663, 3.7368781566619873, 3.9786715507507324, 4.220465183258057, 4.462258338928223, 4.704051971435547, 4.945845603942871, 5.187639236450195, 5.4294328689575195, 5.6712260246276855, 5.91301965713501, 6.154813289642334, 6.3966064453125, 6.638400077819824, 6.880193710327148, 7.1219868659973145]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 6.0, 7.0, 19.0, 28.0, 23.0, 41.0, 46.0, 73.0, 121.0, 182.0, 287.0, 388.0, 587.0, 895.0, 1288.0, 1906.0, 2991.0, 4493.0, 6680.0, 10643.0, 16717.0, 25882.0, 40519.0, 63290.0, 96665.0, 142369.0, 176174.0, 153189.0, 106840.0, 70004.0, 45166.0, 28694.0, 18269.0, 11729.0, 7639.0, 4997.0, 3127.0, 2137.0, 1393.0, 993.0, 644.0, 449.0, 312.0, 205.0, 145.0, 87.0, 67.0, 54.0, 39.0, 20.0, 12.0, 11.0, 8.0, 5.0, 3.0, 2.0], "bins": [-0.84228515625, -0.8179550170898438, -0.7936248779296875, -0.7692947387695312, -0.744964599609375, -0.7206344604492188, -0.6963043212890625, -0.6719741821289062, -0.64764404296875, -0.6233139038085938, -0.5989837646484375, -0.5746536254882812, -0.550323486328125, -0.5259933471679688, -0.5016632080078125, -0.47733306884765625, -0.4530029296875, -0.42867279052734375, -0.4043426513671875, -0.38001251220703125, -0.355682373046875, -0.33135223388671875, -0.3070220947265625, -0.28269195556640625, -0.25836181640625, -0.23403167724609375, -0.2097015380859375, -0.18537139892578125, -0.161041259765625, -0.13671112060546875, -0.1123809814453125, -0.08805084228515625, -0.063720703125, -0.03939056396484375, -0.0150604248046875, 0.00926971435546875, 0.033599853515625, 0.05792999267578125, 0.0822601318359375, 0.10659027099609375, 0.13092041015625, 0.15525054931640625, 0.1795806884765625, 0.20391082763671875, 0.228240966796875, 0.25257110595703125, 0.2769012451171875, 0.30123138427734375, 0.3255615234375, 0.34989166259765625, 0.3742218017578125, 0.39855194091796875, 0.422882080078125, 0.44721221923828125, 0.4715423583984375, 0.49587249755859375, 0.52020263671875, 0.5445327758789062, 0.5688629150390625, 0.5931930541992188, 0.617523193359375, 0.6418533325195312, 0.6661834716796875, 0.6905136108398438, 0.71484375]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 8.0, 4.0, 9.0, 8.0, 17.0, 15.0, 14.0, 13.0, 24.0, 25.0, 33.0, 21.0, 31.0, 36.0, 51.0, 42.0, 41.0, 36.0, 56.0, 49.0, 49.0, 33.0, 51.0, 44.0, 36.0, 40.0, 39.0, 31.0, 27.0, 20.0, 21.0, 11.0, 22.0, 5.0, 11.0, 8.0, 6.0, 6.0, 6.0, 1.0, 0.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0], "bins": [-8.0859375, -7.86273193359375, -7.6395263671875, -7.41632080078125, -7.193115234375, -6.96990966796875, -6.7467041015625, -6.52349853515625, -6.30029296875, -6.07708740234375, -5.8538818359375, -5.63067626953125, -5.407470703125, -5.18426513671875, -4.9610595703125, -4.73785400390625, -4.5146484375, -4.29144287109375, -4.0682373046875, -3.84503173828125, -3.621826171875, -3.39862060546875, -3.1754150390625, -2.95220947265625, -2.72900390625, -2.50579833984375, -2.2825927734375, -2.05938720703125, -1.836181640625, -1.61297607421875, -1.3897705078125, -1.16656494140625, -0.943359375, -0.72015380859375, -0.4969482421875, -0.27374267578125, -0.050537109375, 0.17266845703125, 0.3958740234375, 0.61907958984375, 0.84228515625, 1.06549072265625, 1.2886962890625, 1.51190185546875, 1.735107421875, 1.95831298828125, 2.1815185546875, 2.40472412109375, 2.6279296875, 2.85113525390625, 3.0743408203125, 3.29754638671875, 3.520751953125, 3.74395751953125, 3.9671630859375, 4.19036865234375, 4.41357421875, 4.63677978515625, 4.8599853515625, 5.08319091796875, 5.306396484375, 5.52960205078125, 5.7528076171875, 5.97601318359375, 6.19921875]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 4.0, 7.0, 10.0, 11.0, 18.0, 26.0, 34.0, 56.0, 78.0, 124.0, 195.0, 310.0, 454.0, 734.0, 1156.0, 1961.0, 3247.0, 5236.0, 8889.0, 15176.0, 25423.0, 43745.0, 74765.0, 127723.0, 197057.0, 206199.0, 137603.0, 81837.0, 48091.0, 27944.0, 16024.0, 9736.0, 5667.0, 3425.0, 2167.0, 1284.0, 757.0, 489.0, 300.0, 185.0, 136.0, 95.0, 60.0, 46.0, 20.0, 19.0, 18.0, 11.0, 3.0, 7.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.064453125, -1.0332183837890625, -1.001983642578125, -0.9707489013671875, -0.93951416015625, -0.9082794189453125, -0.877044677734375, -0.8458099365234375, -0.8145751953125, -0.7833404541015625, -0.752105712890625, -0.7208709716796875, -0.68963623046875, -0.6584014892578125, -0.627166748046875, -0.5959320068359375, -0.564697265625, -0.5334625244140625, -0.502227783203125, -0.4709930419921875, -0.43975830078125, -0.4085235595703125, -0.377288818359375, -0.3460540771484375, -0.3148193359375, -0.2835845947265625, -0.252349853515625, -0.2211151123046875, -0.18988037109375, -0.1586456298828125, -0.127410888671875, -0.0961761474609375, -0.06494140625, -0.0337066650390625, -0.002471923828125, 0.0287628173828125, 0.05999755859375, 0.0912322998046875, 0.122467041015625, 0.1537017822265625, 0.1849365234375, 0.2161712646484375, 0.247406005859375, 0.2786407470703125, 0.30987548828125, 0.3411102294921875, 0.372344970703125, 0.4035797119140625, 0.434814453125, 0.4660491943359375, 0.497283935546875, 0.5285186767578125, 0.55975341796875, 0.5909881591796875, 0.622222900390625, 0.6534576416015625, 0.6846923828125, 0.7159271240234375, 0.747161865234375, 0.7783966064453125, 0.80963134765625, 0.8408660888671875, 0.872100830078125, 0.9033355712890625, 0.9345703125]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 4.0, 1.0, 6.0, 6.0, 4.0, 3.0, 10.0, 16.0, 7.0, 6.0, 15.0, 14.0, 19.0, 30.0, 32.0, 30.0, 45.0, 39.0, 33.0, 40.0, 45.0, 37.0, 36.0, 40.0, 39.0, 38.0, 32.0, 30.0, 52.0, 37.0, 46.0, 26.0, 30.0, 22.0, 30.0, 20.0, 14.0, 19.0, 11.0, 11.0, 8.0, 7.0, 3.0, 6.0, 6.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.482421875, -3.356964111328125, -3.23150634765625, -3.106048583984375, -2.9805908203125, -2.855133056640625, -2.72967529296875, -2.604217529296875, -2.478759765625, -2.353302001953125, -2.22784423828125, -2.102386474609375, -1.9769287109375, -1.851470947265625, -1.72601318359375, -1.600555419921875, -1.47509765625, -1.349639892578125, -1.22418212890625, -1.098724365234375, -0.9732666015625, -0.847808837890625, -0.72235107421875, -0.596893310546875, -0.471435546875, -0.345977783203125, -0.22052001953125, -0.095062255859375, 0.0303955078125, 0.155853271484375, 0.28131103515625, 0.406768798828125, 0.5322265625, 0.657684326171875, 0.78314208984375, 0.908599853515625, 1.0340576171875, 1.159515380859375, 1.28497314453125, 1.410430908203125, 1.535888671875, 1.661346435546875, 1.78680419921875, 1.912261962890625, 2.0377197265625, 2.163177490234375, 2.28863525390625, 2.414093017578125, 2.53955078125, 2.665008544921875, 2.79046630859375, 2.915924072265625, 3.0413818359375, 3.166839599609375, 3.29229736328125, 3.417755126953125, 3.543212890625, 3.668670654296875, 3.79412841796875, 3.919586181640625, 4.0450439453125, 4.170501708984375, 4.29595947265625, 4.421417236328125, 4.546875]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 5.0, 2.0, 7.0, 4.0, 14.0, 20.0, 18.0, 51.0, 43.0, 113.0, 167.0, 230.0, 414.0, 640.0, 1100.0, 2101.0, 4230.0, 8568.0, 19273.0, 48524.0, 138271.0, 396370.0, 277465.0, 90024.0, 33241.0, 13921.0, 6468.0, 3180.0, 1675.0, 935.0, 535.0, 327.0, 222.0, 143.0, 87.0, 72.0, 30.0, 27.0, 9.0, 12.0, 6.0, 3.0, 5.0, 3.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.1356201171875, -0.13172340393066406, -0.12782669067382812, -0.12392997741699219, -0.12003326416015625, -0.11613655090332031, -0.11223983764648438, -0.10834312438964844, -0.1044464111328125, -0.10054969787597656, -0.09665298461914062, -0.09275627136230469, -0.08885955810546875, -0.08496284484863281, -0.08106613159179688, -0.07716941833496094, -0.073272705078125, -0.06937599182128906, -0.06547927856445312, -0.06158256530761719, -0.05768585205078125, -0.05378913879394531, -0.049892425537109375, -0.04599571228027344, -0.0420989990234375, -0.03820228576660156, -0.034305572509765625, -0.030408859252929688, -0.02651214599609375, -0.022615432739257812, -0.018718719482421875, -0.014822006225585938, -0.01092529296875, -0.0070285797119140625, -0.003131866455078125, 0.0007648468017578125, 0.00466156005859375, 0.008558273315429688, 0.012454986572265625, 0.016351699829101562, 0.0202484130859375, 0.024145126342773438, 0.028041839599609375, 0.03193855285644531, 0.03583526611328125, 0.03973197937011719, 0.043628692626953125, 0.04752540588378906, 0.051422119140625, 0.05531883239746094, 0.059215545654296875, 0.06311225891113281, 0.06700897216796875, 0.07090568542480469, 0.07480239868164062, 0.07869911193847656, 0.0825958251953125, 0.08649253845214844, 0.09038925170898438, 0.09428596496582031, 0.09818267822265625, 0.10207939147949219, 0.10597610473632812, 0.10987281799316406, 0.11376953125]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 7.0, 6.0, 7.0, 12.0, 13.0, 23.0, 21.0, 35.0, 42.0, 43.0, 55.0, 67.0, 81.0, 70.0, 67.0, 82.0, 70.0, 70.0, 55.0, 48.0, 29.0, 19.0, 18.0, 13.0, 23.0, 14.0, 4.0, 3.0, 6.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3709068298339844e-05, -1.3146549463272095e-05, -1.2584030628204346e-05, -1.2021511793136597e-05, -1.1458992958068848e-05, -1.0896474123001099e-05, -1.033395528793335e-05, -9.7714364528656e-06, -9.208917617797852e-06, -8.646398782730103e-06, -8.083879947662354e-06, -7.5213611125946045e-06, -6.9588422775268555e-06, -6.3963234424591064e-06, -5.833804607391357e-06, -5.271285772323608e-06, -4.708766937255859e-06, -4.14624810218811e-06, -3.5837292671203613e-06, -3.0212104320526123e-06, -2.4586915969848633e-06, -1.8961727619171143e-06, -1.3336539268493652e-06, -7.711350917816162e-07, -2.086162567138672e-07, 3.5390257835388184e-07, 9.164214134216309e-07, 1.4789402484893799e-06, 2.041459083557129e-06, 2.603977918624878e-06, 3.166496753692627e-06, 3.729015588760376e-06, 4.291534423828125e-06, 4.854053258895874e-06, 5.416572093963623e-06, 5.979090929031372e-06, 6.541609764099121e-06, 7.10412859916687e-06, 7.666647434234619e-06, 8.229166269302368e-06, 8.791685104370117e-06, 9.354203939437866e-06, 9.916722774505615e-06, 1.0479241609573364e-05, 1.1041760444641113e-05, 1.1604279279708862e-05, 1.2166798114776611e-05, 1.272931694984436e-05, 1.329183578491211e-05, 1.3854354619979858e-05, 1.4416873455047607e-05, 1.4979392290115356e-05, 1.5541911125183105e-05, 1.6104429960250854e-05, 1.6666948795318604e-05, 1.7229467630386353e-05, 1.77919864654541e-05, 1.835450530052185e-05, 1.89170241355896e-05, 1.947954297065735e-05, 2.0042061805725098e-05, 2.0604580640792847e-05, 2.1167099475860596e-05, 2.1729618310928345e-05, 2.2292137145996094e-05]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 5.0, 8.0, 13.0, 16.0, 16.0, 35.0, 47.0, 88.0, 144.0, 210.0, 329.0, 584.0, 889.0, 1468.0, 2462.0, 4392.0, 7673.0, 14571.0, 29690.0, 66629.0, 179462.0, 402800.0, 198374.0, 72282.0, 31390.0, 15564.0, 8281.0, 4480.0, 2717.0, 1552.0, 875.0, 547.0, 344.0, 216.0, 127.0, 100.0, 53.0, 38.0, 30.0, 22.0, 15.0, 9.0, 8.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1275634765625, -0.12309455871582031, -0.11862564086914062, -0.11415672302246094, -0.10968780517578125, -0.10521888732910156, -0.10074996948242188, -0.09628105163574219, -0.0918121337890625, -0.08734321594238281, -0.08287429809570312, -0.07840538024902344, -0.07393646240234375, -0.06946754455566406, -0.06499862670898438, -0.06052970886230469, -0.056060791015625, -0.05159187316894531, -0.047122955322265625, -0.04265403747558594, -0.03818511962890625, -0.03371620178222656, -0.029247283935546875, -0.024778366088867188, -0.0203094482421875, -0.015840530395507812, -0.011371612548828125, -0.0069026947021484375, -0.00243377685546875, 0.0020351409912109375, 0.006504058837890625, 0.010972976684570312, 0.01544189453125, 0.019910812377929688, 0.024379730224609375, 0.028848648071289062, 0.03331756591796875, 0.03778648376464844, 0.042255401611328125, 0.04672431945800781, 0.0511932373046875, 0.05566215515136719, 0.060131072998046875, 0.06459999084472656, 0.06906890869140625, 0.07353782653808594, 0.07800674438476562, 0.08247566223144531, 0.086944580078125, 0.09141349792480469, 0.09588241577148438, 0.10035133361816406, 0.10482025146484375, 0.10928916931152344, 0.11375808715820312, 0.11822700500488281, 0.1226959228515625, 0.1271648406982422, 0.13163375854492188, 0.13610267639160156, 0.14057159423828125, 0.14504051208496094, 0.14950942993164062, 0.1539783477783203, 0.158447265625]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 3.0, 3.0, 6.0, 6.0, 10.0, 14.0, 21.0, 21.0, 31.0, 34.0, 27.0, 69.0, 60.0, 68.0, 93.0, 99.0, 70.0, 81.0, 65.0, 57.0, 38.0, 26.0, 19.0, 14.0, 14.0, 11.0, 14.0, 3.0, 8.0, 6.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.047210693359375, -0.045705318450927734, -0.04419994354248047, -0.0426945686340332, -0.04118919372558594, -0.03968381881713867, -0.038178443908691406, -0.03667306900024414, -0.035167694091796875, -0.03366231918334961, -0.032156944274902344, -0.030651569366455078, -0.029146194458007812, -0.027640819549560547, -0.02613544464111328, -0.024630069732666016, -0.02312469482421875, -0.021619319915771484, -0.02011394500732422, -0.018608570098876953, -0.017103195190429688, -0.015597820281982422, -0.014092445373535156, -0.01258707046508789, -0.011081695556640625, -0.00957632064819336, -0.008070945739746094, -0.006565570831298828, -0.0050601959228515625, -0.003554821014404297, -0.0020494461059570312, -0.0005440711975097656, 0.0009613037109375, 0.0024666786193847656, 0.003972053527832031, 0.005477428436279297, 0.0069828033447265625, 0.008488178253173828, 0.009993553161621094, 0.01149892807006836, 0.013004302978515625, 0.01450967788696289, 0.016015052795410156, 0.017520427703857422, 0.019025802612304688, 0.020531177520751953, 0.02203655242919922, 0.023541927337646484, 0.02504730224609375, 0.026552677154541016, 0.02805805206298828, 0.029563426971435547, 0.031068801879882812, 0.03257417678833008, 0.034079551696777344, 0.03558492660522461, 0.037090301513671875, 0.03859567642211914, 0.040101051330566406, 0.04160642623901367, 0.04311180114746094, 0.0446171760559082, 0.04612255096435547, 0.047627925872802734, 0.04913330078125]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 3.0, 12.0, 8.0, 8.0, 18.0, 16.0, 23.0, 46.0, 52.0, 61.0, 94.0, 93.0, 109.0, 104.0, 89.0, 67.0, 48.0, 38.0, 26.0, 24.0, 24.0, 11.0, 7.0, 8.0, 5.0, 4.0, 2.0, 1.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.492403030395508, -6.163326263427734, -5.834249496459961, -5.5051727294921875, -5.176096439361572, -4.847019672393799, -4.517942905426025, -4.18886661529541, -3.8597896099090576, -3.530712842941284, -3.20163631439209, -2.8725595474243164, -2.543482780456543, -2.2144062519073486, -1.8853294849395752, -1.5562529563903809, -1.2271761894226074, -0.8980995416641235, -0.5690228343009949, -0.2399461269378662, 0.08913052082061768, 0.41820716857910156, 0.747283935546875, 1.0763604640960693, 1.4054372310638428, 1.7345138788223267, 2.0635905265808105, 2.392667293548584, 2.7217440605163574, 3.0508205890655518, 3.379897356033325, 3.7089738845825195, 4.038050651550293, 4.367127418518066, 4.69620418548584, 5.025280952453613, 5.3543572425842285, 5.683434009552002, 6.012510776519775, 6.341587066650391, 6.670663833618164, 6.9997406005859375, 7.328817367553711, 7.657894134521484, 7.9869704246521, 8.316047668457031, 8.645124435424805, 8.974200248718262, 9.303277969360352, 9.632354736328125, 9.961431503295898, 10.290508270263672, 10.619585037231445, 10.948661804199219, 11.277738571166992, 11.60681438446045, 11.935891151428223, 12.264967918395996, 12.59404468536377, 12.923121452331543, 13.252198219299316, 13.581274032592773, 13.910350799560547, 14.23942756652832, 14.568504333496094]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 8.0, 2.0, 3.0, 10.0, 9.0, 16.0, 9.0, 15.0, 23.0, 29.0, 25.0, 43.0, 37.0, 37.0, 47.0, 60.0, 49.0, 34.0, 49.0, 49.0, 58.0, 48.0, 63.0, 37.0, 49.0, 31.0, 29.0, 18.0, 35.0, 22.0, 8.0, 12.0, 13.0, 12.0, 9.0, 3.0, 3.0, 4.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.4210844039917, -8.179022789001465, -7.9369611740112305, -7.694900035858154, -7.45283842086792, -7.2107768058776855, -6.968715667724609, -6.726654052734375, -6.484592437744141, -6.242530822753906, -6.000469207763672, -5.758408069610596, -5.516346454620361, -5.274284839630127, -5.032223701477051, -4.790162086486816, -4.548100471496582, -4.306038856506348, -4.063977241516113, -3.821916103363037, -3.5798544883728027, -3.3377928733825684, -3.095731496810913, -2.853670120239258, -2.6116085052490234, -2.369546890258789, -2.127485513687134, -1.885424017906189, -1.6433625221252441, -1.4013010263442993, -1.1592395305633545, -0.9171780347824097, -0.675117015838623, -0.4330555200576782, -0.1909940242767334, 0.051067471504211426, 0.29312896728515625, 0.5351904630661011, 0.7772519588470459, 1.0193134546279907, 1.2613749504089355, 1.5034364461898804, 1.7454979419708252, 1.98755943775177, 2.229620933532715, 2.471682548522949, 2.7137439250946045, 2.9558053016662598, 3.197866916656494, 3.4399285316467285, 3.681989908218384, 3.924051284790039, 4.166112899780273, 4.408174514770508, 4.650236129760742, 4.892297267913818, 5.134358882904053, 5.376420497894287, 5.618481636047363, 5.860543251037598, 6.102604866027832, 6.344666481018066, 6.586728096008301, 6.828789234161377, 7.070850849151611]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 8.0, 9.0, 20.0, 37.0, 47.0, 85.0, 134.0, 248.0, 444.0, 764.0, 1331.0, 2463.0, 4720.0, 8837.0, 16969.0, 32391.0, 60824.0, 107769.0, 166007.0, 200646.0, 176920.0, 120312.0, 69446.0, 37031.0, 19192.0, 10032.0, 5427.0, 2828.0, 1524.0, 909.0, 520.0, 263.0, 173.0, 88.0, 43.0, 38.0, 21.0, 13.0, 10.0, 9.0, 4.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.37109375, -6.1815185546875, -5.991943359375, -5.8023681640625, -5.61279296875, -5.4232177734375, -5.233642578125, -5.0440673828125, -4.8544921875, -4.6649169921875, -4.475341796875, -4.2857666015625, -4.09619140625, -3.9066162109375, -3.717041015625, -3.5274658203125, -3.337890625, -3.1483154296875, -2.958740234375, -2.7691650390625, -2.57958984375, -2.3900146484375, -2.200439453125, -2.0108642578125, -1.8212890625, -1.6317138671875, -1.442138671875, -1.2525634765625, -1.06298828125, -0.8734130859375, -0.683837890625, -0.4942626953125, -0.3046875, -0.1151123046875, 0.074462890625, 0.2640380859375, 0.45361328125, 0.6431884765625, 0.832763671875, 1.0223388671875, 1.2119140625, 1.4014892578125, 1.591064453125, 1.7806396484375, 1.97021484375, 2.1597900390625, 2.349365234375, 2.5389404296875, 2.728515625, 2.9180908203125, 3.107666015625, 3.2972412109375, 3.48681640625, 3.6763916015625, 3.865966796875, 4.0555419921875, 4.2451171875, 4.4346923828125, 4.624267578125, 4.8138427734375, 5.00341796875, 5.1929931640625, 5.382568359375, 5.5721435546875, 5.76171875]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 9.0, 3.0, 6.0, 18.0, 9.0, 15.0, 19.0, 17.0, 37.0, 36.0, 37.0, 38.0, 49.0, 60.0, 41.0, 52.0, 47.0, 54.0, 59.0, 52.0, 53.0, 54.0, 37.0, 39.0, 25.0, 26.0, 27.0, 19.0, 13.0, 10.0, 15.0, 7.0, 7.0, 3.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.28125, -8.02880859375, -7.7763671875, -7.52392578125, -7.271484375, -7.01904296875, -6.7666015625, -6.51416015625, -6.26171875, -6.00927734375, -5.7568359375, -5.50439453125, -5.251953125, -4.99951171875, -4.7470703125, -4.49462890625, -4.2421875, -3.98974609375, -3.7373046875, -3.48486328125, -3.232421875, -2.97998046875, -2.7275390625, -2.47509765625, -2.22265625, -1.97021484375, -1.7177734375, -1.46533203125, -1.212890625, -0.96044921875, -0.7080078125, -0.45556640625, -0.203125, 0.04931640625, 0.3017578125, 0.55419921875, 0.806640625, 1.05908203125, 1.3115234375, 1.56396484375, 1.81640625, 2.06884765625, 2.3212890625, 2.57373046875, 2.826171875, 3.07861328125, 3.3310546875, 3.58349609375, 3.8359375, 4.08837890625, 4.3408203125, 4.59326171875, 4.845703125, 5.09814453125, 5.3505859375, 5.60302734375, 5.85546875, 6.10791015625, 6.3603515625, 6.61279296875, 6.865234375, 7.11767578125, 7.3701171875, 7.62255859375, 7.875]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 7.0, 7.0, 12.0, 8.0, 15.0, 19.0, 32.0, 49.0, 75.0, 120.0, 179.0, 245.0, 398.0, 666.0, 1038.0, 1552.0, 2494.0, 3903.0, 6513.0, 10464.0, 16862.0, 27406.0, 42908.0, 66044.0, 95861.0, 127271.0, 145852.0, 141462.0, 117045.0, 84492.0, 57284.0, 37009.0, 23109.0, 14393.0, 9010.0, 5423.0, 3386.0, 2140.0, 1373.0, 848.0, 551.0, 334.0, 233.0, 143.0, 117.0, 70.0, 43.0, 32.0, 13.0, 21.0, 11.0, 9.0, 5.0, 3.0, 0.0, 2.0, 2.0, 4.0], "bins": [-4.6484375, -4.5068359375, -4.365234375, -4.2236328125, -4.08203125, -3.9404296875, -3.798828125, -3.6572265625, -3.515625, -3.3740234375, -3.232421875, -3.0908203125, -2.94921875, -2.8076171875, -2.666015625, -2.5244140625, -2.3828125, -2.2412109375, -2.099609375, -1.9580078125, -1.81640625, -1.6748046875, -1.533203125, -1.3916015625, -1.25, -1.1083984375, -0.966796875, -0.8251953125, -0.68359375, -0.5419921875, -0.400390625, -0.2587890625, -0.1171875, 0.0244140625, 0.166015625, 0.3076171875, 0.44921875, 0.5908203125, 0.732421875, 0.8740234375, 1.015625, 1.1572265625, 1.298828125, 1.4404296875, 1.58203125, 1.7236328125, 1.865234375, 2.0068359375, 2.1484375, 2.2900390625, 2.431640625, 2.5732421875, 2.71484375, 2.8564453125, 2.998046875, 3.1396484375, 3.28125, 3.4228515625, 3.564453125, 3.7060546875, 3.84765625, 3.9892578125, 4.130859375, 4.2724609375, 4.4140625]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 8.0, 3.0, 7.0, 9.0, 9.0, 11.0, 12.0, 17.0, 20.0, 23.0, 29.0, 38.0, 27.0, 36.0, 34.0, 38.0, 47.0, 44.0, 50.0, 47.0, 44.0, 32.0, 40.0, 44.0, 35.0, 45.0, 28.0, 36.0, 29.0, 34.0, 21.0, 14.0, 19.0, 12.0, 10.0, 13.0, 10.0, 8.0, 6.0, 5.0, 6.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.73828125, -3.61199951171875, -3.4857177734375, -3.35943603515625, -3.233154296875, -3.10687255859375, -2.9805908203125, -2.85430908203125, -2.72802734375, -2.60174560546875, -2.4754638671875, -2.34918212890625, -2.222900390625, -2.09661865234375, -1.9703369140625, -1.84405517578125, -1.7177734375, -1.59149169921875, -1.4652099609375, -1.33892822265625, -1.212646484375, -1.08636474609375, -0.9600830078125, -0.83380126953125, -0.70751953125, -0.58123779296875, -0.4549560546875, -0.32867431640625, -0.202392578125, -0.07611083984375, 0.0501708984375, 0.17645263671875, 0.302734375, 0.42901611328125, 0.5552978515625, 0.68157958984375, 0.807861328125, 0.93414306640625, 1.0604248046875, 1.18670654296875, 1.31298828125, 1.43927001953125, 1.5655517578125, 1.69183349609375, 1.818115234375, 1.94439697265625, 2.0706787109375, 2.19696044921875, 2.3232421875, 2.44952392578125, 2.5758056640625, 2.70208740234375, 2.828369140625, 2.95465087890625, 3.0809326171875, 3.20721435546875, 3.33349609375, 3.45977783203125, 3.5860595703125, 3.71234130859375, 3.838623046875, 3.96490478515625, 4.0911865234375, 4.21746826171875, 4.34375]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 8.0, 4.0, 4.0, 17.0, 10.0, 23.0, 37.0, 60.0, 68.0, 119.0, 188.0, 254.0, 410.0, 561.0, 917.0, 1393.0, 2248.0, 3600.0, 5840.0, 10051.0, 17047.0, 29721.0, 54191.0, 98191.0, 162457.0, 210489.0, 183128.0, 116077.0, 65318.0, 35876.0, 20470.0, 11665.0, 6814.0, 3987.0, 2648.0, 1689.0, 961.0, 702.0, 434.0, 311.0, 179.0, 122.0, 92.0, 65.0, 37.0, 23.0, 29.0, 11.0, 8.0, 3.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.322265625, -2.2489013671875, -2.175537109375, -2.1021728515625, -2.02880859375, -1.9554443359375, -1.882080078125, -1.8087158203125, -1.7353515625, -1.6619873046875, -1.588623046875, -1.5152587890625, -1.44189453125, -1.3685302734375, -1.295166015625, -1.2218017578125, -1.1484375, -1.0750732421875, -1.001708984375, -0.9283447265625, -0.85498046875, -0.7816162109375, -0.708251953125, -0.6348876953125, -0.5615234375, -0.4881591796875, -0.414794921875, -0.3414306640625, -0.26806640625, -0.1947021484375, -0.121337890625, -0.0479736328125, 0.025390625, 0.0987548828125, 0.172119140625, 0.2454833984375, 0.31884765625, 0.3922119140625, 0.465576171875, 0.5389404296875, 0.6123046875, 0.6856689453125, 0.759033203125, 0.8323974609375, 0.90576171875, 0.9791259765625, 1.052490234375, 1.1258544921875, 1.19921875, 1.2725830078125, 1.345947265625, 1.4193115234375, 1.49267578125, 1.5660400390625, 1.639404296875, 1.7127685546875, 1.7861328125, 1.8594970703125, 1.932861328125, 2.0062255859375, 2.07958984375, 2.1529541015625, 2.226318359375, 2.2996826171875, 2.373046875]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 1.0, 5.0, 1.0, 7.0, 7.0, 15.0, 15.0, 13.0, 23.0, 31.0, 29.0, 44.0, 50.0, 48.0, 83.0, 72.0, 85.0, 74.0, 77.0, 69.0, 59.0, 42.0, 37.0, 43.0, 25.0, 11.0, 14.0, 9.0, 8.0, 2.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001823902130126953, -0.00017573311924934387, -0.00016907602548599243, -0.000162418931722641, -0.00015576183795928955, -0.0001491047441959381, -0.00014244765043258667, -0.00013579055666923523, -0.0001291334629058838, -0.00012247636914253235, -0.00011581927537918091, -0.00010916218161582947, -0.00010250508785247803, -9.584799408912659e-05, -8.919090032577515e-05, -8.25338065624237e-05, -7.587671279907227e-05, -6.921961903572083e-05, -6.256252527236938e-05, -5.5905431509017944e-05, -4.9248337745666504e-05, -4.2591243982315063e-05, -3.593415021896362e-05, -2.9277056455612183e-05, -2.2619962692260742e-05, -1.5962868928909302e-05, -9.305775165557861e-06, -2.648681402206421e-06, 4.0084123611450195e-06, 1.066550612449646e-05, 1.73225998878479e-05, 2.397969365119934e-05, 3.063678741455078e-05, 3.729388117790222e-05, 4.395097494125366e-05, 5.06080687046051e-05, 5.726516246795654e-05, 6.392225623130798e-05, 7.057934999465942e-05, 7.723644375801086e-05, 8.38935375213623e-05, 9.055063128471375e-05, 9.720772504806519e-05, 0.00010386481881141663, 0.00011052191257476807, 0.00011717900633811951, 0.00012383610010147095, 0.0001304931938648224, 0.00013715028762817383, 0.00014380738139152527, 0.0001504644751548767, 0.00015712156891822815, 0.0001637786626815796, 0.00017043575644493103, 0.00017709285020828247, 0.0001837499439716339, 0.00019040703773498535, 0.0001970641314983368, 0.00020372122526168823, 0.00021037831902503967, 0.0002170354127883911, 0.00022369250655174255, 0.000230349600315094, 0.00023700669407844543, 0.00024366378784179688]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 3.0, 6.0, 8.0, 17.0, 24.0, 27.0, 29.0, 45.0, 73.0, 107.0, 140.0, 252.0, 332.0, 539.0, 771.0, 1132.0, 1765.0, 2626.0, 4284.0, 6627.0, 10529.0, 16803.0, 27552.0, 44174.0, 70207.0, 108305.0, 148798.0, 167343.0, 146759.0, 105115.0, 68930.0, 43082.0, 26880.0, 16438.0, 10269.0, 6541.0, 4200.0, 2684.0, 1732.0, 1138.0, 782.0, 481.0, 326.0, 215.0, 151.0, 99.0, 65.0, 55.0, 23.0, 34.0, 14.0, 9.0, 5.0, 7.0, 5.0, 2.0, 4.0, 3.0, 3.0, 0.0, 1.0], "bins": [-1.775390625, -1.717132568359375, -1.65887451171875, -1.600616455078125, -1.5423583984375, -1.484100341796875, -1.42584228515625, -1.367584228515625, -1.309326171875, -1.251068115234375, -1.19281005859375, -1.134552001953125, -1.0762939453125, -1.018035888671875, -0.95977783203125, -0.901519775390625, -0.84326171875, -0.785003662109375, -0.72674560546875, -0.668487548828125, -0.6102294921875, -0.551971435546875, -0.49371337890625, -0.435455322265625, -0.377197265625, -0.318939208984375, -0.26068115234375, -0.202423095703125, -0.1441650390625, -0.085906982421875, -0.02764892578125, 0.030609130859375, 0.0888671875, 0.147125244140625, 0.20538330078125, 0.263641357421875, 0.3218994140625, 0.380157470703125, 0.43841552734375, 0.496673583984375, 0.554931640625, 0.613189697265625, 0.67144775390625, 0.729705810546875, 0.7879638671875, 0.846221923828125, 0.90447998046875, 0.962738037109375, 1.02099609375, 1.079254150390625, 1.13751220703125, 1.195770263671875, 1.2540283203125, 1.312286376953125, 1.37054443359375, 1.428802490234375, 1.487060546875, 1.545318603515625, 1.60357666015625, 1.661834716796875, 1.7200927734375, 1.778350830078125, 1.83660888671875, 1.894866943359375, 1.953125]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 5.0, 3.0, 0.0, 5.0, 6.0, 4.0, 1.0, 7.0, 8.0, 10.0, 14.0, 13.0, 22.0, 13.0, 24.0, 28.0, 29.0, 38.0, 43.0, 39.0, 53.0, 64.0, 51.0, 66.0, 53.0, 52.0, 47.0, 43.0, 33.0, 37.0, 33.0, 25.0, 26.0, 20.0, 14.0, 19.0, 14.0, 8.0, 5.0, 4.0, 4.0, 8.0, 1.0, 3.0, 6.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.79150390625, -0.7654342651367188, -0.7393646240234375, -0.7132949829101562, -0.687225341796875, -0.6611557006835938, -0.6350860595703125, -0.6090164184570312, -0.58294677734375, -0.5568771362304688, -0.5308074951171875, -0.5047378540039062, -0.478668212890625, -0.45259857177734375, -0.4265289306640625, -0.40045928955078125, -0.3743896484375, -0.34832000732421875, -0.3222503662109375, -0.29618072509765625, -0.270111083984375, -0.24404144287109375, -0.2179718017578125, -0.19190216064453125, -0.16583251953125, -0.13976287841796875, -0.1136932373046875, -0.08762359619140625, -0.061553955078125, -0.03548431396484375, -0.0094146728515625, 0.01665496826171875, 0.042724609375, 0.06879425048828125, 0.0948638916015625, 0.12093353271484375, 0.147003173828125, 0.17307281494140625, 0.1991424560546875, 0.22521209716796875, 0.25128173828125, 0.27735137939453125, 0.3034210205078125, 0.32949066162109375, 0.355560302734375, 0.38162994384765625, 0.4076995849609375, 0.43376922607421875, 0.4598388671875, 0.48590850830078125, 0.5119781494140625, 0.5380477905273438, 0.564117431640625, 0.5901870727539062, 0.6162567138671875, 0.6423263549804688, 0.66839599609375, 0.6944656372070312, 0.7205352783203125, 0.7466049194335938, 0.772674560546875, 0.7987442016601562, 0.8248138427734375, 0.8508834838867188, 0.876953125]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 5.0, 2.0, 5.0, 5.0, 4.0, 2.0, 4.0, 10.0, 10.0, 25.0, 21.0, 33.0, 40.0, 50.0, 71.0, 78.0, 91.0, 86.0, 89.0, 87.0, 67.0, 53.0, 37.0, 37.0, 19.0, 18.0, 20.0, 6.0, 9.0, 7.0, 7.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.262760162353516, -5.972482204437256, -5.682204246520996, -5.391926288604736, -5.101648330688477, -4.811370849609375, -4.521092891693115, -4.2308149337768555, -3.9405369758605957, -3.650259017944336, -3.359981060028076, -3.0697033405303955, -2.7794253826141357, -2.489147424697876, -2.1988697052001953, -1.9085917472839355, -1.6183137893676758, -1.328035831451416, -1.0377579927444458, -0.7474800944328308, -0.4572021961212158, -0.16692423820495605, 0.12335360050201416, 0.4136314392089844, 0.7039093971252441, 0.9941872954368591, 1.2844651937484741, 1.5747430324554443, 1.865020990371704, 2.155298948287964, 2.4455766677856445, 2.7358546257019043, 3.026132583618164, 3.316410541534424, 3.6066884994506836, 3.8969662189483643, 4.187244415283203, 4.477521896362305, 4.7677998542785645, 5.058077812194824, 5.348355770111084, 5.638633728027344, 5.9289116859436035, 6.219189643859863, 6.509467124938965, 6.799745559692383, 7.090023040771484, 7.380300998687744, 7.670578956604004, 7.960856914520264, 8.251134872436523, 8.541412353515625, 8.831690788269043, 9.121968269348145, 9.412246704101562, 9.702524185180664, 9.992801666259766, 10.283079147338867, 10.573357582092285, 10.863635063171387, 11.153913497924805, 11.444190979003906, 11.734469413757324, 12.024746894836426, 12.315025329589844]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 8.0, 8.0, 8.0, 10.0, 7.0, 11.0, 12.0, 22.0, 19.0, 26.0, 34.0, 40.0, 46.0, 54.0, 57.0, 47.0, 60.0, 45.0, 49.0, 61.0, 49.0, 46.0, 41.0, 45.0, 33.0, 33.0, 31.0, 19.0, 16.0, 12.0, 18.0, 13.0, 9.0, 8.0, 6.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.420211791992188, -8.162103652954102, -7.903994560241699, -7.645886421203613, -7.387777805328369, -7.129669189453125, -6.871561050415039, -6.613452434539795, -6.355343818664551, -6.097235202789307, -5.8391265869140625, -5.581018447875977, -5.322909832000732, -5.064801216125488, -4.806693077087402, -4.548584461212158, -4.290475845336914, -4.03236722946167, -3.774258852005005, -3.51615047454834, -3.2580418586730957, -2.9999332427978516, -2.7418248653411865, -2.4837164878845215, -2.2256078720092773, -1.9674993753433228, -1.7093908786773682, -1.4512823820114136, -1.193173885345459, -0.9350653886795044, -0.6769568920135498, -0.4188483953475952, -0.16073989868164062, 0.09736859798431396, 0.35547709465026855, 0.6135855913162231, 0.8716940879821777, 1.1298025846481323, 1.387911081314087, 1.6460195779800415, 1.904128074645996, 2.1622366905212402, 2.4203450679779053, 2.6784534454345703, 2.9365620613098145, 3.1946706771850586, 3.4527790546417236, 3.7108874320983887, 3.968996047973633, 4.227104663848877, 4.485213279724121, 4.743321418762207, 5.001430034637451, 5.259538650512695, 5.517646789550781, 5.775755405426025, 6.0338640213012695, 6.291972637176514, 6.550081253051758, 6.808189392089844, 7.066298007965088, 7.324406623840332, 7.582514762878418, 7.840623378753662, 8.098731994628906]}, "gradients/decoder.bert.encoder.layer.7.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 5.0, 6.0, 13.0, 21.0, 33.0, 39.0, 56.0, 80.0, 134.0, 187.0, 287.0, 481.0, 778.0, 1151.0, 1979.0, 3328.0, 5594.0, 9578.0, 17038.0, 31013.0, 58847.0, 116133.0, 236581.0, 477994.0, 843933.0, 984680.0, 683229.0, 357219.0, 175645.0, 87800.0, 44903.0, 23780.0, 13149.0, 7621.0, 4328.0, 2415.0, 1523.0, 1011.0, 615.0, 394.0, 263.0, 153.0, 97.0, 74.0, 43.0, 17.0, 16.0, 9.0, 5.0, 3.0, 1.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.87109375, -6.65155029296875, -6.4320068359375, -6.21246337890625, -5.992919921875, -5.77337646484375, -5.5538330078125, -5.33428955078125, -5.11474609375, -4.89520263671875, -4.6756591796875, -4.45611572265625, -4.236572265625, -4.01702880859375, -3.7974853515625, -3.57794189453125, -3.3583984375, -3.13885498046875, -2.9193115234375, -2.69976806640625, -2.480224609375, -2.26068115234375, -2.0411376953125, -1.82159423828125, -1.60205078125, -1.38250732421875, -1.1629638671875, -0.94342041015625, -0.723876953125, -0.50433349609375, -0.2847900390625, -0.06524658203125, 0.154296875, 0.37384033203125, 0.5933837890625, 0.81292724609375, 1.032470703125, 1.25201416015625, 1.4715576171875, 1.69110107421875, 1.91064453125, 2.13018798828125, 2.3497314453125, 2.56927490234375, 2.788818359375, 3.00836181640625, 3.2279052734375, 3.44744873046875, 3.6669921875, 3.88653564453125, 4.1060791015625, 4.32562255859375, 4.545166015625, 4.76470947265625, 4.9842529296875, 5.20379638671875, 5.42333984375, 5.64288330078125, 5.8624267578125, 6.08197021484375, 6.301513671875, 6.52105712890625, 6.7406005859375, 6.96014404296875, 7.1796875]}, "gradients/decoder.bert.encoder.layer.7.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 6.0, 5.0, 7.0, 7.0, 8.0, 12.0, 15.0, 15.0, 21.0, 28.0, 18.0, 34.0, 50.0, 52.0, 45.0, 46.0, 40.0, 53.0, 57.0, 57.0, 67.0, 40.0, 42.0, 45.0, 38.0, 36.0, 39.0, 26.0, 13.0, 20.0, 15.0, 14.0, 12.0, 9.0, 5.0, 5.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.015625, -5.836669921875, -5.65771484375, -5.478759765625, -5.2998046875, -5.120849609375, -4.94189453125, -4.762939453125, -4.583984375, -4.405029296875, -4.22607421875, -4.047119140625, -3.8681640625, -3.689208984375, -3.51025390625, -3.331298828125, -3.15234375, -2.973388671875, -2.79443359375, -2.615478515625, -2.4365234375, -2.257568359375, -2.07861328125, -1.899658203125, -1.720703125, -1.541748046875, -1.36279296875, -1.183837890625, -1.0048828125, -0.825927734375, -0.64697265625, -0.468017578125, -0.2890625, -0.110107421875, 0.06884765625, 0.247802734375, 0.4267578125, 0.605712890625, 0.78466796875, 0.963623046875, 1.142578125, 1.321533203125, 1.50048828125, 1.679443359375, 1.8583984375, 2.037353515625, 2.21630859375, 2.395263671875, 2.57421875, 2.753173828125, 2.93212890625, 3.111083984375, 3.2900390625, 3.468994140625, 3.64794921875, 3.826904296875, 4.005859375, 4.184814453125, 4.36376953125, 4.542724609375, 4.7216796875, 4.900634765625, 5.07958984375, 5.258544921875, 5.4375]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 5.0, 8.0, 3.0, 4.0, 19.0, 18.0, 22.0, 57.0, 51.0, 90.0, 139.0, 210.0, 307.0, 481.0, 753.0, 1258.0, 2024.0, 3233.0, 5376.0, 8964.0, 15465.0, 26350.0, 46824.0, 83925.0, 151110.0, 266426.0, 445891.0, 651230.0, 755358.0, 656425.0, 450504.0, 270082.0, 152715.0, 85138.0, 47508.0, 27208.0, 15854.0, 9021.0, 5473.0, 3302.0, 2058.0, 1281.0, 749.0, 489.0, 330.0, 202.0, 114.0, 84.0, 60.0, 41.0, 19.0, 11.0, 6.0, 12.0, 2.0, 4.0, 3.0, 1.0, 0.0, 2.0], "bins": [-5.94921875, -5.7662353515625, -5.583251953125, -5.4002685546875, -5.21728515625, -5.0343017578125, -4.851318359375, -4.6683349609375, -4.4853515625, -4.3023681640625, -4.119384765625, -3.9364013671875, -3.75341796875, -3.5704345703125, -3.387451171875, -3.2044677734375, -3.021484375, -2.8385009765625, -2.655517578125, -2.4725341796875, -2.28955078125, -2.1065673828125, -1.923583984375, -1.7406005859375, -1.5576171875, -1.3746337890625, -1.191650390625, -1.0086669921875, -0.82568359375, -0.6427001953125, -0.459716796875, -0.2767333984375, -0.09375, 0.0892333984375, 0.272216796875, 0.4552001953125, 0.63818359375, 0.8211669921875, 1.004150390625, 1.1871337890625, 1.3701171875, 1.5531005859375, 1.736083984375, 1.9190673828125, 2.10205078125, 2.2850341796875, 2.468017578125, 2.6510009765625, 2.833984375, 3.0169677734375, 3.199951171875, 3.3829345703125, 3.56591796875, 3.7489013671875, 3.931884765625, 4.1148681640625, 4.2978515625, 4.4808349609375, 4.663818359375, 4.8468017578125, 5.02978515625, 5.2127685546875, 5.395751953125, 5.5787353515625, 5.76171875]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 6.0, 11.0, 8.0, 11.0, 13.0, 27.0, 40.0, 39.0, 58.0, 83.0, 90.0, 92.0, 138.0, 156.0, 201.0, 211.0, 211.0, 240.0, 267.0, 301.0, 261.0, 212.0, 221.0, 191.0, 176.0, 151.0, 105.0, 108.0, 96.0, 63.0, 53.0, 62.0, 40.0, 24.0, 27.0, 18.0, 18.0, 16.0, 8.0, 9.0, 3.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-2.228515625, -2.14837646484375, -2.0682373046875, -1.98809814453125, -1.907958984375, -1.82781982421875, -1.7476806640625, -1.66754150390625, -1.58740234375, -1.50726318359375, -1.4271240234375, -1.34698486328125, -1.266845703125, -1.18670654296875, -1.1065673828125, -1.02642822265625, -0.9462890625, -0.86614990234375, -0.7860107421875, -0.70587158203125, -0.625732421875, -0.54559326171875, -0.4654541015625, -0.38531494140625, -0.30517578125, -0.22503662109375, -0.1448974609375, -0.06475830078125, 0.015380859375, 0.09552001953125, 0.1756591796875, 0.25579833984375, 0.3359375, 0.41607666015625, 0.4962158203125, 0.57635498046875, 0.656494140625, 0.73663330078125, 0.8167724609375, 0.89691162109375, 0.97705078125, 1.05718994140625, 1.1373291015625, 1.21746826171875, 1.297607421875, 1.37774658203125, 1.4578857421875, 1.53802490234375, 1.6181640625, 1.69830322265625, 1.7784423828125, 1.85858154296875, 1.938720703125, 2.01885986328125, 2.0989990234375, 2.17913818359375, 2.25927734375, 2.33941650390625, 2.4195556640625, 2.49969482421875, 2.579833984375, 2.65997314453125, 2.7401123046875, 2.82025146484375, 2.900390625]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 5.0, 12.0, 14.0, 10.0, 13.0, 8.0, 17.0, 33.0, 23.0, 40.0, 42.0, 50.0, 49.0, 59.0, 54.0, 72.0, 73.0, 74.0, 62.0, 50.0, 49.0, 39.0, 33.0, 22.0, 21.0, 15.0, 9.0, 9.0, 14.0, 7.0, 5.0, 8.0, 2.0, 2.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.156864166259766, -5.918482303619385, -5.680099964141846, -5.441718101501465, -5.203336238861084, -4.964953899383545, -4.726572036743164, -4.488189697265625, -4.249807834625244, -4.011425971984863, -3.7730438709259033, -3.5346617698669434, -3.2962796688079834, -3.0578975677490234, -2.8195157051086426, -2.5811336040496826, -2.3427517414093018, -2.104369640350342, -1.8659876585006714, -1.627605676651001, -1.389223575592041, -1.1508415937423706, -0.9124596118927002, -0.6740775108337402, -0.4356955289840698, -0.19731350243091583, 0.04106852412223816, 0.27945053577423096, 0.5178325772285461, 0.7562146186828613, 0.9945966005325317, 1.2329787015914917, 1.471360683441162, 1.7097426652908325, 1.9481247663497925, 2.186506748199463, 2.424888849258423, 2.663270950317383, 2.9016528129577637, 3.1400349140167236, 3.3784170150756836, 3.6167991161346436, 3.8551809787750244, 4.093563079833984, 4.331944942474365, 4.570327281951904, 4.808709144592285, 5.047091484069824, 5.285472869873047, 5.523854732513428, 5.762237071990967, 6.000618934631348, 6.2390007972717285, 6.477383136749268, 6.715764999389648, 6.9541473388671875, 7.192529201507568, 7.430911064147949, 7.669293403625488, 7.907675266265869, 8.14605712890625, 8.384439468383789, 8.622821807861328, 8.86120319366455, 9.09958553314209]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 8.0, 8.0, 7.0, 8.0, 10.0, 11.0, 20.0, 21.0, 33.0, 39.0, 37.0, 48.0, 48.0, 54.0, 51.0, 57.0, 62.0, 56.0, 55.0, 61.0, 46.0, 45.0, 46.0, 27.0, 27.0, 27.0, 16.0, 15.0, 19.0, 10.0, 12.0, 9.0, 5.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.033995628356934, -8.76633358001709, -8.498672485351562, -8.231010437011719, -7.963348388671875, -7.6956868171691895, -7.428025245666504, -7.16036319732666, -6.892701625823975, -6.625040054321289, -6.357378005981445, -6.08971643447876, -5.822054862976074, -5.5543928146362305, -5.286731243133545, -5.019069671630859, -4.751407623291016, -4.48374605178833, -4.216084003448486, -3.948422431945801, -3.680760622024536, -3.4130988121032715, -3.145437240600586, -2.8777754306793213, -2.6101136207580566, -2.342451810836792, -2.0747900009155273, -1.8071284294128418, -1.5394666194915771, -1.2718048095703125, -1.0041431188583374, -0.7364814281463623, -0.46882057189941406, -0.2011588215827942, 0.06650292873382568, 0.33416467905044556, 0.6018264293670654, 0.8694882392883301, 1.1371499300003052, 1.4048116207122803, 1.672473430633545, 1.9401352405548096, 2.207797050476074, 2.4754586219787598, 2.7431204319000244, 3.010782241821289, 3.2784438133239746, 3.5461056232452393, 3.813767433166504, 4.0814290046691895, 4.349091053009033, 4.616752624511719, 4.8844146728515625, 5.152076244354248, 5.419737815856934, 5.687399864196777, 5.955061435699463, 6.222723007202148, 6.490385055541992, 6.758046627044678, 7.025708198547363, 7.293370246887207, 7.561031818389893, 7.828693389892578, 8.096355438232422]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 12.0, 11.0, 11.0, 12.0, 23.0, 34.0, 52.0, 60.0, 92.0, 136.0, 167.0, 267.0, 414.0, 612.0, 883.0, 1442.0, 2275.0, 3503.0, 5779.0, 9218.0, 15605.0, 25793.0, 43134.0, 71995.0, 117853.0, 179349.0, 199729.0, 143884.0, 89692.0, 54492.0, 32110.0, 19152.0, 11545.0, 7188.0, 4336.0, 2716.0, 1647.0, 1109.0, 701.0, 503.0, 315.0, 197.0, 151.0, 115.0, 80.0, 56.0, 28.0, 27.0, 22.0, 11.0, 6.0, 7.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.84814453125, -0.8200759887695312, -0.7920074462890625, -0.7639389038085938, -0.735870361328125, -0.7078018188476562, -0.6797332763671875, -0.6516647338867188, -0.62359619140625, -0.5955276489257812, -0.5674591064453125, -0.5393905639648438, -0.511322021484375, -0.48325347900390625, -0.4551849365234375, -0.42711639404296875, -0.3990478515625, -0.37097930908203125, -0.3429107666015625, -0.31484222412109375, -0.286773681640625, -0.25870513916015625, -0.2306365966796875, -0.20256805419921875, -0.17449951171875, -0.14643096923828125, -0.1183624267578125, -0.09029388427734375, -0.062225341796875, -0.03415679931640625, -0.0060882568359375, 0.02198028564453125, 0.050048828125, 0.07811737060546875, 0.1061859130859375, 0.13425445556640625, 0.162322998046875, 0.19039154052734375, 0.2184600830078125, 0.24652862548828125, 0.27459716796875, 0.30266571044921875, 0.3307342529296875, 0.35880279541015625, 0.386871337890625, 0.41493988037109375, 0.4430084228515625, 0.47107696533203125, 0.4991455078125, 0.5272140502929688, 0.5552825927734375, 0.5833511352539062, 0.611419677734375, 0.6394882202148438, 0.6675567626953125, 0.6956253051757812, 0.72369384765625, 0.7517623901367188, 0.7798309326171875, 0.8078994750976562, 0.835968017578125, 0.8640365600585938, 0.8921051025390625, 0.9201736450195312, 0.9482421875]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 2.0, 6.0, 7.0, 4.0, 14.0, 11.0, 22.0, 15.0, 25.0, 21.0, 33.0, 38.0, 50.0, 52.0, 55.0, 51.0, 62.0, 58.0, 53.0, 60.0, 56.0, 42.0, 41.0, 35.0, 36.0, 25.0, 30.0, 18.0, 22.0, 12.0, 10.0, 9.0, 8.0, 10.0, 6.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.046875, -8.777587890625, -8.50830078125, -8.239013671875, -7.9697265625, -7.700439453125, -7.43115234375, -7.161865234375, -6.892578125, -6.623291015625, -6.35400390625, -6.084716796875, -5.8154296875, -5.546142578125, -5.27685546875, -5.007568359375, -4.73828125, -4.468994140625, -4.19970703125, -3.930419921875, -3.6611328125, -3.391845703125, -3.12255859375, -2.853271484375, -2.583984375, -2.314697265625, -2.04541015625, -1.776123046875, -1.5068359375, -1.237548828125, -0.96826171875, -0.698974609375, -0.4296875, -0.160400390625, 0.10888671875, 0.378173828125, 0.6474609375, 0.916748046875, 1.18603515625, 1.455322265625, 1.724609375, 1.993896484375, 2.26318359375, 2.532470703125, 2.8017578125, 3.071044921875, 3.34033203125, 3.609619140625, 3.87890625, 4.148193359375, 4.41748046875, 4.686767578125, 4.9560546875, 5.225341796875, 5.49462890625, 5.763916015625, 6.033203125, 6.302490234375, 6.57177734375, 6.841064453125, 7.1103515625, 7.379638671875, 7.64892578125, 7.918212890625, 8.1875]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 0.0, 7.0, 6.0, 11.0, 16.0, 18.0, 17.0, 51.0, 70.0, 103.0, 160.0, 249.0, 336.0, 481.0, 742.0, 1071.0, 1602.0, 2564.0, 3845.0, 5817.0, 8965.0, 13614.0, 20672.0, 32083.0, 49302.0, 73888.0, 110125.0, 153394.0, 168481.0, 132539.0, 91620.0, 60822.0, 40365.0, 26260.0, 16980.0, 10848.0, 7274.0, 4655.0, 3117.0, 2068.0, 1451.0, 970.0, 617.0, 428.0, 312.0, 174.0, 112.0, 84.0, 71.0, 34.0, 25.0, 24.0, 8.0, 10.0, 6.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.79443359375, -0.769805908203125, -0.74517822265625, -0.720550537109375, -0.6959228515625, -0.671295166015625, -0.64666748046875, -0.622039794921875, -0.597412109375, -0.572784423828125, -0.54815673828125, -0.523529052734375, -0.4989013671875, -0.474273681640625, -0.44964599609375, -0.425018310546875, -0.400390625, -0.375762939453125, -0.35113525390625, -0.326507568359375, -0.3018798828125, -0.277252197265625, -0.25262451171875, -0.227996826171875, -0.203369140625, -0.178741455078125, -0.15411376953125, -0.129486083984375, -0.1048583984375, -0.080230712890625, -0.05560302734375, -0.030975341796875, -0.00634765625, 0.018280029296875, 0.04290771484375, 0.067535400390625, 0.0921630859375, 0.116790771484375, 0.14141845703125, 0.166046142578125, 0.190673828125, 0.215301513671875, 0.23992919921875, 0.264556884765625, 0.2891845703125, 0.313812255859375, 0.33843994140625, 0.363067626953125, 0.3876953125, 0.412322998046875, 0.43695068359375, 0.461578369140625, 0.4862060546875, 0.510833740234375, 0.53546142578125, 0.560089111328125, 0.584716796875, 0.609344482421875, 0.63397216796875, 0.658599853515625, 0.6832275390625, 0.707855224609375, 0.73248291015625, 0.757110595703125, 0.78173828125]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 5.0, 1.0, 3.0, 3.0, 5.0, 11.0, 6.0, 6.0, 13.0, 11.0, 20.0, 18.0, 24.0, 23.0, 42.0, 28.0, 26.0, 39.0, 41.0, 34.0, 39.0, 36.0, 48.0, 40.0, 42.0, 34.0, 41.0, 39.0, 32.0, 32.0, 30.0, 32.0, 18.0, 28.0, 22.0, 22.0, 14.0, 18.0, 10.0, 16.0, 10.0, 7.0, 11.0, 7.0, 4.0, 1.0, 7.0, 2.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.84375, -3.722747802734375, -3.60174560546875, -3.480743408203125, -3.3597412109375, -3.238739013671875, -3.11773681640625, -2.996734619140625, -2.875732421875, -2.754730224609375, -2.63372802734375, -2.512725830078125, -2.3917236328125, -2.270721435546875, -2.14971923828125, -2.028717041015625, -1.90771484375, -1.786712646484375, -1.66571044921875, -1.544708251953125, -1.4237060546875, -1.302703857421875, -1.18170166015625, -1.060699462890625, -0.939697265625, -0.818695068359375, -0.69769287109375, -0.576690673828125, -0.4556884765625, -0.334686279296875, -0.21368408203125, -0.092681884765625, 0.0283203125, 0.149322509765625, 0.27032470703125, 0.391326904296875, 0.5123291015625, 0.633331298828125, 0.75433349609375, 0.875335693359375, 0.996337890625, 1.117340087890625, 1.23834228515625, 1.359344482421875, 1.4803466796875, 1.601348876953125, 1.72235107421875, 1.843353271484375, 1.96435546875, 2.085357666015625, 2.20635986328125, 2.327362060546875, 2.4483642578125, 2.569366455078125, 2.69036865234375, 2.811370849609375, 2.932373046875, 3.053375244140625, 3.17437744140625, 3.295379638671875, 3.4163818359375, 3.537384033203125, 3.65838623046875, 3.779388427734375, 3.900390625]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 9.0, 9.0, 16.0, 22.0, 27.0, 31.0, 63.0, 60.0, 83.0, 122.0, 203.0, 312.0, 518.0, 841.0, 1349.0, 2231.0, 3914.0, 6769.0, 13018.0, 25158.0, 54971.0, 132899.0, 333566.0, 272541.0, 107236.0, 45506.0, 21400.0, 10883.0, 6031.0, 3399.0, 2018.0, 1257.0, 759.0, 431.0, 333.0, 174.0, 117.0, 78.0, 43.0, 45.0, 22.0, 31.0, 22.0, 14.0, 8.0, 6.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.1002197265625, -0.09717178344726562, -0.09412384033203125, -0.09107589721679688, -0.0880279541015625, -0.08498001098632812, -0.08193206787109375, -0.07888412475585938, -0.075836181640625, -0.07278823852539062, -0.06974029541015625, -0.06669235229492188, -0.0636444091796875, -0.060596466064453125, -0.05754852294921875, -0.054500579833984375, -0.05145263671875, -0.048404693603515625, -0.04535675048828125, -0.042308807373046875, -0.0392608642578125, -0.036212921142578125, -0.03316497802734375, -0.030117034912109375, -0.027069091796875, -0.024021148681640625, -0.02097320556640625, -0.017925262451171875, -0.0148773193359375, -0.011829376220703125, -0.00878143310546875, -0.005733489990234375, -0.002685546875, 0.000362396240234375, 0.00341033935546875, 0.006458282470703125, 0.0095062255859375, 0.012554168701171875, 0.01560211181640625, 0.018650054931640625, 0.021697998046875, 0.024745941162109375, 0.02779388427734375, 0.030841827392578125, 0.0338897705078125, 0.036937713623046875, 0.03998565673828125, 0.043033599853515625, 0.04608154296875, 0.049129486083984375, 0.05217742919921875, 0.055225372314453125, 0.0582733154296875, 0.061321258544921875, 0.06436920166015625, 0.06741714477539062, 0.070465087890625, 0.07351303100585938, 0.07656097412109375, 0.07960891723632812, 0.0826568603515625, 0.08570480346679688, 0.08875274658203125, 0.09180068969726562, 0.0948486328125]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 10.0, 7.0, 7.0, 22.0, 39.0, 52.0, 61.0, 64.0, 70.0, 99.0, 106.0, 92.0, 100.0, 62.0, 60.0, 49.0, 25.0, 18.0, 21.0, 15.0, 6.0, 6.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.3365020751953125e-05, -2.2670254111289978e-05, -2.197548747062683e-05, -2.1280720829963684e-05, -2.0585954189300537e-05, -1.989118754863739e-05, -1.9196420907974243e-05, -1.8501654267311096e-05, -1.780688762664795e-05, -1.7112120985984802e-05, -1.6417354345321655e-05, -1.5722587704658508e-05, -1.5027821063995361e-05, -1.4333054423332214e-05, -1.3638287782669067e-05, -1.294352114200592e-05, -1.2248754501342773e-05, -1.1553987860679626e-05, -1.085922122001648e-05, -1.0164454579353333e-05, -9.469687938690186e-06, -8.774921298027039e-06, -8.080154657363892e-06, -7.385388016700745e-06, -6.690621376037598e-06, -5.995854735374451e-06, -5.301088094711304e-06, -4.606321454048157e-06, -3.91155481338501e-06, -3.216788172721863e-06, -2.522021532058716e-06, -1.8272548913955688e-06, -1.1324882507324219e-06, -4.377216100692749e-07, 2.5704503059387207e-07, 9.51811671257019e-07, 1.646578311920166e-06, 2.341344952583313e-06, 3.03611159324646e-06, 3.730878233909607e-06, 4.425644874572754e-06, 5.120411515235901e-06, 5.815178155899048e-06, 6.509944796562195e-06, 7.204711437225342e-06, 7.899478077888489e-06, 8.594244718551636e-06, 9.289011359214783e-06, 9.98377799987793e-06, 1.0678544640541077e-05, 1.1373311281204224e-05, 1.206807792186737e-05, 1.2762844562530518e-05, 1.3457611203193665e-05, 1.4152377843856812e-05, 1.4847144484519958e-05, 1.5541911125183105e-05, 1.6236677765846252e-05, 1.69314444065094e-05, 1.7626211047172546e-05, 1.8320977687835693e-05, 1.901574432849884e-05, 1.9710510969161987e-05, 2.0405277609825134e-05, 2.110004425048828e-05]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 4.0, 6.0, 12.0, 12.0, 16.0, 24.0, 31.0, 52.0, 68.0, 97.0, 118.0, 219.0, 314.0, 424.0, 634.0, 1044.0, 1631.0, 2731.0, 5509.0, 11474.0, 30808.0, 101206.0, 419300.0, 341825.0, 83009.0, 25886.0, 10351.0, 4839.0, 2544.0, 1491.0, 968.0, 587.0, 421.0, 261.0, 200.0, 143.0, 65.0, 67.0, 54.0, 40.0, 22.0, 14.0, 10.0, 11.0, 8.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1893310546875, -0.18320846557617188, -0.17708587646484375, -0.17096328735351562, -0.1648406982421875, -0.15871810913085938, -0.15259552001953125, -0.14647293090820312, -0.140350341796875, -0.13422775268554688, -0.12810516357421875, -0.12198257446289062, -0.1158599853515625, -0.10973739624023438, -0.10361480712890625, -0.09749221801757812, -0.09136962890625, -0.08524703979492188, -0.07912445068359375, -0.07300186157226562, -0.0668792724609375, -0.060756683349609375, -0.05463409423828125, -0.048511505126953125, -0.042388916015625, -0.036266326904296875, -0.03014373779296875, -0.024021148681640625, -0.0178985595703125, -0.011775970458984375, -0.00565338134765625, 0.000469207763671875, 0.006591796875, 0.012714385986328125, 0.01883697509765625, 0.024959564208984375, 0.0310821533203125, 0.037204742431640625, 0.04332733154296875, 0.049449920654296875, 0.055572509765625, 0.061695098876953125, 0.06781768798828125, 0.07394027709960938, 0.0800628662109375, 0.08618545532226562, 0.09230804443359375, 0.09843063354492188, 0.10455322265625, 0.11067581176757812, 0.11679840087890625, 0.12292098999023438, 0.1290435791015625, 0.13516616821289062, 0.14128875732421875, 0.14741134643554688, 0.153533935546875, 0.15965652465820312, 0.16577911376953125, 0.17190170288085938, 0.1780242919921875, 0.18414688110351562, 0.19026947021484375, 0.19639205932617188, 0.2025146484375]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 5.0, 3.0, 5.0, 5.0, 10.0, 7.0, 13.0, 13.0, 8.0, 10.0, 24.0, 22.0, 30.0, 23.0, 26.0, 31.0, 32.0, 42.0, 51.0, 73.0, 72.0, 60.0, 60.0, 45.0, 47.0, 41.0, 42.0, 35.0, 33.0, 17.0, 21.0, 15.0, 6.0, 7.0, 13.0, 6.0, 9.0, 9.0, 8.0, 9.0, 6.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.028411865234375, -0.027597427368164062, -0.026782989501953125, -0.025968551635742188, -0.02515411376953125, -0.024339675903320312, -0.023525238037109375, -0.022710800170898438, -0.0218963623046875, -0.021081924438476562, -0.020267486572265625, -0.019453048706054688, -0.01863861083984375, -0.017824172973632812, -0.017009735107421875, -0.016195297241210938, -0.015380859375, -0.014566421508789062, -0.013751983642578125, -0.012937545776367188, -0.01212310791015625, -0.011308670043945312, -0.010494232177734375, -0.009679794311523438, -0.0088653564453125, -0.008050918579101562, -0.007236480712890625, -0.0064220428466796875, -0.00560760498046875, -0.0047931671142578125, -0.003978729248046875, -0.0031642913818359375, -0.002349853515625, -0.0015354156494140625, -0.000720977783203125, 9.34600830078125e-05, 0.00090789794921875, 0.0017223358154296875, 0.002536773681640625, 0.0033512115478515625, 0.0041656494140625, 0.0049800872802734375, 0.005794525146484375, 0.0066089630126953125, 0.00742340087890625, 0.008237838745117188, 0.009052276611328125, 0.009866714477539062, 0.01068115234375, 0.011495590209960938, 0.012310028076171875, 0.013124465942382812, 0.01393890380859375, 0.014753341674804688, 0.015567779541015625, 0.016382217407226562, 0.0171966552734375, 0.018011093139648438, 0.018825531005859375, 0.019639968872070312, 0.02045440673828125, 0.021268844604492188, 0.022083282470703125, 0.022897720336914062, 0.023712158203125]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 1.0, 4.0, 7.0, 20.0, 10.0, 12.0, 7.0, 12.0, 30.0, 26.0, 36.0, 45.0, 48.0, 52.0, 49.0, 58.0, 65.0, 73.0, 78.0, 59.0, 58.0, 50.0, 42.0, 33.0, 27.0, 20.0, 16.0, 9.0, 11.0, 12.0, 10.0, 4.0, 7.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.980368137359619, -5.7423176765441895, -5.504266738891602, -5.266216278076172, -5.028165340423584, -4.790114879608154, -4.552063941955566, -4.314013481140137, -4.075963020324707, -3.8379123210906982, -3.5998616218566895, -3.3618111610412598, -3.123760223388672, -2.885709762573242, -2.6476590633392334, -2.4096083641052246, -2.1715574264526367, -1.933506727218628, -1.6954560279846191, -1.4574054479599, -1.2193547487258911, -0.9813040494918823, -0.7432534694671631, -0.5052027702331543, -0.2671520709991455, -0.029101401567459106, 0.2089492678642273, 0.4469999074935913, 0.6850506067276001, 0.9231013059616089, 1.1611518859863281, 1.399202585220337, 1.637253761291504, 1.8753044605255127, 2.1133551597595215, 2.351405620574951, 2.589456558227539, 2.8275070190429688, 3.0655577182769775, 3.3036084175109863, 3.541659116744995, 3.779709815979004, 4.017760276794434, 4.2558112144470215, 4.493861675262451, 4.731912612915039, 4.969963073730469, 5.208013534545898, 5.446064472198486, 5.684114933013916, 5.922165870666504, 6.160216331481934, 6.3982672691345215, 6.636317729949951, 6.874368667602539, 7.112419128417969, 7.350469589233398, 7.588520050048828, 7.826570987701416, 8.064621925354004, 8.302672386169434, 8.540722846984863, 8.778773307800293, 9.016824722290039, 9.254875183105469]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 9.0, 7.0, 7.0, 8.0, 10.0, 11.0, 20.0, 22.0, 33.0, 40.0, 35.0, 48.0, 50.0, 52.0, 51.0, 58.0, 65.0, 55.0, 58.0, 57.0, 47.0, 46.0, 44.0, 25.0, 28.0, 26.0, 19.0, 13.0, 20.0, 8.0, 13.0, 9.0, 5.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.99626350402832, -8.72859001159668, -8.460917472839355, -8.193243980407715, -7.925570964813232, -7.65789794921875, -7.390224456787109, -7.122551441192627, -6.8548784255981445, -6.587205410003662, -6.31953239440918, -6.051858901977539, -5.784185886383057, -5.516512870788574, -5.248839378356934, -4.981166362762451, -4.713493347167969, -4.445820331573486, -4.178147315979004, -3.9104738235473633, -3.642800807952881, -3.3751277923583984, -3.107454538345337, -2.8397812843322754, -2.572108268737793, -2.3044352531433105, -2.036761999130249, -1.769088864326477, -1.501415729522705, -1.233742594718933, -0.9660694599151611, -0.6983963251113892, -0.4307222366333008, -0.1630491018295288, 0.10462403297424316, 0.37229716777801514, 0.6399703025817871, 0.9076434373855591, 1.175316572189331, 1.442989706993103, 1.710662841796875, 1.978335976600647, 2.246009111404419, 2.5136823654174805, 2.781355381011963, 3.0490283966064453, 3.316701650619507, 3.5843749046325684, 3.852047920227051, 4.119720935821533, 4.387393951416016, 4.655067443847656, 4.922740459442139, 5.190413475036621, 5.458086967468262, 5.725759983062744, 5.993432998657227, 6.261106014251709, 6.528779029846191, 6.796452522277832, 7.0641255378723145, 7.331798553466797, 7.5994720458984375, 7.86714506149292, 8.134818077087402]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 4.0, 8.0, 9.0, 10.0, 16.0, 29.0, 39.0, 52.0, 103.0, 141.0, 221.0, 313.0, 510.0, 789.0, 1333.0, 2088.0, 3382.0, 5524.0, 8997.0, 15288.0, 25250.0, 41877.0, 66622.0, 99789.0, 136114.0, 156480.0, 148718.0, 118102.0, 82215.0, 52708.0, 32217.0, 19352.0, 11760.0, 7082.0, 4324.0, 2678.0, 1621.0, 961.0, 646.0, 444.0, 276.0, 140.0, 116.0, 72.0, 34.0, 38.0, 26.0, 13.0, 14.0, 6.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.609375, -4.45440673828125, -4.2994384765625, -4.14447021484375, -3.989501953125, -3.83453369140625, -3.6795654296875, -3.52459716796875, -3.36962890625, -3.21466064453125, -3.0596923828125, -2.90472412109375, -2.749755859375, -2.59478759765625, -2.4398193359375, -2.28485107421875, -2.1298828125, -1.97491455078125, -1.8199462890625, -1.66497802734375, -1.510009765625, -1.35504150390625, -1.2000732421875, -1.04510498046875, -0.89013671875, -0.73516845703125, -0.5802001953125, -0.42523193359375, -0.270263671875, -0.11529541015625, 0.0396728515625, 0.19464111328125, 0.349609375, 0.50457763671875, 0.6595458984375, 0.81451416015625, 0.969482421875, 1.12445068359375, 1.2794189453125, 1.43438720703125, 1.58935546875, 1.74432373046875, 1.8992919921875, 2.05426025390625, 2.209228515625, 2.36419677734375, 2.5191650390625, 2.67413330078125, 2.8291015625, 2.98406982421875, 3.1390380859375, 3.29400634765625, 3.448974609375, 3.60394287109375, 3.7589111328125, 3.91387939453125, 4.06884765625, 4.22381591796875, 4.3787841796875, 4.53375244140625, 4.688720703125, 4.84368896484375, 4.9986572265625, 5.15362548828125, 5.30859375]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 3.0, 3.0, 8.0, 7.0, 14.0, 5.0, 8.0, 20.0, 9.0, 21.0, 24.0, 32.0, 31.0, 43.0, 38.0, 37.0, 53.0, 45.0, 53.0, 47.0, 60.0, 51.0, 46.0, 46.0, 37.0, 40.0, 35.0, 47.0, 28.0, 18.0, 14.0, 18.0, 13.0, 14.0, 11.0, 3.0, 7.0, 5.0, 8.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.34375, -7.10687255859375, -6.8699951171875, -6.63311767578125, -6.396240234375, -6.15936279296875, -5.9224853515625, -5.68560791015625, -5.44873046875, -5.21185302734375, -4.9749755859375, -4.73809814453125, -4.501220703125, -4.26434326171875, -4.0274658203125, -3.79058837890625, -3.5537109375, -3.31683349609375, -3.0799560546875, -2.84307861328125, -2.606201171875, -2.36932373046875, -2.1324462890625, -1.89556884765625, -1.65869140625, -1.42181396484375, -1.1849365234375, -0.94805908203125, -0.711181640625, -0.47430419921875, -0.2374267578125, -0.00054931640625, 0.236328125, 0.47320556640625, 0.7100830078125, 0.94696044921875, 1.183837890625, 1.42071533203125, 1.6575927734375, 1.89447021484375, 2.13134765625, 2.36822509765625, 2.6051025390625, 2.84197998046875, 3.078857421875, 3.31573486328125, 3.5526123046875, 3.78948974609375, 4.0263671875, 4.26324462890625, 4.5001220703125, 4.73699951171875, 4.973876953125, 5.21075439453125, 5.4476318359375, 5.68450927734375, 5.92138671875, 6.15826416015625, 6.3951416015625, 6.63201904296875, 6.868896484375, 7.10577392578125, 7.3426513671875, 7.57952880859375, 7.81640625]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 6.0, 4.0, 8.0, 17.0, 19.0, 34.0, 43.0, 46.0, 117.0, 173.0, 262.0, 370.0, 663.0, 1055.0, 1724.0, 2851.0, 4527.0, 7416.0, 12260.0, 19134.0, 31123.0, 48893.0, 72620.0, 102105.0, 129699.0, 143406.0, 134608.0, 109089.0, 79918.0, 53981.0, 35132.0, 21883.0, 13724.0, 8276.0, 5265.0, 3117.0, 1850.0, 1148.0, 730.0, 503.0, 264.0, 200.0, 112.0, 69.0, 40.0, 28.0, 18.0, 17.0, 6.0, 7.0, 2.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0], "bins": [-4.49609375, -4.3582763671875, -4.220458984375, -4.0826416015625, -3.94482421875, -3.8070068359375, -3.669189453125, -3.5313720703125, -3.3935546875, -3.2557373046875, -3.117919921875, -2.9801025390625, -2.84228515625, -2.7044677734375, -2.566650390625, -2.4288330078125, -2.291015625, -2.1531982421875, -2.015380859375, -1.8775634765625, -1.73974609375, -1.6019287109375, -1.464111328125, -1.3262939453125, -1.1884765625, -1.0506591796875, -0.912841796875, -0.7750244140625, -0.63720703125, -0.4993896484375, -0.361572265625, -0.2237548828125, -0.0859375, 0.0518798828125, 0.189697265625, 0.3275146484375, 0.46533203125, 0.6031494140625, 0.740966796875, 0.8787841796875, 1.0166015625, 1.1544189453125, 1.292236328125, 1.4300537109375, 1.56787109375, 1.7056884765625, 1.843505859375, 1.9813232421875, 2.119140625, 2.2569580078125, 2.394775390625, 2.5325927734375, 2.67041015625, 2.8082275390625, 2.946044921875, 3.0838623046875, 3.2216796875, 3.3594970703125, 3.497314453125, 3.6351318359375, 3.77294921875, 3.9107666015625, 4.048583984375, 4.1864013671875, 4.32421875]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 3.0, 1.0, 6.0, 10.0, 8.0, 16.0, 11.0, 19.0, 15.0, 16.0, 29.0, 26.0, 37.0, 22.0, 38.0, 41.0, 35.0, 41.0, 41.0, 42.0, 46.0, 55.0, 44.0, 39.0, 33.0, 38.0, 38.0, 41.0, 40.0, 23.0, 18.0, 27.0, 18.0, 18.0, 11.0, 11.0, 8.0, 5.0, 10.0, 7.0, 7.0, 1.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.37109375, -4.24847412109375, -4.1258544921875, -4.00323486328125, -3.880615234375, -3.75799560546875, -3.6353759765625, -3.51275634765625, -3.39013671875, -3.26751708984375, -3.1448974609375, -3.02227783203125, -2.899658203125, -2.77703857421875, -2.6544189453125, -2.53179931640625, -2.4091796875, -2.28656005859375, -2.1639404296875, -2.04132080078125, -1.918701171875, -1.79608154296875, -1.6734619140625, -1.55084228515625, -1.42822265625, -1.30560302734375, -1.1829833984375, -1.06036376953125, -0.937744140625, -0.81512451171875, -0.6925048828125, -0.56988525390625, -0.447265625, -0.32464599609375, -0.2020263671875, -0.07940673828125, 0.043212890625, 0.16583251953125, 0.2884521484375, 0.41107177734375, 0.53369140625, 0.65631103515625, 0.7789306640625, 0.90155029296875, 1.024169921875, 1.14678955078125, 1.2694091796875, 1.39202880859375, 1.5146484375, 1.63726806640625, 1.7598876953125, 1.88250732421875, 2.005126953125, 2.12774658203125, 2.2503662109375, 2.37298583984375, 2.49560546875, 2.61822509765625, 2.7408447265625, 2.86346435546875, 2.986083984375, 3.10870361328125, 3.2313232421875, 3.35394287109375, 3.4765625]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 7.0, 8.0, 7.0, 11.0, 20.0, 17.0, 30.0, 27.0, 63.0, 90.0, 128.0, 197.0, 315.0, 479.0, 730.0, 1060.0, 1669.0, 2765.0, 4308.0, 7086.0, 11928.0, 19527.0, 33113.0, 54828.0, 88694.0, 130680.0, 164713.0, 165831.0, 131364.0, 89081.0, 55577.0, 33169.0, 20058.0, 12015.0, 6992.0, 4510.0, 2671.0, 1703.0, 1020.0, 709.0, 445.0, 288.0, 195.0, 140.0, 96.0, 69.0, 41.0, 28.0, 25.0, 16.0, 8.0, 8.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6328125, -1.5801544189453125, -1.527496337890625, -1.4748382568359375, -1.42218017578125, -1.3695220947265625, -1.316864013671875, -1.2642059326171875, -1.2115478515625, -1.1588897705078125, -1.106231689453125, -1.0535736083984375, -1.00091552734375, -0.9482574462890625, -0.895599365234375, -0.8429412841796875, -0.790283203125, -0.7376251220703125, -0.684967041015625, -0.6323089599609375, -0.57965087890625, -0.5269927978515625, -0.474334716796875, -0.4216766357421875, -0.3690185546875, -0.3163604736328125, -0.263702392578125, -0.2110443115234375, -0.15838623046875, -0.1057281494140625, -0.053070068359375, -0.0004119873046875, 0.05224609375, 0.1049041748046875, 0.157562255859375, 0.2102203369140625, 0.26287841796875, 0.3155364990234375, 0.368194580078125, 0.4208526611328125, 0.4735107421875, 0.5261688232421875, 0.578826904296875, 0.6314849853515625, 0.68414306640625, 0.7368011474609375, 0.789459228515625, 0.8421173095703125, 0.894775390625, 0.9474334716796875, 1.000091552734375, 1.0527496337890625, 1.10540771484375, 1.1580657958984375, 1.210723876953125, 1.2633819580078125, 1.3160400390625, 1.3686981201171875, 1.421356201171875, 1.4740142822265625, 1.52667236328125, 1.5793304443359375, 1.631988525390625, 1.6846466064453125, 1.7373046875]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 2.0, 7.0, 6.0, 4.0, 7.0, 9.0, 9.0, 13.0, 21.0, 26.0, 13.0, 33.0, 20.0, 40.0, 38.0, 45.0, 60.0, 52.0, 77.0, 58.0, 55.0, 62.0, 52.0, 50.0, 38.0, 28.0, 26.0, 25.0, 19.0, 21.0, 12.0, 9.0, 16.0, 8.0, 6.0, 5.0, 6.0, 5.0, 7.0, 5.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.0001418590545654297, -0.00013751909136772156, -0.00013317912817001343, -0.0001288391649723053, -0.00012449920177459717, -0.00012015923857688904, -0.00011581927537918091, -0.00011147931218147278, -0.00010713934898376465, -0.00010279938578605652, -9.845942258834839e-05, -9.411945939064026e-05, -8.977949619293213e-05, -8.5439532995224e-05, -8.109956979751587e-05, -7.675960659980774e-05, -7.241964340209961e-05, -6.807968020439148e-05, -6.373971700668335e-05, -5.939975380897522e-05, -5.505979061126709e-05, -5.071982741355896e-05, -4.637986421585083e-05, -4.20399010181427e-05, -3.769993782043457e-05, -3.335997462272644e-05, -2.902001142501831e-05, -2.468004822731018e-05, -2.034008502960205e-05, -1.600012183189392e-05, -1.1660158634185791e-05, -7.320195436477661e-06, -2.9802322387695312e-06, 1.3597309589385986e-06, 5.6996941566467285e-06, 1.0039657354354858e-05, 1.4379620552062988e-05, 1.8719583749771118e-05, 2.3059546947479248e-05, 2.7399510145187378e-05, 3.173947334289551e-05, 3.607943654060364e-05, 4.041939973831177e-05, 4.47593629360199e-05, 4.909932613372803e-05, 5.343928933143616e-05, 5.777925252914429e-05, 6.211921572685242e-05, 6.645917892456055e-05, 7.079914212226868e-05, 7.51391053199768e-05, 7.947906851768494e-05, 8.381903171539307e-05, 8.81589949131012e-05, 9.249895811080933e-05, 9.683892130851746e-05, 0.00010117888450622559, 0.00010551884770393372, 0.00010985881090164185, 0.00011419877409934998, 0.0001185387372970581, 0.00012287870049476624, 0.00012721866369247437, 0.0001315586268901825, 0.00013589859008789062]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 4.0, 4.0, 6.0, 3.0, 8.0, 25.0, 26.0, 31.0, 51.0, 93.0, 119.0, 152.0, 240.0, 345.0, 564.0, 755.0, 1089.0, 1689.0, 2642.0, 4075.0, 6341.0, 10079.0, 16325.0, 26512.0, 43299.0, 68785.0, 104060.0, 141828.0, 161280.0, 147866.0, 111021.0, 74670.0, 47424.0, 28909.0, 17714.0, 11072.0, 6698.0, 4347.0, 2875.0, 1823.0, 1176.0, 782.0, 543.0, 374.0, 272.0, 166.0, 124.0, 107.0, 55.0, 42.0, 29.0, 17.0, 17.0, 2.0, 4.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-1.615234375, -1.5641021728515625, -1.512969970703125, -1.4618377685546875, -1.41070556640625, -1.3595733642578125, -1.308441162109375, -1.2573089599609375, -1.2061767578125, -1.1550445556640625, -1.103912353515625, -1.0527801513671875, -1.00164794921875, -0.9505157470703125, -0.899383544921875, -0.8482513427734375, -0.797119140625, -0.7459869384765625, -0.694854736328125, -0.6437225341796875, -0.59259033203125, -0.5414581298828125, -0.490325927734375, -0.4391937255859375, -0.3880615234375, -0.3369293212890625, -0.285797119140625, -0.2346649169921875, -0.18353271484375, -0.1324005126953125, -0.081268310546875, -0.0301361083984375, 0.02099609375, 0.0721282958984375, 0.123260498046875, 0.1743927001953125, 0.22552490234375, 0.2766571044921875, 0.327789306640625, 0.3789215087890625, 0.4300537109375, 0.4811859130859375, 0.532318115234375, 0.5834503173828125, 0.63458251953125, 0.6857147216796875, 0.736846923828125, 0.7879791259765625, 0.839111328125, 0.8902435302734375, 0.941375732421875, 0.9925079345703125, 1.04364013671875, 1.0947723388671875, 1.145904541015625, 1.1970367431640625, 1.2481689453125, 1.2993011474609375, 1.350433349609375, 1.4015655517578125, 1.45269775390625, 1.5038299560546875, 1.554962158203125, 1.6060943603515625, 1.6572265625]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 7.0, 4.0, 8.0, 4.0, 11.0, 8.0, 6.0, 10.0, 16.0, 16.0, 19.0, 15.0, 23.0, 27.0, 19.0, 35.0, 38.0, 45.0, 62.0, 45.0, 60.0, 56.0, 64.0, 37.0, 48.0, 37.0, 36.0, 26.0, 26.0, 25.0, 30.0, 19.0, 15.0, 14.0, 14.0, 10.0, 15.0, 6.0, 10.0, 6.0, 7.0, 3.0, 6.0, 6.0, 6.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.603515625, -0.5836105346679688, -0.5637054443359375, -0.5438003540039062, -0.523895263671875, -0.5039901733398438, -0.4840850830078125, -0.46417999267578125, -0.44427490234375, -0.42436981201171875, -0.4044647216796875, -0.38455963134765625, -0.364654541015625, -0.34474945068359375, -0.3248443603515625, -0.30493927001953125, -0.2850341796875, -0.26512908935546875, -0.2452239990234375, -0.22531890869140625, -0.205413818359375, -0.18550872802734375, -0.1656036376953125, -0.14569854736328125, -0.12579345703125, -0.10588836669921875, -0.0859832763671875, -0.06607818603515625, -0.046173095703125, -0.02626800537109375, -0.0063629150390625, 0.01354217529296875, 0.033447265625, 0.05335235595703125, 0.0732574462890625, 0.09316253662109375, 0.113067626953125, 0.13297271728515625, 0.1528778076171875, 0.17278289794921875, 0.19268798828125, 0.21259307861328125, 0.2324981689453125, 0.25240325927734375, 0.272308349609375, 0.29221343994140625, 0.3121185302734375, 0.33202362060546875, 0.3519287109375, 0.37183380126953125, 0.3917388916015625, 0.41164398193359375, 0.431549072265625, 0.45145416259765625, 0.4713592529296875, 0.49126434326171875, 0.51116943359375, 0.5310745239257812, 0.5509796142578125, 0.5708847045898438, 0.590789794921875, 0.6106948852539062, 0.6305999755859375, 0.6505050659179688, 0.67041015625]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 4.0, 7.0, 13.0, 9.0, 10.0, 12.0, 19.0, 17.0, 27.0, 40.0, 61.0, 57.0, 52.0, 49.0, 65.0, 69.0, 72.0, 74.0, 71.0, 62.0, 40.0, 41.0, 25.0, 25.0, 16.0, 15.0, 14.0, 8.0, 6.0, 11.0, 4.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.920701026916504, -6.660393238067627, -6.400084972381592, -6.139777183532715, -5.87946891784668, -5.619161128997803, -5.358853340148926, -5.098545074462891, -4.8382368087768555, -4.5779290199279785, -4.317620754241943, -4.057312965393066, -3.7970046997070312, -3.5366969108581543, -3.2763888835906982, -3.016080856323242, -2.7557730674743652, -2.495465040206909, -2.235157012939453, -1.9748491048812866, -1.7145410776138306, -1.4542330503463745, -1.193925142288208, -0.933617115020752, -0.6733090877532959, -0.41300109028816223, -0.15269309282302856, 0.10761487483978271, 0.36792290210723877, 0.6282309293746948, 0.8885388374328613, 1.1488468647003174, 1.4091548919677734, 1.6694629192352295, 1.9297709465026855, 2.1900787353515625, 2.4503870010375977, 2.7106947898864746, 2.9710028171539307, 3.2313108444213867, 3.4916188716888428, 3.751926898956299, 4.012234687805176, 4.272542953491211, 4.532850742340088, 4.793159008026123, 5.053466796875, 5.313775062561035, 5.574082851409912, 5.834390640258789, 6.094698905944824, 6.355006694793701, 6.615314960479736, 6.875622749328613, 7.135931015014648, 7.396238803863525, 7.656546592712402, 7.916854381561279, 8.177162170410156, 8.437470436096191, 8.697778701782227, 8.958086967468262, 9.21839427947998, 9.478702545166016, 9.73901081085205]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 8.0, 6.0, 6.0, 10.0, 6.0, 11.0, 11.0, 16.0, 23.0, 23.0, 27.0, 30.0, 35.0, 37.0, 43.0, 54.0, 46.0, 47.0, 54.0, 44.0, 52.0, 62.0, 50.0, 45.0, 37.0, 34.0, 22.0, 29.0, 23.0, 20.0, 16.0, 21.0, 13.0, 13.0, 7.0, 7.0, 4.0, 2.0, 5.0, 4.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.772137641906738, -7.537145614624023, -7.302153587341309, -7.067161560058594, -6.832169532775879, -6.597177505493164, -6.362185955047607, -6.127193927764893, -5.892201900482178, -5.657209873199463, -5.422217845916748, -5.187225818634033, -4.952234268188477, -4.717242240905762, -4.482250213623047, -4.247258186340332, -4.012266159057617, -3.7772741317749023, -3.5422821044921875, -3.3072903156280518, -3.072298288345337, -2.837306261062622, -2.6023144721984863, -2.3673224449157715, -2.1323304176330566, -1.8973383903503418, -1.6623464822769165, -1.4273545742034912, -1.1923625469207764, -0.9573705196380615, -0.7223786115646362, -0.48738670349121094, -0.2523941993713379, -0.017402231693267822, 0.21758973598480225, 0.4525817036628723, 0.6875736713409424, 0.9225656986236572, 1.1575576066970825, 1.3925495147705078, 1.6275415420532227, 1.8625335693359375, 2.0975255966186523, 2.332517385482788, 2.567509412765503, 2.8025014400482178, 3.0374932289123535, 3.2724852561950684, 3.507477283477783, 3.742469310760498, 3.977461338043213, 4.212453365325928, 4.447444915771484, 4.682436943054199, 4.917428970336914, 5.152420997619629, 5.387413024902344, 5.622405052185059, 5.857397079467773, 6.092389106750488, 6.327381134033203, 6.562373161315918, 6.797364711761475, 7.0323567390441895, 7.267348766326904]}, "gradients/decoder.bert.encoder.layer.6.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 5.0, 1.0, 1.0, 5.0, 5.0, 11.0, 11.0, 23.0, 25.0, 39.0, 52.0, 85.0, 133.0, 169.0, 321.0, 408.0, 646.0, 945.0, 1553.0, 2411.0, 3688.0, 5870.0, 9598.0, 15728.0, 26936.0, 46981.0, 85189.0, 156789.0, 290175.0, 509648.0, 761727.0, 825466.0, 619406.0, 369431.0, 201981.0, 110127.0, 61357.0, 34982.0, 20352.0, 12013.0, 7365.0, 4583.0, 2863.0, 1796.0, 1204.0, 770.0, 502.0, 328.0, 203.0, 142.0, 87.0, 62.0, 41.0, 18.0, 11.0, 8.0, 16.0, 4.0, 3.0, 1.0, 0.0, 1.0], "bins": [-6.47265625, -6.27777099609375, -6.0828857421875, -5.88800048828125, -5.693115234375, -5.49822998046875, -5.3033447265625, -5.10845947265625, -4.91357421875, -4.71868896484375, -4.5238037109375, -4.32891845703125, -4.134033203125, -3.93914794921875, -3.7442626953125, -3.54937744140625, -3.3544921875, -3.15960693359375, -2.9647216796875, -2.76983642578125, -2.574951171875, -2.38006591796875, -2.1851806640625, -1.99029541015625, -1.79541015625, -1.60052490234375, -1.4056396484375, -1.21075439453125, -1.015869140625, -0.82098388671875, -0.6260986328125, -0.43121337890625, -0.236328125, -0.04144287109375, 0.1534423828125, 0.34832763671875, 0.543212890625, 0.73809814453125, 0.9329833984375, 1.12786865234375, 1.32275390625, 1.51763916015625, 1.7125244140625, 1.90740966796875, 2.102294921875, 2.29718017578125, 2.4920654296875, 2.68695068359375, 2.8818359375, 3.07672119140625, 3.2716064453125, 3.46649169921875, 3.661376953125, 3.85626220703125, 4.0511474609375, 4.24603271484375, 4.44091796875, 4.63580322265625, 4.8306884765625, 5.02557373046875, 5.220458984375, 5.41534423828125, 5.6102294921875, 5.80511474609375, 6.0]}, "gradients/decoder.bert.encoder.layer.6.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 3.0, 6.0, 5.0, 6.0, 6.0, 10.0, 15.0, 18.0, 25.0, 19.0, 26.0, 25.0, 36.0, 29.0, 46.0, 49.0, 40.0, 50.0, 41.0, 59.0, 37.0, 47.0, 52.0, 48.0, 61.0, 38.0, 35.0, 24.0, 22.0, 19.0, 17.0, 12.0, 20.0, 14.0, 8.0, 14.0, 4.0, 3.0, 2.0, 5.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.37109375, -5.21075439453125, -5.0504150390625, -4.89007568359375, -4.729736328125, -4.56939697265625, -4.4090576171875, -4.24871826171875, -4.08837890625, -3.92803955078125, -3.7677001953125, -3.60736083984375, -3.447021484375, -3.28668212890625, -3.1263427734375, -2.96600341796875, -2.8056640625, -2.64532470703125, -2.4849853515625, -2.32464599609375, -2.164306640625, -2.00396728515625, -1.8436279296875, -1.68328857421875, -1.52294921875, -1.36260986328125, -1.2022705078125, -1.04193115234375, -0.881591796875, -0.72125244140625, -0.5609130859375, -0.40057373046875, -0.240234375, -0.07989501953125, 0.0804443359375, 0.24078369140625, 0.401123046875, 0.56146240234375, 0.7218017578125, 0.88214111328125, 1.04248046875, 1.20281982421875, 1.3631591796875, 1.52349853515625, 1.683837890625, 1.84417724609375, 2.0045166015625, 2.16485595703125, 2.3251953125, 2.48553466796875, 2.6458740234375, 2.80621337890625, 2.966552734375, 3.12689208984375, 3.2872314453125, 3.44757080078125, 3.60791015625, 3.76824951171875, 3.9285888671875, 4.08892822265625, 4.249267578125, 4.40960693359375, 4.5699462890625, 4.73028564453125, 4.890625]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 11.0, 11.0, 15.0, 13.0, 20.0, 34.0, 50.0, 102.0, 139.0, 250.0, 307.0, 586.0, 925.0, 1525.0, 2574.0, 4580.0, 8225.0, 14997.0, 26887.0, 50491.0, 94553.0, 177087.0, 318253.0, 525541.0, 729424.0, 769857.0, 604975.0, 384666.0, 219017.0, 119087.0, 63570.0, 34169.0, 18421.0, 10229.0, 5806.0, 3305.0, 1869.0, 1115.0, 600.0, 386.0, 210.0, 164.0, 99.0, 50.0, 35.0, 24.0, 11.0, 10.0, 5.0, 1.0, 6.0, 2.0, 0.0, 0.0, 2.0], "bins": [-6.92578125, -6.72314453125, -6.5205078125, -6.31787109375, -6.115234375, -5.91259765625, -5.7099609375, -5.50732421875, -5.3046875, -5.10205078125, -4.8994140625, -4.69677734375, -4.494140625, -4.29150390625, -4.0888671875, -3.88623046875, -3.68359375, -3.48095703125, -3.2783203125, -3.07568359375, -2.873046875, -2.67041015625, -2.4677734375, -2.26513671875, -2.0625, -1.85986328125, -1.6572265625, -1.45458984375, -1.251953125, -1.04931640625, -0.8466796875, -0.64404296875, -0.44140625, -0.23876953125, -0.0361328125, 0.16650390625, 0.369140625, 0.57177734375, 0.7744140625, 0.97705078125, 1.1796875, 1.38232421875, 1.5849609375, 1.78759765625, 1.990234375, 2.19287109375, 2.3955078125, 2.59814453125, 2.80078125, 3.00341796875, 3.2060546875, 3.40869140625, 3.611328125, 3.81396484375, 4.0166015625, 4.21923828125, 4.421875, 4.62451171875, 4.8271484375, 5.02978515625, 5.232421875, 5.43505859375, 5.6376953125, 5.84033203125, 6.04296875]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 5.0, 6.0, 4.0, 13.0, 21.0, 28.0, 44.0, 67.0, 72.0, 75.0, 115.0, 115.0, 127.0, 190.0, 201.0, 228.0, 258.0, 268.0, 234.0, 275.0, 261.0, 240.0, 210.0, 186.0, 147.0, 137.0, 111.0, 82.0, 84.0, 53.0, 43.0, 42.0, 33.0, 26.0, 23.0, 17.0, 10.0, 7.0, 3.0, 3.0, 4.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8388671875, -1.7552947998046875, -1.671722412109375, -1.5881500244140625, -1.50457763671875, -1.4210052490234375, -1.337432861328125, -1.2538604736328125, -1.1702880859375, -1.0867156982421875, -1.003143310546875, -0.9195709228515625, -0.83599853515625, -0.7524261474609375, -0.668853759765625, -0.5852813720703125, -0.501708984375, -0.4181365966796875, -0.334564208984375, -0.2509918212890625, -0.16741943359375, -0.0838470458984375, -0.000274658203125, 0.0832977294921875, 0.1668701171875, 0.2504425048828125, 0.334014892578125, 0.4175872802734375, 0.50115966796875, 0.5847320556640625, 0.668304443359375, 0.7518768310546875, 0.83544921875, 0.9190216064453125, 1.002593994140625, 1.0861663818359375, 1.16973876953125, 1.2533111572265625, 1.336883544921875, 1.4204559326171875, 1.5040283203125, 1.5876007080078125, 1.671173095703125, 1.7547454833984375, 1.83831787109375, 1.9218902587890625, 2.005462646484375, 2.0890350341796875, 2.172607421875, 2.2561798095703125, 2.339752197265625, 2.4233245849609375, 2.50689697265625, 2.5904693603515625, 2.674041748046875, 2.7576141357421875, 2.8411865234375, 2.9247589111328125, 3.008331298828125, 3.0919036865234375, 3.17547607421875, 3.2590484619140625, 3.342620849609375, 3.4261932373046875, 3.509765625]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 4.0, 2.0, 9.0, 3.0, 8.0, 7.0, 19.0, 13.0, 24.0, 22.0, 24.0, 32.0, 51.0, 61.0, 58.0, 75.0, 80.0, 68.0, 70.0, 71.0, 57.0, 51.0, 46.0, 30.0, 25.0, 19.0, 19.0, 24.0, 9.0, 16.0, 4.0, 1.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.03253173828125, -6.754266738891602, -6.476001739501953, -6.197736740112305, -5.919471740722656, -5.641206741333008, -5.362941265106201, -5.084676265716553, -4.806411266326904, -4.528146266937256, -4.249881267547607, -3.97161602973938, -3.6933510303497314, -3.415086030960083, -3.1368207931518555, -2.858555793762207, -2.5802907943725586, -2.30202579498291, -2.0237607955932617, -1.7454955577850342, -1.4672305583953857, -1.1889655590057373, -0.9107004404067993, -0.6324353218078613, -0.3541703224182129, -0.07590526342391968, 0.20235979557037354, 0.48062485456466675, 0.75888991355896, 1.0371549129486084, 1.3154200315475464, 1.5936851501464844, 1.8719501495361328, 2.1502151489257812, 2.4284801483154297, 2.7067453861236572, 2.9850103855133057, 3.263275384902954, 3.5415406227111816, 3.81980562210083, 4.0980706214904785, 4.376335620880127, 4.654600620269775, 4.932865619659424, 5.2111310958862305, 5.489396095275879, 5.767661094665527, 6.045926094055176, 6.324191093444824, 6.602456092834473, 6.880721092224121, 7.1589860916137695, 7.437251091003418, 7.715516090393066, 7.993781566619873, 8.27204704284668, 8.550312042236328, 8.828577041625977, 9.106842041015625, 9.385107040405273, 9.663372039794922, 9.94163703918457, 10.219902038574219, 10.498167037963867, 10.776432037353516]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 11.0, 5.0, 7.0, 9.0, 15.0, 13.0, 17.0, 24.0, 26.0, 28.0, 34.0, 28.0, 48.0, 36.0, 44.0, 50.0, 58.0, 57.0, 56.0, 48.0, 46.0, 49.0, 40.0, 40.0, 33.0, 32.0, 18.0, 14.0, 33.0, 13.0, 19.0, 16.0, 9.0, 8.0, 8.0, 6.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.878626823425293, -7.638662338256836, -7.398697853088379, -7.158733367919922, -6.918768882751465, -6.678804397583008, -6.438839435577393, -6.1988749504089355, -5.9589104652404785, -5.7189459800720215, -5.4789814949035645, -5.239017009735107, -4.999052047729492, -4.759087562561035, -4.519123077392578, -4.279158592224121, -4.039194107055664, -3.799229621887207, -3.55926513671875, -3.319300413131714, -3.079335927963257, -2.8393714427948, -2.5994067192077637, -2.3594422340393066, -2.1194777488708496, -1.8795132637023926, -1.639548659324646, -1.3995840549468994, -1.1596195697784424, -0.9196550846099854, -0.6796904802322388, -0.4397258758544922, -0.19976139068603516, 0.04020315408706665, 0.28016769886016846, 0.5201322436332703, 0.7600967884063721, 1.000061273574829, 1.2400258779525757, 1.4799904823303223, 1.7199549674987793, 1.9599194526672363, 2.1998839378356934, 2.4398486614227295, 2.6798131465911865, 2.9197776317596436, 3.1597423553466797, 3.3997068405151367, 3.6396713256835938, 3.879635810852051, 4.119600296020508, 4.359564781188965, 4.599529266357422, 4.839493751525879, 5.079458713531494, 5.319423198699951, 5.559387683868408, 5.799352169036865, 6.039316654205322, 6.279281139373779, 6.5192461013793945, 6.759210586547852, 6.999175071716309, 7.239139556884766, 7.479104042053223]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 8.0, 8.0, 14.0, 11.0, 25.0, 38.0, 56.0, 88.0, 122.0, 174.0, 278.0, 400.0, 610.0, 843.0, 1379.0, 1978.0, 2907.0, 4659.0, 7144.0, 10963.0, 17143.0, 26101.0, 40999.0, 62727.0, 96119.0, 139392.0, 171806.0, 152260.0, 108390.0, 70973.0, 46335.0, 29500.0, 19104.0, 12382.0, 8190.0, 5287.0, 3469.0, 2230.0, 1486.0, 963.0, 666.0, 417.0, 303.0, 213.0, 138.0, 94.0, 58.0, 44.0, 25.0, 21.0, 10.0, 8.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.76025390625, -0.735443115234375, -0.71063232421875, -0.685821533203125, -0.6610107421875, -0.636199951171875, -0.61138916015625, -0.586578369140625, -0.561767578125, -0.536956787109375, -0.51214599609375, -0.487335205078125, -0.4625244140625, -0.437713623046875, -0.41290283203125, -0.388092041015625, -0.36328125, -0.338470458984375, -0.31365966796875, -0.288848876953125, -0.2640380859375, -0.239227294921875, -0.21441650390625, -0.189605712890625, -0.164794921875, -0.139984130859375, -0.11517333984375, -0.090362548828125, -0.0655517578125, -0.040740966796875, -0.01593017578125, 0.008880615234375, 0.03369140625, 0.058502197265625, 0.08331298828125, 0.108123779296875, 0.1329345703125, 0.157745361328125, 0.18255615234375, 0.207366943359375, 0.232177734375, 0.256988525390625, 0.28179931640625, 0.306610107421875, 0.3314208984375, 0.356231689453125, 0.38104248046875, 0.405853271484375, 0.4306640625, 0.455474853515625, 0.48028564453125, 0.505096435546875, 0.5299072265625, 0.554718017578125, 0.57952880859375, 0.604339599609375, 0.629150390625, 0.653961181640625, 0.67877197265625, 0.703582763671875, 0.7283935546875, 0.753204345703125, 0.77801513671875, 0.802825927734375, 0.82763671875]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 2.0, 8.0, 16.0, 14.0, 18.0, 16.0, 21.0, 25.0, 37.0, 32.0, 33.0, 57.0, 43.0, 49.0, 59.0, 67.0, 61.0, 49.0, 70.0, 43.0, 42.0, 55.0, 46.0, 27.0, 25.0, 17.0, 18.0, 17.0, 12.0, 9.0, 6.0, 4.0, 1.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.9375, -9.6536865234375, -9.369873046875, -9.0860595703125, -8.80224609375, -8.5184326171875, -8.234619140625, -7.9508056640625, -7.6669921875, -7.3831787109375, -7.099365234375, -6.8155517578125, -6.53173828125, -6.2479248046875, -5.964111328125, -5.6802978515625, -5.396484375, -5.1126708984375, -4.828857421875, -4.5450439453125, -4.26123046875, -3.9774169921875, -3.693603515625, -3.4097900390625, -3.1259765625, -2.8421630859375, -2.558349609375, -2.2745361328125, -1.99072265625, -1.7069091796875, -1.423095703125, -1.1392822265625, -0.85546875, -0.5716552734375, -0.287841796875, -0.0040283203125, 0.27978515625, 0.5635986328125, 0.847412109375, 1.1312255859375, 1.4150390625, 1.6988525390625, 1.982666015625, 2.2664794921875, 2.55029296875, 2.8341064453125, 3.117919921875, 3.4017333984375, 3.685546875, 3.9693603515625, 4.253173828125, 4.5369873046875, 4.82080078125, 5.1046142578125, 5.388427734375, 5.6722412109375, 5.9560546875, 6.2398681640625, 6.523681640625, 6.8074951171875, 7.09130859375, 7.3751220703125, 7.658935546875, 7.9427490234375, 8.2265625]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 7.0, 7.0, 11.0, 29.0, 35.0, 49.0, 87.0, 122.0, 192.0, 310.0, 430.0, 777.0, 1122.0, 1838.0, 2986.0, 4690.0, 7620.0, 12688.0, 20654.0, 33710.0, 54329.0, 87457.0, 135485.0, 186205.0, 175098.0, 121200.0, 77078.0, 47640.0, 29460.0, 17964.0, 10995.0, 6779.0, 4316.0, 2597.0, 1659.0, 1015.0, 677.0, 445.0, 284.0, 177.0, 114.0, 78.0, 53.0, 36.0, 23.0, 10.0, 9.0, 7.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.94091796875, -0.9113922119140625, -0.881866455078125, -0.8523406982421875, -0.82281494140625, -0.7932891845703125, -0.763763427734375, -0.7342376708984375, -0.7047119140625, -0.6751861572265625, -0.645660400390625, -0.6161346435546875, -0.58660888671875, -0.5570831298828125, -0.527557373046875, -0.4980316162109375, -0.468505859375, -0.4389801025390625, -0.409454345703125, -0.3799285888671875, -0.35040283203125, -0.3208770751953125, -0.291351318359375, -0.2618255615234375, -0.2322998046875, -0.2027740478515625, -0.173248291015625, -0.1437225341796875, -0.11419677734375, -0.0846710205078125, -0.055145263671875, -0.0256195068359375, 0.00390625, 0.0334320068359375, 0.062957763671875, 0.0924835205078125, 0.12200927734375, 0.1515350341796875, 0.181060791015625, 0.2105865478515625, 0.2401123046875, 0.2696380615234375, 0.299163818359375, 0.3286895751953125, 0.35821533203125, 0.3877410888671875, 0.417266845703125, 0.4467926025390625, 0.476318359375, 0.5058441162109375, 0.535369873046875, 0.5648956298828125, 0.59442138671875, 0.6239471435546875, 0.653472900390625, 0.6829986572265625, 0.7125244140625, 0.7420501708984375, 0.771575927734375, 0.8011016845703125, 0.83062744140625, 0.8601531982421875, 0.889678955078125, 0.9192047119140625, 0.94873046875]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 6.0, 2.0, 2.0, 8.0, 3.0, 10.0, 5.0, 12.0, 6.0, 10.0, 16.0, 24.0, 13.0, 18.0, 29.0, 17.0, 25.0, 38.0, 29.0, 27.0, 32.0, 34.0, 40.0, 41.0, 34.0, 47.0, 39.0, 38.0, 41.0, 42.0, 40.0, 34.0, 33.0, 32.0, 24.0, 33.0, 16.0, 20.0, 23.0, 14.0, 8.0, 12.0, 10.0, 3.0, 5.0, 3.0, 4.0, 1.0, 5.0, 1.0, 0.0, 4.0, 1.0, 3.0], "bins": [-4.53515625, -4.406768798828125, -4.27838134765625, -4.149993896484375, -4.0216064453125, -3.893218994140625, -3.76483154296875, -3.636444091796875, -3.508056640625, -3.379669189453125, -3.25128173828125, -3.122894287109375, -2.9945068359375, -2.866119384765625, -2.73773193359375, -2.609344482421875, -2.48095703125, -2.352569580078125, -2.22418212890625, -2.095794677734375, -1.9674072265625, -1.839019775390625, -1.71063232421875, -1.582244873046875, -1.453857421875, -1.325469970703125, -1.19708251953125, -1.068695068359375, -0.9403076171875, -0.811920166015625, -0.68353271484375, -0.555145263671875, -0.4267578125, -0.298370361328125, -0.16998291015625, -0.041595458984375, 0.0867919921875, 0.215179443359375, 0.34356689453125, 0.471954345703125, 0.600341796875, 0.728729248046875, 0.85711669921875, 0.985504150390625, 1.1138916015625, 1.242279052734375, 1.37066650390625, 1.499053955078125, 1.62744140625, 1.755828857421875, 1.88421630859375, 2.012603759765625, 2.1409912109375, 2.269378662109375, 2.39776611328125, 2.526153564453125, 2.654541015625, 2.782928466796875, 2.91131591796875, 3.039703369140625, 3.1680908203125, 3.296478271484375, 3.42486572265625, 3.553253173828125, 3.681640625]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 9.0, 9.0, 16.0, 10.0, 20.0, 20.0, 40.0, 69.0, 119.0, 182.0, 292.0, 476.0, 755.0, 1204.0, 2072.0, 3713.0, 6806.0, 12666.0, 24762.0, 50442.0, 105326.0, 223151.0, 305467.0, 158830.0, 75803.0, 36367.0, 18269.0, 9562.0, 5123.0, 2825.0, 1623.0, 936.0, 576.0, 343.0, 225.0, 148.0, 96.0, 67.0, 46.0, 25.0, 24.0, 15.0, 10.0, 10.0, 6.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.090576171875, -0.08793354034423828, -0.08529090881347656, -0.08264827728271484, -0.08000564575195312, -0.0773630142211914, -0.07472038269042969, -0.07207775115966797, -0.06943511962890625, -0.06679248809814453, -0.06414985656738281, -0.061507225036621094, -0.058864593505859375, -0.056221961975097656, -0.05357933044433594, -0.05093669891357422, -0.0482940673828125, -0.04565143585205078, -0.04300880432128906, -0.040366172790527344, -0.037723541259765625, -0.035080909729003906, -0.03243827819824219, -0.02979564666748047, -0.02715301513671875, -0.02451038360595703, -0.021867752075195312, -0.019225120544433594, -0.016582489013671875, -0.013939857482910156, -0.011297225952148438, -0.008654594421386719, -0.006011962890625, -0.0033693313598632812, -0.0007266998291015625, 0.0019159317016601562, 0.004558563232421875, 0.007201194763183594, 0.009843826293945312, 0.012486457824707031, 0.01512908935546875, 0.01777172088623047, 0.020414352416992188, 0.023056983947753906, 0.025699615478515625, 0.028342247009277344, 0.030984878540039062, 0.03362751007080078, 0.0362701416015625, 0.03891277313232422, 0.04155540466308594, 0.044198036193847656, 0.046840667724609375, 0.049483299255371094, 0.05212593078613281, 0.05476856231689453, 0.05741119384765625, 0.06005382537841797, 0.06269645690917969, 0.0653390884399414, 0.06798171997070312, 0.07062435150146484, 0.07326698303222656, 0.07590961456298828, 0.07855224609375]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 1.0, 3.0, 2.0, 2.0, 3.0, 2.0, 13.0, 4.0, 9.0, 15.0, 12.0, 16.0, 15.0, 37.0, 31.0, 31.0, 35.0, 30.0, 49.0, 59.0, 44.0, 52.0, 50.0, 57.0, 60.0, 54.0, 59.0, 40.0, 46.0, 32.0, 23.0, 29.0, 16.0, 13.0, 17.0, 10.0, 9.0, 8.0, 6.0, 7.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0], "bins": [-1.3232231140136719e-05, -1.2881122529506683e-05, -1.2530013918876648e-05, -1.2178905308246613e-05, -1.1827796697616577e-05, -1.1476688086986542e-05, -1.1125579476356506e-05, -1.0774470865726471e-05, -1.0423362255096436e-05, -1.00722536444664e-05, -9.721145033836365e-06, -9.37003642320633e-06, -9.018927812576294e-06, -8.667819201946259e-06, -8.316710591316223e-06, -7.965601980686188e-06, -7.614493370056152e-06, -7.263384759426117e-06, -6.9122761487960815e-06, -6.561167538166046e-06, -6.210058927536011e-06, -5.858950316905975e-06, -5.50784170627594e-06, -5.1567330956459045e-06, -4.805624485015869e-06, -4.454515874385834e-06, -4.103407263755798e-06, -3.752298653125763e-06, -3.4011900424957275e-06, -3.050081431865692e-06, -2.6989728212356567e-06, -2.3478642106056213e-06, -1.996755599975586e-06, -1.6456469893455505e-06, -1.2945383787155151e-06, -9.434297680854797e-07, -5.923211574554443e-07, -2.4121254682540894e-07, 1.0989606380462646e-07, 4.6100467443466187e-07, 8.121132850646973e-07, 1.1632218956947327e-06, 1.514330506324768e-06, 1.8654391169548035e-06, 2.216547727584839e-06, 2.5676563382148743e-06, 2.9187649488449097e-06, 3.269873559474945e-06, 3.6209821701049805e-06, 3.972090780735016e-06, 4.323199391365051e-06, 4.674308001995087e-06, 5.025416612625122e-06, 5.3765252232551575e-06, 5.727633833885193e-06, 6.078742444515228e-06, 6.429851055145264e-06, 6.780959665775299e-06, 7.1320682764053345e-06, 7.48317688703537e-06, 7.834285497665405e-06, 8.18539410829544e-06, 8.536502718925476e-06, 8.887611329555511e-06, 9.238719940185547e-06]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 7.0, 14.0, 13.0, 16.0, 28.0, 38.0, 73.0, 86.0, 125.0, 169.0, 283.0, 412.0, 572.0, 900.0, 1420.0, 2096.0, 3324.0, 5275.0, 8296.0, 13559.0, 22950.0, 39109.0, 68307.0, 122675.0, 215299.0, 228145.0, 134161.0, 74298.0, 42506.0, 25037.0, 14726.0, 8930.0, 5446.0, 3487.0, 2258.0, 1492.0, 1069.0, 630.0, 426.0, 291.0, 199.0, 151.0, 86.0, 52.0, 41.0, 31.0, 16.0, 15.0, 5.0, 2.0, 3.0, 3.0, 7.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.07916259765625, -0.07669448852539062, -0.07422637939453125, -0.07175827026367188, -0.0692901611328125, -0.06682205200195312, -0.06435394287109375, -0.061885833740234375, -0.059417724609375, -0.056949615478515625, -0.05448150634765625, -0.052013397216796875, -0.0495452880859375, -0.047077178955078125, -0.04460906982421875, -0.042140960693359375, -0.0396728515625, -0.037204742431640625, -0.03473663330078125, -0.032268524169921875, -0.0298004150390625, -0.027332305908203125, -0.02486419677734375, -0.022396087646484375, -0.019927978515625, -0.017459869384765625, -0.01499176025390625, -0.012523651123046875, -0.0100555419921875, -0.007587432861328125, -0.00511932373046875, -0.002651214599609375, -0.00018310546875, 0.002285003662109375, 0.00475311279296875, 0.007221221923828125, 0.0096893310546875, 0.012157440185546875, 0.01462554931640625, 0.017093658447265625, 0.019561767578125, 0.022029876708984375, 0.02449798583984375, 0.026966094970703125, 0.0294342041015625, 0.031902313232421875, 0.03437042236328125, 0.036838531494140625, 0.039306640625, 0.041774749755859375, 0.04424285888671875, 0.046710968017578125, 0.0491790771484375, 0.051647186279296875, 0.05411529541015625, 0.056583404541015625, 0.059051513671875, 0.061519622802734375, 0.06398773193359375, 0.06645584106445312, 0.0689239501953125, 0.07139205932617188, 0.07386016845703125, 0.07632827758789062, 0.07879638671875]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 6.0, 3.0, 5.0, 4.0, 5.0, 8.0, 14.0, 18.0, 12.0, 14.0, 23.0, 28.0, 26.0, 39.0, 41.0, 55.0, 67.0, 63.0, 83.0, 75.0, 58.0, 56.0, 48.0, 44.0, 38.0, 26.0, 21.0, 17.0, 25.0, 10.0, 5.0, 16.0, 9.0, 8.0, 6.0, 9.0, 3.0, 2.0, 0.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.029327392578125, -0.028372764587402344, -0.027418136596679688, -0.02646350860595703, -0.025508880615234375, -0.02455425262451172, -0.023599624633789062, -0.022644996643066406, -0.02169036865234375, -0.020735740661621094, -0.019781112670898438, -0.01882648468017578, -0.017871856689453125, -0.01691722869873047, -0.015962600708007812, -0.015007972717285156, -0.0140533447265625, -0.013098716735839844, -0.012144088745117188, -0.011189460754394531, -0.010234832763671875, -0.009280204772949219, -0.008325576782226562, -0.007370948791503906, -0.00641632080078125, -0.005461692810058594, -0.0045070648193359375, -0.0035524368286132812, -0.002597808837890625, -0.0016431808471679688, -0.0006885528564453125, 0.00026607513427734375, 0.001220703125, 0.0021753311157226562, 0.0031299591064453125, 0.004084587097167969, 0.005039215087890625, 0.005993843078613281, 0.0069484710693359375, 0.007903099060058594, 0.00885772705078125, 0.009812355041503906, 0.010766983032226562, 0.011721611022949219, 0.012676239013671875, 0.013630867004394531, 0.014585494995117188, 0.015540122985839844, 0.0164947509765625, 0.017449378967285156, 0.018404006958007812, 0.01935863494873047, 0.020313262939453125, 0.02126789093017578, 0.022222518920898438, 0.023177146911621094, 0.02413177490234375, 0.025086402893066406, 0.026041030883789062, 0.02699565887451172, 0.027950286865234375, 0.02890491485595703, 0.029859542846679688, 0.030814170837402344, 0.031768798828125]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 8.0, 4.0, 8.0, 8.0, 19.0, 14.0, 27.0, 21.0, 26.0, 34.0, 57.0, 61.0, 57.0, 83.0, 79.0, 65.0, 74.0, 67.0, 57.0, 53.0, 37.0, 27.0, 22.0, 17.0, 30.0, 16.0, 9.0, 14.0, 1.0, 2.0, 1.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.052398681640625, -6.770888328552246, -6.489377498626709, -6.20786714553833, -5.926356792449951, -5.644845962524414, -5.363335609436035, -5.081825256347656, -4.800314903259277, -4.518804550170898, -4.237293720245361, -3.9557833671569824, -3.6742730140686035, -3.3927624225616455, -3.1112518310546875, -2.8297414779663086, -2.5482306480407715, -2.2667200565338135, -1.9852097034454346, -1.7036991119384766, -1.422188639640808, -1.1406781673431396, -0.8591675758361816, -0.5776571035385132, -0.2961466312408447, -0.014636129140853882, 0.26687437295913696, 0.5483849048614502, 0.8298953771591187, 1.111405849456787, 1.3929164409637451, 1.6744269132614136, 1.955937385559082, 2.23744797706604, 2.518958330154419, 2.800468921661377, 3.081979274749756, 3.363489866256714, 3.645000457763672, 3.926510810852051, 4.20802116394043, 4.489531517028809, 4.771042346954346, 5.052552700042725, 5.3340630531311035, 5.615573883056641, 5.8970842361450195, 6.178594589233398, 6.4601054191589355, 6.7416157722473145, 7.023126602172852, 7.3046369552612305, 7.586147308349609, 7.867657661437988, 8.149168014526367, 8.430679321289062, 8.712189674377441, 8.99370002746582, 9.2752103805542, 9.556720733642578, 9.838232040405273, 10.119742393493652, 10.401252746582031, 10.68276309967041, 10.964273452758789]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 9.0, 6.0, 7.0, 12.0, 13.0, 13.0, 19.0, 22.0, 25.0, 28.0, 34.0, 29.0, 48.0, 36.0, 44.0, 51.0, 56.0, 57.0, 58.0, 48.0, 47.0, 48.0, 38.0, 43.0, 30.0, 33.0, 17.0, 13.0, 35.0, 12.0, 19.0, 16.0, 9.0, 8.0, 8.0, 7.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.846552848815918, -7.607483863830566, -7.368414402008057, -7.129344940185547, -6.890275955200195, -6.651206970214844, -6.412137508392334, -6.173068046569824, -5.933999061584473, -5.694930076599121, -5.455860614776611, -5.216791152954102, -4.97772216796875, -4.738653182983398, -4.499583721160889, -4.260514259338379, -4.021445274353027, -3.7823760509490967, -3.543306827545166, -3.3042376041412354, -3.0651683807373047, -2.826099157333374, -2.5870299339294434, -2.3479607105255127, -2.108891487121582, -1.8698222637176514, -1.6307530403137207, -1.39168381690979, -1.1526145935058594, -0.9135453701019287, -0.674476146697998, -0.4354069232940674, -0.19633722305297852, 0.04273200035095215, 0.2818012237548828, 0.5208704471588135, 0.7599396705627441, 0.9990088939666748, 1.2380781173706055, 1.4771473407745361, 1.7162165641784668, 1.9552857875823975, 2.194355010986328, 2.433424234390259, 2.6724934577941895, 2.91156268119812, 3.150631904602051, 3.3897011280059814, 3.628770351409912, 3.8678395748138428, 4.106908798217773, 4.345977783203125, 4.585047245025635, 4.8241167068481445, 5.063185691833496, 5.302254676818848, 5.541324138641357, 5.780393600463867, 6.019462585449219, 6.25853157043457, 6.49760103225708, 6.73667049407959, 6.975739479064941, 7.214808464050293, 7.453877925872803]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 10.0, 8.0, 13.0, 21.0, 25.0, 34.0, 63.0, 97.0, 159.0, 231.0, 349.0, 507.0, 893.0, 1329.0, 2120.0, 3379.0, 5298.0, 8832.0, 14076.0, 22840.0, 36421.0, 56553.0, 85110.0, 116560.0, 142186.0, 147042.0, 126663.0, 96653.0, 66072.0, 42830.0, 27140.0, 17026.0, 10482.0, 6524.0, 4088.0, 2574.0, 1574.0, 1011.0, 646.0, 386.0, 243.0, 169.0, 102.0, 87.0, 50.0, 28.0, 15.0, 21.0, 9.0, 9.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.78515625, -4.6317138671875, -4.478271484375, -4.3248291015625, -4.17138671875, -4.0179443359375, -3.864501953125, -3.7110595703125, -3.5576171875, -3.4041748046875, -3.250732421875, -3.0972900390625, -2.94384765625, -2.7904052734375, -2.636962890625, -2.4835205078125, -2.330078125, -2.1766357421875, -2.023193359375, -1.8697509765625, -1.71630859375, -1.5628662109375, -1.409423828125, -1.2559814453125, -1.1025390625, -0.9490966796875, -0.795654296875, -0.6422119140625, -0.48876953125, -0.3353271484375, -0.181884765625, -0.0284423828125, 0.125, 0.2784423828125, 0.431884765625, 0.5853271484375, 0.73876953125, 0.8922119140625, 1.045654296875, 1.1990966796875, 1.3525390625, 1.5059814453125, 1.659423828125, 1.8128662109375, 1.96630859375, 2.1197509765625, 2.273193359375, 2.4266357421875, 2.580078125, 2.7335205078125, 2.886962890625, 3.0404052734375, 3.19384765625, 3.3472900390625, 3.500732421875, 3.6541748046875, 3.8076171875, 3.9610595703125, 4.114501953125, 4.2679443359375, 4.42138671875, 4.5748291015625, 4.728271484375, 4.8817138671875, 5.03515625]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 7.0, 5.0, 9.0, 13.0, 7.0, 18.0, 22.0, 24.0, 28.0, 30.0, 34.0, 45.0, 32.0, 47.0, 44.0, 53.0, 68.0, 38.0, 54.0, 50.0, 57.0, 50.0, 44.0, 37.0, 31.0, 28.0, 18.0, 22.0, 22.0, 16.0, 17.0, 14.0, 9.0, 3.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.66015625, -7.40936279296875, -7.1585693359375, -6.90777587890625, -6.656982421875, -6.40618896484375, -6.1553955078125, -5.90460205078125, -5.65380859375, -5.40301513671875, -5.1522216796875, -4.90142822265625, -4.650634765625, -4.39984130859375, -4.1490478515625, -3.89825439453125, -3.6474609375, -3.39666748046875, -3.1458740234375, -2.89508056640625, -2.644287109375, -2.39349365234375, -2.1427001953125, -1.89190673828125, -1.64111328125, -1.39031982421875, -1.1395263671875, -0.88873291015625, -0.637939453125, -0.38714599609375, -0.1363525390625, 0.11444091796875, 0.365234375, 0.61602783203125, 0.8668212890625, 1.11761474609375, 1.368408203125, 1.61920166015625, 1.8699951171875, 2.12078857421875, 2.37158203125, 2.62237548828125, 2.8731689453125, 3.12396240234375, 3.374755859375, 3.62554931640625, 3.8763427734375, 4.12713623046875, 4.3779296875, 4.62872314453125, 4.8795166015625, 5.13031005859375, 5.381103515625, 5.63189697265625, 5.8826904296875, 6.13348388671875, 6.38427734375, 6.63507080078125, 6.8858642578125, 7.13665771484375, 7.387451171875, 7.63824462890625, 7.8890380859375, 8.13983154296875, 8.390625]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 11.0, 9.0, 24.0, 45.0, 51.0, 99.0, 134.0, 214.0, 319.0, 498.0, 750.0, 1272.0, 1851.0, 2797.0, 4544.0, 6876.0, 10986.0, 17189.0, 27045.0, 42625.0, 63589.0, 90475.0, 118420.0, 136934.0, 135952.0, 117319.0, 90167.0, 62595.0, 41523.0, 27022.0, 17184.0, 10860.0, 6952.0, 4384.0, 2730.0, 1834.0, 1100.0, 727.0, 526.0, 319.0, 227.0, 126.0, 89.0, 58.0, 30.0, 39.0, 20.0, 8.0, 8.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.84765625, -4.70068359375, -4.5537109375, -4.40673828125, -4.259765625, -4.11279296875, -3.9658203125, -3.81884765625, -3.671875, -3.52490234375, -3.3779296875, -3.23095703125, -3.083984375, -2.93701171875, -2.7900390625, -2.64306640625, -2.49609375, -2.34912109375, -2.2021484375, -2.05517578125, -1.908203125, -1.76123046875, -1.6142578125, -1.46728515625, -1.3203125, -1.17333984375, -1.0263671875, -0.87939453125, -0.732421875, -0.58544921875, -0.4384765625, -0.29150390625, -0.14453125, 0.00244140625, 0.1494140625, 0.29638671875, 0.443359375, 0.59033203125, 0.7373046875, 0.88427734375, 1.03125, 1.17822265625, 1.3251953125, 1.47216796875, 1.619140625, 1.76611328125, 1.9130859375, 2.06005859375, 2.20703125, 2.35400390625, 2.5009765625, 2.64794921875, 2.794921875, 2.94189453125, 3.0888671875, 3.23583984375, 3.3828125, 3.52978515625, 3.6767578125, 3.82373046875, 3.970703125, 4.11767578125, 4.2646484375, 4.41162109375, 4.55859375]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 5.0, 6.0, 6.0, 8.0, 11.0, 11.0, 6.0, 15.0, 12.0, 24.0, 18.0, 17.0, 23.0, 28.0, 25.0, 39.0, 34.0, 35.0, 40.0, 33.0, 34.0, 33.0, 30.0, 39.0, 23.0, 41.0, 40.0, 30.0, 39.0, 32.0, 29.0, 40.0, 23.0, 22.0, 25.0, 14.0, 17.0, 13.0, 11.0, 11.0, 9.0, 12.0, 4.0, 8.0, 11.0, 3.0, 2.0, 5.0, 3.0, 2.0, 0.0, 4.0, 1.0, 1.0, 2.0], "bins": [-3.681640625, -3.564971923828125, -3.44830322265625, -3.331634521484375, -3.2149658203125, -3.098297119140625, -2.98162841796875, -2.864959716796875, -2.748291015625, -2.631622314453125, -2.51495361328125, -2.398284912109375, -2.2816162109375, -2.164947509765625, -2.04827880859375, -1.931610107421875, -1.81494140625, -1.698272705078125, -1.58160400390625, -1.464935302734375, -1.3482666015625, -1.231597900390625, -1.11492919921875, -0.998260498046875, -0.881591796875, -0.764923095703125, -0.64825439453125, -0.531585693359375, -0.4149169921875, -0.298248291015625, -0.18157958984375, -0.064910888671875, 0.0517578125, 0.168426513671875, 0.28509521484375, 0.401763916015625, 0.5184326171875, 0.635101318359375, 0.75177001953125, 0.868438720703125, 0.985107421875, 1.101776123046875, 1.21844482421875, 1.335113525390625, 1.4517822265625, 1.568450927734375, 1.68511962890625, 1.801788330078125, 1.91845703125, 2.035125732421875, 2.15179443359375, 2.268463134765625, 2.3851318359375, 2.501800537109375, 2.61846923828125, 2.735137939453125, 2.851806640625, 2.968475341796875, 3.08514404296875, 3.201812744140625, 3.3184814453125, 3.435150146484375, 3.55181884765625, 3.668487548828125, 3.78515625]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 3.0, 4.0, 5.0, 5.0, 6.0, 22.0, 22.0, 22.0, 36.0, 33.0, 52.0, 80.0, 129.0, 143.0, 230.0, 326.0, 423.0, 692.0, 1064.0, 1622.0, 2446.0, 4030.0, 6916.0, 11602.0, 20352.0, 35915.0, 63935.0, 110241.0, 169078.0, 198720.0, 166297.0, 107563.0, 62487.0, 35244.0, 19845.0, 11201.0, 6576.0, 4002.0, 2430.0, 1551.0, 966.0, 669.0, 427.0, 341.0, 222.0, 159.0, 116.0, 80.0, 71.0, 60.0, 28.0, 17.0, 27.0, 13.0, 9.0, 7.0, 5.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-2.421875, -2.3424072265625, -2.262939453125, -2.1834716796875, -2.10400390625, -2.0245361328125, -1.945068359375, -1.8656005859375, -1.7861328125, -1.7066650390625, -1.627197265625, -1.5477294921875, -1.46826171875, -1.3887939453125, -1.309326171875, -1.2298583984375, -1.150390625, -1.0709228515625, -0.991455078125, -0.9119873046875, -0.83251953125, -0.7530517578125, -0.673583984375, -0.5941162109375, -0.5146484375, -0.4351806640625, -0.355712890625, -0.2762451171875, -0.19677734375, -0.1173095703125, -0.037841796875, 0.0416259765625, 0.12109375, 0.2005615234375, 0.280029296875, 0.3594970703125, 0.43896484375, 0.5184326171875, 0.597900390625, 0.6773681640625, 0.7568359375, 0.8363037109375, 0.915771484375, 0.9952392578125, 1.07470703125, 1.1541748046875, 1.233642578125, 1.3131103515625, 1.392578125, 1.4720458984375, 1.551513671875, 1.6309814453125, 1.71044921875, 1.7899169921875, 1.869384765625, 1.9488525390625, 2.0283203125, 2.1077880859375, 2.187255859375, 2.2667236328125, 2.34619140625, 2.4256591796875, 2.505126953125, 2.5845947265625, 2.6640625]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 7.0, 10.0, 11.0, 26.0, 36.0, 54.0, 82.0, 84.0, 126.0, 103.0, 113.0, 75.0, 72.0, 62.0, 50.0, 30.0, 12.0, 18.0, 10.0, 6.0, 1.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000278472900390625, -0.00026716291904449463, -0.00025585293769836426, -0.0002445429563522339, -0.00023323297500610352, -0.00022192299365997314, -0.00021061301231384277, -0.0001993030309677124, -0.00018799304962158203, -0.00017668306827545166, -0.0001653730869293213, -0.00015406310558319092, -0.00014275312423706055, -0.00013144314289093018, -0.0001201331615447998, -0.00010882318019866943, -9.751319885253906e-05, -8.620321750640869e-05, -7.489323616027832e-05, -6.358325481414795e-05, -5.227327346801758e-05, -4.096329212188721e-05, -2.9653310775756836e-05, -1.8343329429626465e-05, -7.033348083496094e-06, 4.276633262634277e-06, 1.558661460876465e-05, 2.689659595489502e-05, 3.820657730102539e-05, 4.951655864715576e-05, 6.082653999328613e-05, 7.21365213394165e-05, 8.344650268554688e-05, 9.475648403167725e-05, 0.00010606646537780762, 0.00011737644672393799, 0.00012868642807006836, 0.00013999640941619873, 0.0001513063907623291, 0.00016261637210845947, 0.00017392635345458984, 0.00018523633480072021, 0.00019654631614685059, 0.00020785629749298096, 0.00021916627883911133, 0.0002304762601852417, 0.00024178624153137207, 0.00025309622287750244, 0.0002644062042236328, 0.0002757161855697632, 0.00028702616691589355, 0.0002983361482620239, 0.0003096461296081543, 0.00032095611095428467, 0.00033226609230041504, 0.0003435760736465454, 0.0003548860549926758, 0.00036619603633880615, 0.0003775060176849365, 0.0003888159990310669, 0.00040012598037719727, 0.00041143596172332764, 0.000422745943069458, 0.0004340559244155884, 0.00044536590576171875]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 10.0, 7.0, 6.0, 15.0, 16.0, 25.0, 52.0, 70.0, 97.0, 171.0, 235.0, 356.0, 585.0, 898.0, 1381.0, 2348.0, 3672.0, 6128.0, 10766.0, 18253.0, 31828.0, 55308.0, 93427.0, 142113.0, 182407.0, 174289.0, 128194.0, 81376.0, 47931.0, 27482.0, 15873.0, 9184.0, 5382.0, 3205.0, 2022.0, 1236.0, 789.0, 494.0, 336.0, 204.0, 135.0, 97.0, 62.0, 32.0, 24.0, 16.0, 9.0, 7.0, 4.0, 5.0, 1.0, 5.0, 2.0, 1.0], "bins": [-2.615234375, -2.54022216796875, -2.4652099609375, -2.39019775390625, -2.315185546875, -2.24017333984375, -2.1651611328125, -2.09014892578125, -2.01513671875, -1.94012451171875, -1.8651123046875, -1.79010009765625, -1.715087890625, -1.64007568359375, -1.5650634765625, -1.49005126953125, -1.4150390625, -1.34002685546875, -1.2650146484375, -1.19000244140625, -1.114990234375, -1.03997802734375, -0.9649658203125, -0.88995361328125, -0.81494140625, -0.73992919921875, -0.6649169921875, -0.58990478515625, -0.514892578125, -0.43988037109375, -0.3648681640625, -0.28985595703125, -0.21484375, -0.13983154296875, -0.0648193359375, 0.01019287109375, 0.085205078125, 0.16021728515625, 0.2352294921875, 0.31024169921875, 0.38525390625, 0.46026611328125, 0.5352783203125, 0.61029052734375, 0.685302734375, 0.76031494140625, 0.8353271484375, 0.91033935546875, 0.9853515625, 1.06036376953125, 1.1353759765625, 1.21038818359375, 1.285400390625, 1.36041259765625, 1.4354248046875, 1.51043701171875, 1.58544921875, 1.66046142578125, 1.7354736328125, 1.81048583984375, 1.885498046875, 1.96051025390625, 2.0355224609375, 2.11053466796875, 2.185546875]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 8.0, 1.0, 2.0, 5.0, 2.0, 4.0, 3.0, 10.0, 13.0, 16.0, 13.0, 23.0, 18.0, 21.0, 36.0, 28.0, 31.0, 40.0, 55.0, 49.0, 51.0, 65.0, 69.0, 46.0, 54.0, 54.0, 30.0, 52.0, 42.0, 28.0, 18.0, 20.0, 11.0, 16.0, 19.0, 11.0, 9.0, 3.0, 11.0, 3.0, 1.0, 1.0, 4.0, 4.0, 3.0, 1.0, 5.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.9267578125, -0.90045166015625, -0.8741455078125, -0.84783935546875, -0.821533203125, -0.79522705078125, -0.7689208984375, -0.74261474609375, -0.71630859375, -0.69000244140625, -0.6636962890625, -0.63739013671875, -0.611083984375, -0.58477783203125, -0.5584716796875, -0.53216552734375, -0.505859375, -0.47955322265625, -0.4532470703125, -0.42694091796875, -0.400634765625, -0.37432861328125, -0.3480224609375, -0.32171630859375, -0.29541015625, -0.26910400390625, -0.2427978515625, -0.21649169921875, -0.190185546875, -0.16387939453125, -0.1375732421875, -0.11126708984375, -0.0849609375, -0.05865478515625, -0.0323486328125, -0.00604248046875, 0.020263671875, 0.04656982421875, 0.0728759765625, 0.09918212890625, 0.12548828125, 0.15179443359375, 0.1781005859375, 0.20440673828125, 0.230712890625, 0.25701904296875, 0.2833251953125, 0.30963134765625, 0.3359375, 0.36224365234375, 0.3885498046875, 0.41485595703125, 0.441162109375, 0.46746826171875, 0.4937744140625, 0.52008056640625, 0.54638671875, 0.57269287109375, 0.5989990234375, 0.62530517578125, 0.651611328125, 0.67791748046875, 0.7042236328125, 0.73052978515625, 0.7568359375]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 5.0, 5.0, 8.0, 9.0, 13.0, 10.0, 22.0, 21.0, 29.0, 37.0, 45.0, 44.0, 62.0, 81.0, 82.0, 72.0, 65.0, 61.0, 64.0, 41.0, 46.0, 38.0, 26.0, 31.0, 26.0, 12.0, 12.0, 10.0, 6.0, 6.0, 8.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.215301513671875, -7.9357099533081055, -7.656118869781494, -7.376527786254883, -7.096936225891113, -6.817344665527344, -6.537753582000732, -6.258162498474121, -5.978570938110352, -5.698979377746582, -5.419388294219971, -5.139797210693359, -4.86020565032959, -4.58061408996582, -4.301023006439209, -4.021431922912598, -3.741840362548828, -3.4622490406036377, -3.1826577186584473, -2.903066396713257, -2.6234750747680664, -2.343883752822876, -2.0642924308776855, -1.7847011089324951, -1.5051097869873047, -1.2255184650421143, -0.9459271430969238, -0.6663358211517334, -0.38674449920654297, -0.10715317726135254, 0.1724381446838379, 0.4520294666290283, 0.7316207885742188, 1.0112121105194092, 1.2908034324645996, 1.57039475440979, 1.8499860763549805, 2.129577398300171, 2.4091687202453613, 2.6887600421905518, 2.968351364135742, 3.2479426860809326, 3.527534008026123, 3.8071253299713135, 4.086716651916504, 4.366308212280273, 4.645899295806885, 4.925490379333496, 5.205081939697266, 5.484673500061035, 5.7642645835876465, 6.043855667114258, 6.323447227478027, 6.603038787841797, 6.882629871368408, 7.1622209548950195, 7.441812515258789, 7.721404075622559, 8.000995635986328, 8.280586242675781, 8.56017780303955, 8.83976936340332, 9.119359970092773, 9.398951530456543, 9.678543090820312]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 5.0, 6.0, 6.0, 9.0, 10.0, 10.0, 16.0, 26.0, 23.0, 24.0, 31.0, 28.0, 35.0, 38.0, 36.0, 39.0, 42.0, 46.0, 55.0, 44.0, 52.0, 53.0, 45.0, 37.0, 41.0, 38.0, 21.0, 34.0, 18.0, 22.0, 25.0, 18.0, 12.0, 20.0, 7.0, 7.0, 5.0, 8.0, 5.0, 4.0, 3.0, 1.0, 0.0, 6.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.536931037902832, -7.297118663787842, -7.057306289672852, -6.817493438720703, -6.577681064605713, -6.337868690490723, -6.098056316375732, -5.858243942260742, -5.618431091308594, -5.3786187171936035, -5.138806343078613, -4.898993492126465, -4.659181118011475, -4.419368743896484, -4.179556369781494, -3.939743995666504, -3.6999316215515137, -3.4601192474365234, -3.220306634902954, -2.980494260787964, -2.7406816482543945, -2.5008692741394043, -2.261056900024414, -2.021244525909424, -1.7814319133758545, -1.5416194200515747, -1.301806926727295, -1.0619945526123047, -0.8221820592880249, -0.5823695659637451, -0.3425571918487549, -0.1027446985244751, 0.13706731796264648, 0.3768797814846039, 0.6166922450065613, 0.8565046787261963, 1.096317172050476, 1.3361296653747559, 1.575942039489746, 1.8157545328140259, 2.0555670261383057, 2.295379400253296, 2.5351920127868652, 2.7750043869018555, 3.0148167610168457, 3.254629373550415, 3.4944417476654053, 3.7342543601989746, 3.974066734313965, 4.213879108428955, 4.453691482543945, 4.693504333496094, 4.933316707611084, 5.173129081726074, 5.4129414558410645, 5.652753829956055, 5.892566680908203, 6.132379055023193, 6.372191429138184, 6.612004280090332, 6.851816654205322, 7.0916290283203125, 7.331441402435303, 7.571253776550293, 7.811066150665283]}, "gradients/decoder.bert.encoder.layer.5.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 3.0, 2.0, 8.0, 11.0, 12.0, 11.0, 35.0, 45.0, 62.0, 123.0, 158.0, 263.0, 386.0, 656.0, 1071.0, 1779.0, 3080.0, 5335.0, 9618.0, 17293.0, 32455.0, 62818.0, 122755.0, 237668.0, 444192.0, 720823.0, 872438.0, 716887.0, 442106.0, 239103.0, 123494.0, 63450.0, 33778.0, 18354.0, 10165.0, 5770.0, 3219.0, 1958.0, 1151.0, 674.0, 411.0, 266.0, 149.0, 96.0, 55.0, 35.0, 23.0, 21.0, 9.0, 13.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-7.80078125, -7.57476806640625, -7.3487548828125, -7.12274169921875, -6.896728515625, -6.67071533203125, -6.4447021484375, -6.21868896484375, -5.99267578125, -5.76666259765625, -5.5406494140625, -5.31463623046875, -5.088623046875, -4.86260986328125, -4.6365966796875, -4.41058349609375, -4.1845703125, -3.95855712890625, -3.7325439453125, -3.50653076171875, -3.280517578125, -3.05450439453125, -2.8284912109375, -2.60247802734375, -2.37646484375, -2.15045166015625, -1.9244384765625, -1.69842529296875, -1.472412109375, -1.24639892578125, -1.0203857421875, -0.79437255859375, -0.568359375, -0.34234619140625, -0.1163330078125, 0.10968017578125, 0.335693359375, 0.56170654296875, 0.7877197265625, 1.01373291015625, 1.23974609375, 1.46575927734375, 1.6917724609375, 1.91778564453125, 2.143798828125, 2.36981201171875, 2.5958251953125, 2.82183837890625, 3.0478515625, 3.27386474609375, 3.4998779296875, 3.72589111328125, 3.951904296875, 4.17791748046875, 4.4039306640625, 4.62994384765625, 4.85595703125, 5.08197021484375, 5.3079833984375, 5.53399658203125, 5.760009765625, 5.98602294921875, 6.2120361328125, 6.43804931640625, 6.6640625]}, "gradients/decoder.bert.encoder.layer.5.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 5.0, 5.0, 5.0, 11.0, 9.0, 14.0, 12.0, 21.0, 21.0, 31.0, 34.0, 27.0, 35.0, 25.0, 48.0, 37.0, 46.0, 48.0, 44.0, 47.0, 57.0, 41.0, 38.0, 42.0, 42.0, 34.0, 33.0, 25.0, 23.0, 33.0, 17.0, 16.0, 18.0, 11.0, 4.0, 9.0, 9.0, 5.0, 4.0, 7.0, 2.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.56640625, -5.39532470703125, -5.2242431640625, -5.05316162109375, -4.882080078125, -4.71099853515625, -4.5399169921875, -4.36883544921875, -4.19775390625, -4.02667236328125, -3.8555908203125, -3.68450927734375, -3.513427734375, -3.34234619140625, -3.1712646484375, -3.00018310546875, -2.8291015625, -2.65802001953125, -2.4869384765625, -2.31585693359375, -2.144775390625, -1.97369384765625, -1.8026123046875, -1.63153076171875, -1.46044921875, -1.28936767578125, -1.1182861328125, -0.94720458984375, -0.776123046875, -0.60504150390625, -0.4339599609375, -0.26287841796875, -0.091796875, 0.07928466796875, 0.2503662109375, 0.42144775390625, 0.592529296875, 0.76361083984375, 0.9346923828125, 1.10577392578125, 1.27685546875, 1.44793701171875, 1.6190185546875, 1.79010009765625, 1.961181640625, 2.13226318359375, 2.3033447265625, 2.47442626953125, 2.6455078125, 2.81658935546875, 2.9876708984375, 3.15875244140625, 3.329833984375, 3.50091552734375, 3.6719970703125, 3.84307861328125, 4.01416015625, 4.18524169921875, 4.3563232421875, 4.52740478515625, 4.698486328125, 4.86956787109375, 5.0406494140625, 5.21173095703125, 5.3828125]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 5.0, 6.0, 16.0, 29.0, 62.0, 66.0, 117.0, 188.0, 309.0, 492.0, 776.0, 1222.0, 2165.0, 3870.0, 6782.0, 11568.0, 21040.0, 38242.0, 68379.0, 120625.0, 209825.0, 344439.0, 515862.0, 658377.0, 677811.0, 560879.0, 388004.0, 240279.0, 140999.0, 79837.0, 44583.0, 24779.0, 13869.0, 7873.0, 4455.0, 2628.0, 1538.0, 883.0, 545.0, 317.0, 212.0, 116.0, 87.0, 43.0, 43.0, 19.0, 16.0, 6.0, 3.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-6.671875, -6.47052001953125, -6.2691650390625, -6.06781005859375, -5.866455078125, -5.66510009765625, -5.4637451171875, -5.26239013671875, -5.06103515625, -4.85968017578125, -4.6583251953125, -4.45697021484375, -4.255615234375, -4.05426025390625, -3.8529052734375, -3.65155029296875, -3.4501953125, -3.24884033203125, -3.0474853515625, -2.84613037109375, -2.644775390625, -2.44342041015625, -2.2420654296875, -2.04071044921875, -1.83935546875, -1.63800048828125, -1.4366455078125, -1.23529052734375, -1.033935546875, -0.83258056640625, -0.6312255859375, -0.42987060546875, -0.228515625, -0.02716064453125, 0.1741943359375, 0.37554931640625, 0.576904296875, 0.77825927734375, 0.9796142578125, 1.18096923828125, 1.38232421875, 1.58367919921875, 1.7850341796875, 1.98638916015625, 2.187744140625, 2.38909912109375, 2.5904541015625, 2.79180908203125, 2.9931640625, 3.19451904296875, 3.3958740234375, 3.59722900390625, 3.798583984375, 3.99993896484375, 4.2012939453125, 4.40264892578125, 4.60400390625, 4.80535888671875, 5.0067138671875, 5.20806884765625, 5.409423828125, 5.61077880859375, 5.8121337890625, 6.01348876953125, 6.21484375]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 3.0, 4.0, 11.0, 13.0, 12.0, 16.0, 34.0, 40.0, 57.0, 60.0, 78.0, 109.0, 130.0, 156.0, 184.0, 216.0, 203.0, 250.0, 227.0, 236.0, 226.0, 281.0, 240.0, 218.0, 201.0, 157.0, 137.0, 105.0, 91.0, 72.0, 70.0, 51.0, 45.0, 33.0, 21.0, 11.0, 22.0, 10.0, 8.0, 12.0, 8.0, 5.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.431640625, -2.34222412109375, -2.2528076171875, -2.16339111328125, -2.073974609375, -1.98455810546875, -1.8951416015625, -1.80572509765625, -1.71630859375, -1.62689208984375, -1.5374755859375, -1.44805908203125, -1.358642578125, -1.26922607421875, -1.1798095703125, -1.09039306640625, -1.0009765625, -0.91156005859375, -0.8221435546875, -0.73272705078125, -0.643310546875, -0.55389404296875, -0.4644775390625, -0.37506103515625, -0.28564453125, -0.19622802734375, -0.1068115234375, -0.01739501953125, 0.072021484375, 0.16143798828125, 0.2508544921875, 0.34027099609375, 0.4296875, 0.51910400390625, 0.6085205078125, 0.69793701171875, 0.787353515625, 0.87677001953125, 0.9661865234375, 1.05560302734375, 1.14501953125, 1.23443603515625, 1.3238525390625, 1.41326904296875, 1.502685546875, 1.59210205078125, 1.6815185546875, 1.77093505859375, 1.8603515625, 1.94976806640625, 2.0391845703125, 2.12860107421875, 2.218017578125, 2.30743408203125, 2.3968505859375, 2.48626708984375, 2.57568359375, 2.66510009765625, 2.7545166015625, 2.84393310546875, 2.933349609375, 3.02276611328125, 3.1121826171875, 3.20159912109375, 3.291015625]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 8.0, 3.0, 13.0, 10.0, 15.0, 14.0, 16.0, 27.0, 36.0, 39.0, 50.0, 48.0, 52.0, 56.0, 64.0, 74.0, 64.0, 55.0, 66.0, 59.0, 55.0, 26.0, 24.0, 33.0, 17.0, 15.0, 6.0, 14.0, 6.0, 5.0, 5.0, 7.0, 4.0, 5.0, 3.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-9.295978546142578, -9.025918006896973, -8.755857467651367, -8.485796928405762, -8.215736389160156, -7.945675849914551, -7.675614833831787, -7.405554294586182, -7.135493755340576, -6.865433216094971, -6.595372676849365, -6.32531213760376, -6.055251121520996, -5.785190582275391, -5.515130043029785, -5.24506950378418, -4.975008964538574, -4.704948425292969, -4.434887886047363, -4.164827346801758, -3.8947665691375732, -3.6247060298919678, -3.354645252227783, -3.0845847129821777, -2.8145241737365723, -2.544463634490967, -2.2744030952453613, -2.0043423175811768, -1.7342817783355713, -1.4642212390899658, -1.1941605806350708, -0.9240999221801758, -0.6540389060974121, -0.38397830724716187, -0.11391770839691162, 0.15614289045333862, 0.42620348930358887, 0.6962640285491943, 0.9663246870040894, 1.2363853454589844, 1.5064458847045898, 1.7765064239501953, 2.046566963195801, 2.3166277408599854, 2.586688280105591, 2.8567488193511963, 3.126809597015381, 3.3968701362609863, 3.666930675506592, 3.9369912147521973, 4.207051753997803, 4.477112293243408, 4.747173309326172, 5.017233848571777, 5.287294387817383, 5.557354927062988, 5.827415466308594, 6.097476005554199, 6.367536544799805, 6.63759708404541, 6.907657623291016, 7.177718162536621, 7.447779178619385, 7.71783971786499, 7.987900257110596]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 3.0, 5.0, 5.0, 3.0, 6.0, 7.0, 12.0, 14.0, 17.0, 13.0, 19.0, 27.0, 25.0, 36.0, 26.0, 46.0, 38.0, 28.0, 48.0, 51.0, 50.0, 42.0, 39.0, 46.0, 37.0, 35.0, 39.0, 39.0, 32.0, 27.0, 33.0, 24.0, 22.0, 18.0, 21.0, 10.0, 12.0, 12.0, 10.0, 3.0, 13.0, 1.0, 2.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-7.442991256713867, -7.217339038848877, -6.991686820983887, -6.7660346031188965, -6.540382385253906, -6.314730644226074, -6.089078426361084, -5.863426208496094, -5.6377739906311035, -5.412121772766113, -5.186469554901123, -4.960817337036133, -4.735165596008301, -4.509512901306152, -4.28386116027832, -4.05820894241333, -3.83255672454834, -3.6069045066833496, -3.3812522888183594, -3.1556003093719482, -2.929948091506958, -2.7042958736419678, -2.4786438941955566, -2.2529916763305664, -2.027339458465576, -1.801687240600586, -1.5760351419448853, -1.3503830432891846, -1.1247308254241943, -0.8990786075592041, -0.6734265089035034, -0.44777441024780273, -0.2221221923828125, 0.003529965877532959, 0.22918212413787842, 0.4548342823982239, 0.6804864406585693, 0.9061386585235596, 1.1317907571792603, 1.357442855834961, 1.5830950736999512, 1.8087472915649414, 2.0343995094299316, 2.2600514888763428, 2.485703706741333, 2.7113559246063232, 2.9370079040527344, 3.1626601219177246, 3.388312339782715, 3.613964557647705, 3.8396167755126953, 4.0652689933776855, 4.290921211242676, 4.516572952270508, 4.742225170135498, 4.967877388000488, 5.1935296058654785, 5.419181823730469, 5.644834041595459, 5.870486259460449, 6.096138000488281, 6.32179069519043, 6.547442436218262, 6.773094654083252, 6.998746871948242]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 7.0, 10.0, 15.0, 23.0, 24.0, 53.0, 75.0, 114.0, 189.0, 273.0, 411.0, 592.0, 969.0, 1465.0, 2203.0, 3627.0, 5602.0, 8810.0, 14306.0, 23406.0, 37534.0, 60523.0, 96180.0, 144185.0, 186935.0, 160842.0, 111482.0, 71536.0, 44230.0, 27218.0, 16786.0, 10551.0, 6523.0, 4202.0, 2723.0, 1731.0, 1098.0, 716.0, 450.0, 322.0, 202.0, 146.0, 105.0, 53.0, 36.0, 24.0, 19.0, 10.0, 8.0, 6.0, 1.0, 1.0, 4.0, 3.0, 2.0], "bins": [-0.99462890625, -0.965087890625, -0.935546875, -0.906005859375, -0.87646484375, -0.846923828125, -0.8173828125, -0.787841796875, -0.75830078125, -0.728759765625, -0.69921875, -0.669677734375, -0.64013671875, -0.610595703125, -0.5810546875, -0.551513671875, -0.52197265625, -0.492431640625, -0.462890625, -0.433349609375, -0.40380859375, -0.374267578125, -0.3447265625, -0.315185546875, -0.28564453125, -0.256103515625, -0.2265625, -0.197021484375, -0.16748046875, -0.137939453125, -0.1083984375, -0.078857421875, -0.04931640625, -0.019775390625, 0.009765625, 0.039306640625, 0.06884765625, 0.098388671875, 0.1279296875, 0.157470703125, 0.18701171875, 0.216552734375, 0.24609375, 0.275634765625, 0.30517578125, 0.334716796875, 0.3642578125, 0.393798828125, 0.42333984375, 0.452880859375, 0.482421875, 0.511962890625, 0.54150390625, 0.571044921875, 0.6005859375, 0.630126953125, 0.65966796875, 0.689208984375, 0.71875, 0.748291015625, 0.77783203125, 0.807373046875, 0.8369140625, 0.866455078125, 0.89599609375]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 7.0, 3.0, 12.0, 14.0, 8.0, 18.0, 12.0, 13.0, 29.0, 32.0, 32.0, 43.0, 33.0, 39.0, 43.0, 32.0, 56.0, 63.0, 47.0, 51.0, 50.0, 36.0, 45.0, 34.0, 43.0, 31.0, 21.0, 27.0, 24.0, 21.0, 19.0, 16.0, 8.0, 9.0, 9.0, 5.0, 5.0, 1.0, 6.0, 2.0, 3.0, 4.0, 0.0, 2.0, 0.0, 2.0], "bins": [-9.46875, -9.20855712890625, -8.9483642578125, -8.68817138671875, -8.427978515625, -8.16778564453125, -7.9075927734375, -7.64739990234375, -7.38720703125, -7.12701416015625, -6.8668212890625, -6.60662841796875, -6.346435546875, -6.08624267578125, -5.8260498046875, -5.56585693359375, -5.3056640625, -5.04547119140625, -4.7852783203125, -4.52508544921875, -4.264892578125, -4.00469970703125, -3.7445068359375, -3.48431396484375, -3.22412109375, -2.96392822265625, -2.7037353515625, -2.44354248046875, -2.183349609375, -1.92315673828125, -1.6629638671875, -1.40277099609375, -1.142578125, -0.88238525390625, -0.6221923828125, -0.36199951171875, -0.101806640625, 0.15838623046875, 0.4185791015625, 0.67877197265625, 0.93896484375, 1.19915771484375, 1.4593505859375, 1.71954345703125, 1.979736328125, 2.23992919921875, 2.5001220703125, 2.76031494140625, 3.0205078125, 3.28070068359375, 3.5408935546875, 3.80108642578125, 4.061279296875, 4.32147216796875, 4.5816650390625, 4.84185791015625, 5.10205078125, 5.36224365234375, 5.6224365234375, 5.88262939453125, 6.142822265625, 6.40301513671875, 6.6632080078125, 6.92340087890625, 7.18359375]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 3.0, 5.0, 8.0, 12.0, 15.0, 19.0, 38.0, 45.0, 81.0, 93.0, 162.0, 227.0, 334.0, 527.0, 799.0, 1156.0, 1643.0, 2655.0, 3926.0, 5734.0, 8725.0, 13226.0, 20236.0, 30585.0, 46003.0, 69265.0, 101020.0, 140802.0, 164279.0, 138285.0, 98920.0, 67612.0, 45302.0, 29568.0, 19306.0, 12700.0, 8276.0, 5575.0, 3782.0, 2523.0, 1648.0, 1119.0, 767.0, 509.0, 344.0, 219.0, 152.0, 112.0, 74.0, 36.0, 31.0, 33.0, 20.0, 11.0, 9.0, 1.0, 4.0, 4.0, 1.0, 1.0, 1.0], "bins": [-0.8720703125, -0.8443603515625, -0.816650390625, -0.7889404296875, -0.76123046875, -0.7335205078125, -0.705810546875, -0.6781005859375, -0.650390625, -0.6226806640625, -0.594970703125, -0.5672607421875, -0.53955078125, -0.5118408203125, -0.484130859375, -0.4564208984375, -0.4287109375, -0.4010009765625, -0.373291015625, -0.3455810546875, -0.31787109375, -0.2901611328125, -0.262451171875, -0.2347412109375, -0.20703125, -0.1793212890625, -0.151611328125, -0.1239013671875, -0.09619140625, -0.0684814453125, -0.040771484375, -0.0130615234375, 0.0146484375, 0.0423583984375, 0.070068359375, 0.0977783203125, 0.12548828125, 0.1531982421875, 0.180908203125, 0.2086181640625, 0.236328125, 0.2640380859375, 0.291748046875, 0.3194580078125, 0.34716796875, 0.3748779296875, 0.402587890625, 0.4302978515625, 0.4580078125, 0.4857177734375, 0.513427734375, 0.5411376953125, 0.56884765625, 0.5965576171875, 0.624267578125, 0.6519775390625, 0.6796875, 0.7073974609375, 0.735107421875, 0.7628173828125, 0.79052734375, 0.8182373046875, 0.845947265625, 0.8736572265625, 0.9013671875]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 0.0, 6.0, 4.0, 4.0, 6.0, 9.0, 12.0, 8.0, 13.0, 8.0, 16.0, 11.0, 20.0, 19.0, 29.0, 29.0, 36.0, 30.0, 33.0, 30.0, 42.0, 43.0, 41.0, 47.0, 42.0, 39.0, 46.0, 33.0, 36.0, 34.0, 35.0, 31.0, 35.0, 28.0, 24.0, 18.0, 18.0, 21.0, 14.0, 10.0, 13.0, 12.0, 5.0, 7.0, 1.0, 2.0, 2.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-4.3671875, -4.2266845703125, -4.086181640625, -3.9456787109375, -3.80517578125, -3.6646728515625, -3.524169921875, -3.3836669921875, -3.2431640625, -3.1026611328125, -2.962158203125, -2.8216552734375, -2.68115234375, -2.5406494140625, -2.400146484375, -2.2596435546875, -2.119140625, -1.9786376953125, -1.838134765625, -1.6976318359375, -1.55712890625, -1.4166259765625, -1.276123046875, -1.1356201171875, -0.9951171875, -0.8546142578125, -0.714111328125, -0.5736083984375, -0.43310546875, -0.2926025390625, -0.152099609375, -0.0115966796875, 0.12890625, 0.2694091796875, 0.409912109375, 0.5504150390625, 0.69091796875, 0.8314208984375, 0.971923828125, 1.1124267578125, 1.2529296875, 1.3934326171875, 1.533935546875, 1.6744384765625, 1.81494140625, 1.9554443359375, 2.095947265625, 2.2364501953125, 2.376953125, 2.5174560546875, 2.657958984375, 2.7984619140625, 2.93896484375, 3.0794677734375, 3.219970703125, 3.3604736328125, 3.5009765625, 3.6414794921875, 3.781982421875, 3.9224853515625, 4.06298828125, 4.2034912109375, 4.343994140625, 4.4844970703125, 4.625]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 5.0, 12.0, 15.0, 15.0, 20.0, 42.0, 50.0, 98.0, 120.0, 232.0, 387.0, 563.0, 992.0, 1617.0, 2965.0, 5506.0, 10949.0, 22306.0, 48232.0, 115099.0, 285374.0, 318659.0, 129779.0, 54266.0, 25059.0, 11932.0, 6308.0, 3308.0, 1849.0, 1072.0, 643.0, 407.0, 232.0, 166.0, 88.0, 54.0, 45.0, 25.0, 15.0, 14.0, 10.0, 11.0, 4.0, 2.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.113037109375, -0.109619140625, -0.106201171875, -0.102783203125, -0.099365234375, -0.095947265625, -0.092529296875, -0.089111328125, -0.085693359375, -0.082275390625, -0.078857421875, -0.075439453125, -0.072021484375, -0.068603515625, -0.065185546875, -0.061767578125, -0.058349609375, -0.054931640625, -0.051513671875, -0.048095703125, -0.044677734375, -0.041259765625, -0.037841796875, -0.034423828125, -0.031005859375, -0.027587890625, -0.024169921875, -0.020751953125, -0.017333984375, -0.013916015625, -0.010498046875, -0.007080078125, -0.003662109375, -0.000244140625, 0.003173828125, 0.006591796875, 0.010009765625, 0.013427734375, 0.016845703125, 0.020263671875, 0.023681640625, 0.027099609375, 0.030517578125, 0.033935546875, 0.037353515625, 0.040771484375, 0.044189453125, 0.047607421875, 0.051025390625, 0.054443359375, 0.057861328125, 0.061279296875, 0.064697265625, 0.068115234375, 0.071533203125, 0.074951171875, 0.078369140625, 0.081787109375, 0.085205078125, 0.088623046875, 0.092041015625, 0.095458984375, 0.098876953125, 0.102294921875, 0.105712890625]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 3.0, 7.0, 5.0, 9.0, 10.0, 8.0, 14.0, 13.0, 21.0, 24.0, 29.0, 36.0, 41.0, 46.0, 65.0, 56.0, 67.0, 52.0, 53.0, 68.0, 43.0, 52.0, 56.0, 50.0, 27.0, 34.0, 18.0, 22.0, 18.0, 12.0, 15.0, 6.0, 4.0, 10.0, 3.0, 4.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2934207916259766e-05, -1.2527219951152802e-05, -1.2120231986045837e-05, -1.1713244020938873e-05, -1.130625605583191e-05, -1.0899268090724945e-05, -1.0492280125617981e-05, -1.0085292160511017e-05, -9.678304195404053e-06, -9.271316230297089e-06, -8.864328265190125e-06, -8.45734030008316e-06, -8.050352334976196e-06, -7.643364369869232e-06, -7.236376404762268e-06, -6.829388439655304e-06, -6.42240047454834e-06, -6.015412509441376e-06, -5.608424544334412e-06, -5.2014365792274475e-06, -4.794448614120483e-06, -4.387460649013519e-06, -3.980472683906555e-06, -3.573484718799591e-06, -3.166496753692627e-06, -2.759508788585663e-06, -2.3525208234786987e-06, -1.9455328583717346e-06, -1.5385448932647705e-06, -1.1315569281578064e-06, -7.245689630508423e-07, -3.175809979438782e-07, 8.940696716308594e-08, 4.9639493227005e-07, 9.033828973770142e-07, 1.3103708624839783e-06, 1.7173588275909424e-06, 2.1243467926979065e-06, 2.5313347578048706e-06, 2.9383227229118347e-06, 3.345310688018799e-06, 3.752298653125763e-06, 4.159286618232727e-06, 4.566274583339691e-06, 4.973262548446655e-06, 5.380250513553619e-06, 5.7872384786605835e-06, 6.194226443767548e-06, 6.601214408874512e-06, 7.008202373981476e-06, 7.41519033908844e-06, 7.822178304195404e-06, 8.229166269302368e-06, 8.636154234409332e-06, 9.043142199516296e-06, 9.45013016462326e-06, 9.857118129730225e-06, 1.0264106094837189e-05, 1.0671094059944153e-05, 1.1078082025051117e-05, 1.1485069990158081e-05, 1.1892057955265045e-05, 1.229904592037201e-05, 1.2706033885478973e-05, 1.3113021850585938e-05]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 3.0, 4.0, 2.0, 5.0, 9.0, 13.0, 16.0, 17.0, 37.0, 45.0, 74.0, 110.0, 143.0, 244.0, 342.0, 482.0, 728.0, 1116.0, 1590.0, 2496.0, 4057.0, 6618.0, 10577.0, 18288.0, 31875.0, 57892.0, 108478.0, 206275.0, 262886.0, 150966.0, 79220.0, 42909.0, 24224.0, 14055.0, 8295.0, 5141.0, 3222.0, 2106.0, 1322.0, 871.0, 544.0, 383.0, 240.0, 172.0, 129.0, 103.0, 79.0, 44.0, 31.0, 28.0, 19.0, 14.0, 11.0, 8.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.0997314453125, -0.09654045104980469, -0.09334945678710938, -0.09015846252441406, -0.08696746826171875, -0.08377647399902344, -0.08058547973632812, -0.07739448547363281, -0.0742034912109375, -0.07101249694824219, -0.06782150268554688, -0.06463050842285156, -0.06143951416015625, -0.05824851989746094, -0.055057525634765625, -0.05186653137207031, -0.048675537109375, -0.04548454284667969, -0.042293548583984375, -0.03910255432128906, -0.03591156005859375, -0.03272056579589844, -0.029529571533203125, -0.026338577270507812, -0.0231475830078125, -0.019956588745117188, -0.016765594482421875, -0.013574600219726562, -0.01038360595703125, -0.0071926116943359375, -0.004001617431640625, -0.0008106231689453125, 0.00238037109375, 0.0055713653564453125, 0.008762359619140625, 0.011953353881835938, 0.01514434814453125, 0.018335342407226562, 0.021526336669921875, 0.024717330932617188, 0.0279083251953125, 0.031099319458007812, 0.034290313720703125, 0.03748130798339844, 0.04067230224609375, 0.04386329650878906, 0.047054290771484375, 0.05024528503417969, 0.053436279296875, 0.05662727355957031, 0.059818267822265625, 0.06300926208496094, 0.06620025634765625, 0.06939125061035156, 0.07258224487304688, 0.07577323913574219, 0.0789642333984375, 0.08215522766113281, 0.08534622192382812, 0.08853721618652344, 0.09172821044921875, 0.09491920471191406, 0.09811019897460938, 0.10130119323730469, 0.1044921875]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 3.0, 6.0, 2.0, 3.0, 7.0, 9.0, 5.0, 6.0, 12.0, 11.0, 10.0, 8.0, 26.0, 17.0, 18.0, 21.0, 27.0, 31.0, 44.0, 63.0, 52.0, 82.0, 102.0, 59.0, 46.0, 53.0, 46.0, 38.0, 22.0, 32.0, 17.0, 17.0, 15.0, 15.0, 17.0, 11.0, 8.0, 10.0, 5.0, 4.0, 6.0, 4.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0], "bins": [-0.033782958984375, -0.032694339752197266, -0.03160572052001953, -0.030517101287841797, -0.029428482055664062, -0.028339862823486328, -0.027251243591308594, -0.02616262435913086, -0.025074005126953125, -0.02398538589477539, -0.022896766662597656, -0.021808147430419922, -0.020719528198242188, -0.019630908966064453, -0.01854228973388672, -0.017453670501708984, -0.01636505126953125, -0.015276432037353516, -0.014187812805175781, -0.013099193572998047, -0.012010574340820312, -0.010921955108642578, -0.009833335876464844, -0.00874471664428711, -0.007656097412109375, -0.006567478179931641, -0.005478858947753906, -0.004390239715576172, -0.0033016204833984375, -0.002213001251220703, -0.0011243820190429688, -3.5762786865234375e-05, 0.0010528564453125, 0.0021414756774902344, 0.0032300949096679688, 0.004318714141845703, 0.0054073333740234375, 0.006495952606201172, 0.007584571838378906, 0.00867319107055664, 0.009761810302734375, 0.01085042953491211, 0.011939048767089844, 0.013027667999267578, 0.014116287231445312, 0.015204906463623047, 0.01629352569580078, 0.017382144927978516, 0.01847076416015625, 0.019559383392333984, 0.02064800262451172, 0.021736621856689453, 0.022825241088867188, 0.023913860321044922, 0.025002479553222656, 0.02609109878540039, 0.027179718017578125, 0.02826833724975586, 0.029356956481933594, 0.030445575714111328, 0.03153419494628906, 0.0326228141784668, 0.03371143341064453, 0.034800052642822266, 0.035888671875]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 6.0, 6.0, 8.0, 9.0, 10.0, 13.0, 19.0, 18.0, 26.0, 38.0, 44.0, 47.0, 44.0, 60.0, 54.0, 56.0, 79.0, 56.0, 62.0, 59.0, 61.0, 52.0, 27.0, 23.0, 33.0, 15.0, 19.0, 7.0, 14.0, 3.0, 6.0, 6.0, 6.0, 4.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-9.1707124710083, -8.903457641601562, -8.63620376586914, -8.368948936462402, -8.101694107055664, -7.834439754486084, -7.567185401916504, -7.299930572509766, -7.0326762199401855, -6.7654218673706055, -6.498167037963867, -6.230912685394287, -5.963658332824707, -5.696403503417969, -5.429149150848389, -5.161894798278809, -4.89463996887207, -4.62738561630249, -4.360130786895752, -4.092876434326172, -3.8256218433380127, -3.5583672523498535, -3.2911128997802734, -3.0238583087921143, -2.756603717803955, -2.489349126815796, -2.2220945358276367, -1.9548401832580566, -1.6875855922698975, -1.4203310012817383, -1.1530765295028687, -0.885822057723999, -0.6185684204101562, -0.35131388902664185, -0.08405935764312744, 0.18319517374038696, 0.45044970512390137, 0.7177042961120605, 0.9849587678909302, 1.2522132396697998, 1.519467830657959, 1.7867224216461182, 2.0539770126342773, 2.3212313652038574, 2.5884859561920166, 2.855740547180176, 3.122994899749756, 3.390249490737915, 3.657504081726074, 3.9247586727142334, 4.192013263702393, 4.459267616271973, 4.726522445678711, 4.993776798248291, 5.261031150817871, 5.528285980224609, 5.7955403327941895, 6.0627946853637695, 6.330049514770508, 6.597303867340088, 6.864558219909668, 7.131813049316406, 7.399067401885986, 7.666321754455566, 7.933576583862305]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 4.0, 6.0, 3.0, 6.0, 7.0, 11.0, 15.0, 16.0, 15.0, 20.0, 25.0, 26.0, 35.0, 25.0, 47.0, 38.0, 31.0, 43.0, 54.0, 48.0, 44.0, 39.0, 45.0, 37.0, 36.0, 39.0, 40.0, 29.0, 29.0, 33.0, 25.0, 21.0, 17.0, 21.0, 10.0, 12.0, 12.0, 11.0, 3.0, 12.0, 2.0, 1.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-7.426126956939697, -7.2002105712890625, -6.974294185638428, -6.748377799987793, -6.522461891174316, -6.296545028686523, -6.070629119873047, -5.844712734222412, -5.618796348571777, -5.392879962921143, -5.166963577270508, -4.941047191619873, -4.715130805969238, -4.489214897155762, -4.263298511505127, -4.037382125854492, -3.8114657402038574, -3.5855493545532227, -3.359632968902588, -3.1337168216705322, -2.9078004360198975, -2.6818840503692627, -2.455967903137207, -2.2300515174865723, -2.0041351318359375, -1.7782187461853027, -1.5523024797439575, -1.3263862133026123, -1.1004698276519775, -0.8745534420013428, -0.6486371755599976, -0.42272090911865234, -0.19680404663085938, 0.029112279415130615, 0.2550286054611206, 0.4809449315071106, 0.7068612575531006, 0.9327776432037354, 1.1586939096450806, 1.3846101760864258, 1.6105265617370605, 1.8364429473876953, 2.06235933303833, 2.2882754802703857, 2.5141918659210205, 2.7401082515716553, 2.966024398803711, 3.1919407844543457, 3.4178571701049805, 3.6437735557556152, 3.86968994140625, 4.095606327056885, 4.3215227127075195, 4.547438621520996, 4.773355007171631, 4.999271392822266, 5.2251877784729, 5.451104164123535, 5.67702054977417, 5.902936935424805, 6.128852844238281, 6.354769706726074, 6.580685615539551, 6.8066020011901855, 7.03251838684082]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 5.0, 9.0, 6.0, 12.0, 13.0, 31.0, 46.0, 75.0, 108.0, 197.0, 240.0, 419.0, 580.0, 847.0, 1277.0, 1968.0, 2992.0, 4515.0, 6568.0, 9870.0, 14731.0, 21528.0, 31760.0, 44734.0, 62142.0, 82398.0, 99893.0, 112816.0, 115019.0, 106764.0, 89867.0, 69938.0, 52152.0, 36737.0, 25783.0, 17400.0, 11578.0, 7806.0, 5273.0, 3472.0, 2233.0, 1571.0, 1085.0, 684.0, 475.0, 332.0, 218.0, 126.0, 90.0, 60.0, 53.0, 27.0, 15.0, 13.0, 10.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.974609375, -3.851226806640625, -3.72784423828125, -3.604461669921875, -3.4810791015625, -3.357696533203125, -3.23431396484375, -3.110931396484375, -2.987548828125, -2.864166259765625, -2.74078369140625, -2.617401123046875, -2.4940185546875, -2.370635986328125, -2.24725341796875, -2.123870849609375, -2.00048828125, -1.877105712890625, -1.75372314453125, -1.630340576171875, -1.5069580078125, -1.383575439453125, -1.26019287109375, -1.136810302734375, -1.013427734375, -0.890045166015625, -0.76666259765625, -0.643280029296875, -0.5198974609375, -0.396514892578125, -0.27313232421875, -0.149749755859375, -0.0263671875, 0.097015380859375, 0.22039794921875, 0.343780517578125, 0.4671630859375, 0.590545654296875, 0.71392822265625, 0.837310791015625, 0.960693359375, 1.084075927734375, 1.20745849609375, 1.330841064453125, 1.4542236328125, 1.577606201171875, 1.70098876953125, 1.824371337890625, 1.94775390625, 2.071136474609375, 2.19451904296875, 2.317901611328125, 2.4412841796875, 2.564666748046875, 2.68804931640625, 2.811431884765625, 2.934814453125, 3.058197021484375, 3.18157958984375, 3.304962158203125, 3.4283447265625, 3.551727294921875, 3.67510986328125, 3.798492431640625, 3.921875]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 6.0, 2.0, 5.0, 2.0, 7.0, 9.0, 16.0, 14.0, 18.0, 17.0, 17.0, 19.0, 26.0, 29.0, 35.0, 50.0, 29.0, 44.0, 45.0, 45.0, 56.0, 46.0, 39.0, 39.0, 46.0, 25.0, 41.0, 29.0, 35.0, 26.0, 24.0, 31.0, 23.0, 16.0, 26.0, 14.0, 10.0, 4.0, 10.0, 7.0, 2.0, 6.0, 7.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-7.3984375, -7.17218017578125, -6.9459228515625, -6.71966552734375, -6.493408203125, -6.26715087890625, -6.0408935546875, -5.81463623046875, -5.58837890625, -5.36212158203125, -5.1358642578125, -4.90960693359375, -4.683349609375, -4.45709228515625, -4.2308349609375, -4.00457763671875, -3.7783203125, -3.55206298828125, -3.3258056640625, -3.09954833984375, -2.873291015625, -2.64703369140625, -2.4207763671875, -2.19451904296875, -1.96826171875, -1.74200439453125, -1.5157470703125, -1.28948974609375, -1.063232421875, -0.83697509765625, -0.6107177734375, -0.38446044921875, -0.158203125, 0.06805419921875, 0.2943115234375, 0.52056884765625, 0.746826171875, 0.97308349609375, 1.1993408203125, 1.42559814453125, 1.65185546875, 1.87811279296875, 2.1043701171875, 2.33062744140625, 2.556884765625, 2.78314208984375, 3.0093994140625, 3.23565673828125, 3.4619140625, 3.68817138671875, 3.9144287109375, 4.14068603515625, 4.366943359375, 4.59320068359375, 4.8194580078125, 5.04571533203125, 5.27197265625, 5.49822998046875, 5.7244873046875, 5.95074462890625, 6.177001953125, 6.40325927734375, 6.6295166015625, 6.85577392578125, 7.08203125]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 10.0, 10.0, 17.0, 41.0, 59.0, 80.0, 125.0, 211.0, 339.0, 599.0, 935.0, 1486.0, 2508.0, 4198.0, 6993.0, 11241.0, 17986.0, 28894.0, 44354.0, 65338.0, 90107.0, 114383.0, 130586.0, 130549.0, 115482.0, 91982.0, 67129.0, 45383.0, 29415.0, 18649.0, 11628.0, 6993.0, 4293.0, 2563.0, 1600.0, 949.0, 554.0, 335.0, 225.0, 123.0, 78.0, 46.0, 28.0, 18.0, 11.0, 9.0, 7.0, 5.0, 0.0, 4.0, 2.0, 0.0, 1.0], "bins": [-4.8828125, -4.73931884765625, -4.5958251953125, -4.45233154296875, -4.308837890625, -4.16534423828125, -4.0218505859375, -3.87835693359375, -3.73486328125, -3.59136962890625, -3.4478759765625, -3.30438232421875, -3.160888671875, -3.01739501953125, -2.8739013671875, -2.73040771484375, -2.5869140625, -2.44342041015625, -2.2999267578125, -2.15643310546875, -2.012939453125, -1.86944580078125, -1.7259521484375, -1.58245849609375, -1.43896484375, -1.29547119140625, -1.1519775390625, -1.00848388671875, -0.864990234375, -0.72149658203125, -0.5780029296875, -0.43450927734375, -0.291015625, -0.14752197265625, -0.0040283203125, 0.13946533203125, 0.282958984375, 0.42645263671875, 0.5699462890625, 0.71343994140625, 0.85693359375, 1.00042724609375, 1.1439208984375, 1.28741455078125, 1.430908203125, 1.57440185546875, 1.7178955078125, 1.86138916015625, 2.0048828125, 2.14837646484375, 2.2918701171875, 2.43536376953125, 2.578857421875, 2.72235107421875, 2.8658447265625, 3.00933837890625, 3.15283203125, 3.29632568359375, 3.4398193359375, 3.58331298828125, 3.726806640625, 3.87030029296875, 4.0137939453125, 4.15728759765625, 4.30078125]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 5.0, 5.0, 9.0, 7.0, 6.0, 10.0, 9.0, 9.0, 7.0, 16.0, 13.0, 18.0, 14.0, 40.0, 27.0, 16.0, 30.0, 31.0, 33.0, 34.0, 25.0, 40.0, 36.0, 33.0, 38.0, 32.0, 33.0, 38.0, 32.0, 26.0, 38.0, 22.0, 32.0, 32.0, 29.0, 20.0, 28.0, 20.0, 13.0, 14.0, 14.0, 16.0, 18.0, 4.0, 7.0, 5.0, 1.0, 6.0, 6.0, 8.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-3.419921875, -3.303314208984375, -3.18670654296875, -3.070098876953125, -2.9534912109375, -2.836883544921875, -2.72027587890625, -2.603668212890625, -2.487060546875, -2.370452880859375, -2.25384521484375, -2.137237548828125, -2.0206298828125, -1.904022216796875, -1.78741455078125, -1.670806884765625, -1.55419921875, -1.437591552734375, -1.32098388671875, -1.204376220703125, -1.0877685546875, -0.971160888671875, -0.85455322265625, -0.737945556640625, -0.621337890625, -0.504730224609375, -0.38812255859375, -0.271514892578125, -0.1549072265625, -0.038299560546875, 0.07830810546875, 0.194915771484375, 0.3115234375, 0.428131103515625, 0.54473876953125, 0.661346435546875, 0.7779541015625, 0.894561767578125, 1.01116943359375, 1.127777099609375, 1.244384765625, 1.360992431640625, 1.47760009765625, 1.594207763671875, 1.7108154296875, 1.827423095703125, 1.94403076171875, 2.060638427734375, 2.17724609375, 2.293853759765625, 2.41046142578125, 2.527069091796875, 2.6436767578125, 2.760284423828125, 2.87689208984375, 2.993499755859375, 3.110107421875, 3.226715087890625, 3.34332275390625, 3.459930419921875, 3.5765380859375, 3.693145751953125, 3.80975341796875, 3.926361083984375, 4.04296875]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 4.0, 4.0, 5.0, 7.0, 10.0, 16.0, 16.0, 36.0, 44.0, 59.0, 97.0, 118.0, 156.0, 203.0, 325.0, 463.0, 660.0, 1000.0, 1587.0, 2493.0, 3987.0, 6640.0, 11257.0, 18997.0, 32278.0, 53394.0, 85148.0, 123814.0, 155092.0, 160575.0, 135185.0, 97240.0, 62416.0, 38510.0, 22529.0, 13447.0, 7758.0, 4762.0, 2845.0, 1750.0, 1177.0, 771.0, 536.0, 325.0, 210.0, 180.0, 127.0, 92.0, 71.0, 46.0, 29.0, 24.0, 17.0, 14.0, 10.0, 7.0, 1.0, 5.0, 0.0, 2.0, 2.0], "bins": [-2.158203125, -2.091094970703125, -2.02398681640625, -1.956878662109375, -1.8897705078125, -1.822662353515625, -1.75555419921875, -1.688446044921875, -1.621337890625, -1.554229736328125, -1.48712158203125, -1.420013427734375, -1.3529052734375, -1.285797119140625, -1.21868896484375, -1.151580810546875, -1.08447265625, -1.017364501953125, -0.95025634765625, -0.883148193359375, -0.8160400390625, -0.748931884765625, -0.68182373046875, -0.614715576171875, -0.547607421875, -0.480499267578125, -0.41339111328125, -0.346282958984375, -0.2791748046875, -0.212066650390625, -0.14495849609375, -0.077850341796875, -0.0107421875, 0.056365966796875, 0.12347412109375, 0.190582275390625, 0.2576904296875, 0.324798583984375, 0.39190673828125, 0.459014892578125, 0.526123046875, 0.593231201171875, 0.66033935546875, 0.727447509765625, 0.7945556640625, 0.861663818359375, 0.92877197265625, 0.995880126953125, 1.06298828125, 1.130096435546875, 1.19720458984375, 1.264312744140625, 1.3314208984375, 1.398529052734375, 1.46563720703125, 1.532745361328125, 1.599853515625, 1.666961669921875, 1.73406982421875, 1.801177978515625, 1.8682861328125, 1.935394287109375, 2.00250244140625, 2.069610595703125, 2.13671875]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 7.0, 5.0, 4.0, 4.0, 8.0, 16.0, 19.0, 21.0, 27.0, 23.0, 27.0, 36.0, 31.0, 40.0, 54.0, 60.0, 48.0, 60.0, 51.0, 57.0, 52.0, 61.0, 58.0, 37.0, 27.0, 28.0, 38.0, 28.0, 11.0, 11.0, 9.0, 11.0, 9.0, 6.0, 3.0, 3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00017952919006347656, -0.00017348118126392365, -0.00016743317246437073, -0.0001613851636648178, -0.0001553371548652649, -0.00014928914606571198, -0.00014324113726615906, -0.00013719312846660614, -0.00013114511966705322, -0.0001250971108675003, -0.00011904910206794739, -0.00011300109326839447, -0.00010695308446884155, -0.00010090507566928864, -9.485706686973572e-05, -8.88090580701828e-05, -8.276104927062988e-05, -7.671304047107697e-05, -7.066503167152405e-05, -6.461702287197113e-05, -5.856901407241821e-05, -5.2521005272865295e-05, -4.647299647331238e-05, -4.042498767375946e-05, -3.437697887420654e-05, -2.8328970074653625e-05, -2.2280961275100708e-05, -1.623295247554779e-05, -1.0184943675994873e-05, -4.1369348764419556e-06, 1.911073923110962e-06, 7.95908272266388e-06, 1.4007091522216797e-05, 2.0055100321769714e-05, 2.6103109121322632e-05, 3.215111792087555e-05, 3.819912672042847e-05, 4.4247135519981384e-05, 5.02951443195343e-05, 5.634315311908722e-05, 6.239116191864014e-05, 6.843917071819305e-05, 7.448717951774597e-05, 8.053518831729889e-05, 8.65831971168518e-05, 9.263120591640472e-05, 9.867921471595764e-05, 0.00010472722351551056, 0.00011077523231506348, 0.0001168232411146164, 0.0001228712499141693, 0.00012891925871372223, 0.00013496726751327515, 0.00014101527631282806, 0.00014706328511238098, 0.0001531112939119339, 0.00015915930271148682, 0.00016520731151103973, 0.00017125532031059265, 0.00017730332911014557, 0.00018335133790969849, 0.0001893993467092514, 0.00019544735550880432, 0.00020149536430835724, 0.00020754337310791016]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 10.0, 16.0, 17.0, 16.0, 42.0, 49.0, 74.0, 137.0, 175.0, 293.0, 424.0, 618.0, 980.0, 1573.0, 2523.0, 4241.0, 7461.0, 12234.0, 21149.0, 36829.0, 61637.0, 98913.0, 142909.0, 171071.0, 161955.0, 123326.0, 80932.0, 49400.0, 28694.0, 16480.0, 9677.0, 5663.0, 3383.0, 2063.0, 1308.0, 762.0, 520.0, 324.0, 218.0, 143.0, 92.0, 64.0, 54.0, 34.0, 26.0, 16.0, 5.0, 10.0, 7.0, 6.0, 2.0, 1.0, 4.0, 2.0, 1.0], "bins": [-2.4375, -2.363128662109375, -2.28875732421875, -2.214385986328125, -2.1400146484375, -2.065643310546875, -1.99127197265625, -1.916900634765625, -1.842529296875, -1.768157958984375, -1.69378662109375, -1.619415283203125, -1.5450439453125, -1.470672607421875, -1.39630126953125, -1.321929931640625, -1.24755859375, -1.173187255859375, -1.09881591796875, -1.024444580078125, -0.9500732421875, -0.875701904296875, -0.80133056640625, -0.726959228515625, -0.652587890625, -0.578216552734375, -0.50384521484375, -0.429473876953125, -0.3551025390625, -0.280731201171875, -0.20635986328125, -0.131988525390625, -0.0576171875, 0.016754150390625, 0.09112548828125, 0.165496826171875, 0.2398681640625, 0.314239501953125, 0.38861083984375, 0.462982177734375, 0.537353515625, 0.611724853515625, 0.68609619140625, 0.760467529296875, 0.8348388671875, 0.909210205078125, 0.98358154296875, 1.057952880859375, 1.13232421875, 1.206695556640625, 1.28106689453125, 1.355438232421875, 1.4298095703125, 1.504180908203125, 1.57855224609375, 1.652923583984375, 1.727294921875, 1.801666259765625, 1.87603759765625, 1.950408935546875, 2.0247802734375, 2.099151611328125, 2.17352294921875, 2.247894287109375, 2.322265625]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 3.0, 3.0, 7.0, 6.0, 9.0, 7.0, 5.0, 8.0, 16.0, 20.0, 27.0, 23.0, 28.0, 40.0, 49.0, 35.0, 58.0, 72.0, 58.0, 49.0, 71.0, 55.0, 55.0, 37.0, 41.0, 40.0, 27.0, 34.0, 24.0, 19.0, 13.0, 12.0, 12.0, 5.0, 6.0, 7.0, 5.0, 5.0, 6.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.84765625, -0.8224563598632812, -0.7972564697265625, -0.7720565795898438, -0.746856689453125, -0.7216567993164062, -0.6964569091796875, -0.6712570190429688, -0.64605712890625, -0.6208572387695312, -0.5956573486328125, -0.5704574584960938, -0.545257568359375, -0.5200576782226562, -0.4948577880859375, -0.46965789794921875, -0.4444580078125, -0.41925811767578125, -0.3940582275390625, -0.36885833740234375, -0.343658447265625, -0.31845855712890625, -0.2932586669921875, -0.26805877685546875, -0.24285888671875, -0.21765899658203125, -0.1924591064453125, -0.16725921630859375, -0.142059326171875, -0.11685943603515625, -0.0916595458984375, -0.06645965576171875, -0.041259765625, -0.01605987548828125, 0.0091400146484375, 0.03433990478515625, 0.059539794921875, 0.08473968505859375, 0.1099395751953125, 0.13513946533203125, 0.16033935546875, 0.18553924560546875, 0.2107391357421875, 0.23593902587890625, 0.261138916015625, 0.28633880615234375, 0.3115386962890625, 0.33673858642578125, 0.3619384765625, 0.38713836669921875, 0.4123382568359375, 0.43753814697265625, 0.462738037109375, 0.48793792724609375, 0.5131378173828125, 0.5383377075195312, 0.56353759765625, 0.5887374877929688, 0.6139373779296875, 0.6391372680664062, 0.664337158203125, 0.6895370483398438, 0.7147369384765625, 0.7399368286132812, 0.76513671875]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 7.0, 7.0, 8.0, 10.0, 17.0, 25.0, 16.0, 26.0, 32.0, 33.0, 34.0, 39.0, 56.0, 62.0, 63.0, 69.0, 65.0, 69.0, 58.0, 53.0, 47.0, 51.0, 23.0, 20.0, 26.0, 11.0, 14.0, 13.0, 9.0, 8.0, 8.0, 8.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-9.507555961608887, -9.239373207092285, -8.97119140625, -8.703008651733398, -8.434825897216797, -8.166643142700195, -7.89846134185791, -7.630278587341309, -7.362096309661865, -7.093914031982422, -6.82573127746582, -6.557548999786377, -6.289366722106934, -6.021183967590332, -5.753001689910889, -5.484819412231445, -5.216636657714844, -4.9484543800354, -4.680271625518799, -4.4120893478393555, -4.143906593322754, -3.8757243156433105, -3.607542037963867, -3.3393595218658447, -3.0711770057678223, -2.8029944896698, -2.5348119735717773, -2.266629695892334, -1.9984471797943115, -1.730264663696289, -1.4620822668075562, -1.1938998699188232, -0.925717830657959, -0.6575353741645813, -0.3893529176712036, -0.12117046117782593, 0.14701199531555176, 0.4151945114135742, 0.6833769083023071, 0.95155930519104, 1.2197418212890625, 1.487924337387085, 1.7561067342758179, 2.024289131164551, 2.2924716472625732, 2.5606541633605957, 2.828836441040039, 3.0970189571380615, 3.365201473236084, 3.6333839893341064, 3.901566505432129, 4.169748783111572, 4.437931060791016, 4.706113815307617, 4.9742960929870605, 5.242478370666504, 5.5106611251831055, 5.778843402862549, 6.04702615737915, 6.315208435058594, 6.583391189575195, 6.851573467254639, 7.119755744934082, 7.387938499450684, 7.656120777130127]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 7.0, 7.0, 4.0, 10.0, 7.0, 11.0, 11.0, 20.0, 17.0, 23.0, 34.0, 25.0, 29.0, 33.0, 35.0, 38.0, 55.0, 54.0, 49.0, 55.0, 36.0, 49.0, 44.0, 49.0, 36.0, 27.0, 36.0, 27.0, 33.0, 28.0, 17.0, 23.0, 15.0, 14.0, 12.0, 8.0, 6.0, 8.0, 4.0, 6.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.208320617675781, -7.959070205688477, -7.70982027053833, -7.460569858551025, -7.211319923400879, -6.962069511413574, -6.7128190994262695, -6.463569164276123, -6.214319229125977, -5.965068817138672, -5.715818881988525, -5.466568470001221, -5.217318534851074, -4.9680681228637695, -4.718817710876465, -4.469567775726318, -4.220317363739014, -3.971067190170288, -3.7218170166015625, -3.472566604614258, -3.2233166694641113, -2.9740662574768066, -2.724816083908081, -2.4755659103393555, -2.22631573677063, -1.9770655632019043, -1.7278153896331787, -1.4785650968551636, -1.229314923286438, -0.9800647497177124, -0.7308144569396973, -0.4815642833709717, -0.2323141098022461, 0.01693609356880188, 0.26618629693984985, 0.5154365301132202, 0.7646867036819458, 1.0139368772506714, 1.2631871700286865, 1.512437343597412, 1.7616875171661377, 2.0109376907348633, 2.260187864303589, 2.5094380378723145, 2.758688449859619, 3.0079383850097656, 3.2571887969970703, 3.506438970565796, 3.7556891441345215, 4.004939556121826, 4.254189491271973, 4.503439903259277, 4.752689838409424, 5.0019402503967285, 5.251190185546875, 5.50044059753418, 5.749691009521484, 5.998941421508789, 6.2481913566589355, 6.49744176864624, 6.746691703796387, 6.995942115783691, 7.245192527770996, 7.494442462921143, 7.743692398071289]}, "gradients/decoder.bert.encoder.layer.4.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 6.0, 3.0, 12.0, 24.0, 28.0, 53.0, 62.0, 123.0, 177.0, 272.0, 449.0, 711.0, 1099.0, 1834.0, 3039.0, 5363.0, 9414.0, 16326.0, 28931.0, 53294.0, 96871.0, 177209.0, 311752.0, 506743.0, 697322.0, 744236.0, 607475.0, 398536.0, 235995.0, 130837.0, 72500.0, 40224.0, 22564.0, 12815.0, 7051.0, 4247.0, 2555.0, 1539.0, 968.0, 616.0, 390.0, 223.0, 154.0, 78.0, 56.0, 39.0, 28.0, 14.0, 11.0, 8.0, 7.0, 4.0, 4.0, 1.0, 2.0, 2.0], "bins": [-7.47265625, -7.2479248046875, -7.023193359375, -6.7984619140625, -6.57373046875, -6.3489990234375, -6.124267578125, -5.8995361328125, -5.6748046875, -5.4500732421875, -5.225341796875, -5.0006103515625, -4.77587890625, -4.5511474609375, -4.326416015625, -4.1016845703125, -3.876953125, -3.6522216796875, -3.427490234375, -3.2027587890625, -2.97802734375, -2.7532958984375, -2.528564453125, -2.3038330078125, -2.0791015625, -1.8543701171875, -1.629638671875, -1.4049072265625, -1.18017578125, -0.9554443359375, -0.730712890625, -0.5059814453125, -0.28125, -0.0565185546875, 0.168212890625, 0.3929443359375, 0.61767578125, 0.8424072265625, 1.067138671875, 1.2918701171875, 1.5166015625, 1.7413330078125, 1.966064453125, 2.1907958984375, 2.41552734375, 2.6402587890625, 2.864990234375, 3.0897216796875, 3.314453125, 3.5391845703125, 3.763916015625, 3.9886474609375, 4.21337890625, 4.4381103515625, 4.662841796875, 4.8875732421875, 5.1123046875, 5.3370361328125, 5.561767578125, 5.7864990234375, 6.01123046875, 6.2359619140625, 6.460693359375, 6.6854248046875, 6.91015625]}, "gradients/decoder.bert.encoder.layer.4.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 3.0, 5.0, 4.0, 5.0, 7.0, 9.0, 8.0, 15.0, 22.0, 13.0, 21.0, 37.0, 24.0, 34.0, 39.0, 41.0, 39.0, 46.0, 51.0, 64.0, 46.0, 49.0, 48.0, 51.0, 41.0, 43.0, 25.0, 35.0, 33.0, 32.0, 19.0, 12.0, 18.0, 18.0, 10.0, 6.0, 9.0, 8.0, 5.0, 5.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.171875, -5.9761962890625, -5.780517578125, -5.5848388671875, -5.38916015625, -5.1934814453125, -4.997802734375, -4.8021240234375, -4.6064453125, -4.4107666015625, -4.215087890625, -4.0194091796875, -3.82373046875, -3.6280517578125, -3.432373046875, -3.2366943359375, -3.041015625, -2.8453369140625, -2.649658203125, -2.4539794921875, -2.25830078125, -2.0626220703125, -1.866943359375, -1.6712646484375, -1.4755859375, -1.2799072265625, -1.084228515625, -0.8885498046875, -0.69287109375, -0.4971923828125, -0.301513671875, -0.1058349609375, 0.08984375, 0.2855224609375, 0.481201171875, 0.6768798828125, 0.87255859375, 1.0682373046875, 1.263916015625, 1.4595947265625, 1.6552734375, 1.8509521484375, 2.046630859375, 2.2423095703125, 2.43798828125, 2.6336669921875, 2.829345703125, 3.0250244140625, 3.220703125, 3.4163818359375, 3.612060546875, 3.8077392578125, 4.00341796875, 4.1990966796875, 4.394775390625, 4.5904541015625, 4.7861328125, 4.9818115234375, 5.177490234375, 5.3731689453125, 5.56884765625, 5.7645263671875, 5.960205078125, 6.1558837890625, 6.3515625]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 6.0, 9.0, 7.0, 16.0, 25.0, 50.0, 63.0, 117.0, 153.0, 268.0, 445.0, 668.0, 1086.0, 1851.0, 2956.0, 4915.0, 8256.0, 13761.0, 23716.0, 40740.0, 67901.0, 114191.0, 185127.0, 286989.0, 412408.0, 530049.0, 592332.0, 561109.0, 457836.0, 330180.0, 219053.0, 135921.0, 82555.0, 48589.0, 28743.0, 17068.0, 10070.0, 5947.0, 3501.0, 2106.0, 1339.0, 862.0, 473.0, 322.0, 207.0, 118.0, 70.0, 45.0, 36.0, 22.0, 9.0, 7.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.390625, -6.18890380859375, -5.9871826171875, -5.78546142578125, -5.583740234375, -5.38201904296875, -5.1802978515625, -4.97857666015625, -4.77685546875, -4.57513427734375, -4.3734130859375, -4.17169189453125, -3.969970703125, -3.76824951171875, -3.5665283203125, -3.36480712890625, -3.1630859375, -2.96136474609375, -2.7596435546875, -2.55792236328125, -2.356201171875, -2.15447998046875, -1.9527587890625, -1.75103759765625, -1.54931640625, -1.34759521484375, -1.1458740234375, -0.94415283203125, -0.742431640625, -0.54071044921875, -0.3389892578125, -0.13726806640625, 0.064453125, 0.26617431640625, 0.4678955078125, 0.66961669921875, 0.871337890625, 1.07305908203125, 1.2747802734375, 1.47650146484375, 1.67822265625, 1.87994384765625, 2.0816650390625, 2.28338623046875, 2.485107421875, 2.68682861328125, 2.8885498046875, 3.09027099609375, 3.2919921875, 3.49371337890625, 3.6954345703125, 3.89715576171875, 4.098876953125, 4.30059814453125, 4.5023193359375, 4.70404052734375, 4.90576171875, 5.10748291015625, 5.3092041015625, 5.51092529296875, 5.712646484375, 5.91436767578125, 6.1160888671875, 6.31781005859375, 6.51953125]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 5.0, 4.0, 4.0, 8.0, 12.0, 8.0, 20.0, 20.0, 20.0, 26.0, 38.0, 57.0, 68.0, 81.0, 79.0, 93.0, 100.0, 133.0, 125.0, 178.0, 164.0, 197.0, 185.0, 216.0, 218.0, 219.0, 201.0, 181.0, 169.0, 174.0, 159.0, 161.0, 125.0, 102.0, 96.0, 75.0, 54.0, 67.0, 50.0, 31.0, 27.0, 32.0, 18.0, 16.0, 19.0, 14.0, 9.0, 3.0, 5.0, 8.0, 3.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-2.33203125, -2.2496337890625, -2.167236328125, -2.0848388671875, -2.00244140625, -1.9200439453125, -1.837646484375, -1.7552490234375, -1.6728515625, -1.5904541015625, -1.508056640625, -1.4256591796875, -1.34326171875, -1.2608642578125, -1.178466796875, -1.0960693359375, -1.013671875, -0.9312744140625, -0.848876953125, -0.7664794921875, -0.68408203125, -0.6016845703125, -0.519287109375, -0.4368896484375, -0.3544921875, -0.2720947265625, -0.189697265625, -0.1072998046875, -0.02490234375, 0.0574951171875, 0.139892578125, 0.2222900390625, 0.3046875, 0.3870849609375, 0.469482421875, 0.5518798828125, 0.63427734375, 0.7166748046875, 0.799072265625, 0.8814697265625, 0.9638671875, 1.0462646484375, 1.128662109375, 1.2110595703125, 1.29345703125, 1.3758544921875, 1.458251953125, 1.5406494140625, 1.623046875, 1.7054443359375, 1.787841796875, 1.8702392578125, 1.95263671875, 2.0350341796875, 2.117431640625, 2.1998291015625, 2.2822265625, 2.3646240234375, 2.447021484375, 2.5294189453125, 2.61181640625, 2.6942138671875, 2.776611328125, 2.8590087890625, 2.94140625]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 9.0, 5.0, 9.0, 12.0, 15.0, 22.0, 14.0, 27.0, 33.0, 47.0, 59.0, 54.0, 59.0, 76.0, 63.0, 65.0, 75.0, 65.0, 52.0, 43.0, 42.0, 30.0, 28.0, 16.0, 18.0, 19.0, 12.0, 6.0, 10.0, 5.0, 3.0, 6.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.520401954650879, -10.192163467407227, -9.863924026489258, -9.535685539245605, -9.207447052001953, -8.8792085647583, -8.550969123840332, -8.22273063659668, -7.894492149353027, -7.566253185272217, -7.2380146980285645, -6.909775733947754, -6.581537246704102, -6.253298282623291, -5.9250593185424805, -5.596820831298828, -5.268581867218018, -4.940342903137207, -4.612104415893555, -4.283865451812744, -3.955626964569092, -3.6273880004882812, -3.29914927482605, -2.9709105491638184, -2.642671823501587, -2.3144330978393555, -1.986194372177124, -1.657955527305603, -1.3297168016433716, -1.0014780759811401, -0.6732392311096191, -0.3450005054473877, -0.01676177978515625, 0.3114769756793976, 0.6397157311439514, 0.9679545164108276, 1.296193242073059, 1.6244319677352905, 1.9526708126068115, 2.280909538269043, 2.6091482639312744, 2.937386989593506, 3.2656257152557373, 3.5938644409179688, 3.9221034049987793, 4.250341892242432, 4.578580856323242, 4.9068193435668945, 5.235058307647705, 5.563297271728516, 5.891535758972168, 6.2197747230529785, 6.548013210296631, 6.876252174377441, 7.204490661621094, 7.532729625701904, 7.860968589782715, 8.189207077026367, 8.517446517944336, 8.845685005187988, 9.17392349243164, 9.502161979675293, 9.830401420593262, 10.158639907836914, 10.486878395080566]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 6.0, 4.0, 12.0, 9.0, 15.0, 15.0, 11.0, 13.0, 20.0, 18.0, 26.0, 35.0, 21.0, 28.0, 41.0, 41.0, 45.0, 46.0, 48.0, 49.0, 55.0, 39.0, 40.0, 23.0, 37.0, 41.0, 34.0, 31.0, 22.0, 30.0, 24.0, 19.0, 21.0, 14.0, 12.0, 13.0, 11.0, 8.0, 7.0, 7.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-8.61169719696045, -8.359784126281738, -8.107870101928711, -7.85595703125, -7.604043483734131, -7.352129936218262, -7.100216865539551, -6.848303318023682, -6.5963897705078125, -6.344476222991943, -6.092562675476074, -5.840649604797363, -5.588736057281494, -5.336822509765625, -5.084909439086914, -4.832995891571045, -4.581082344055176, -4.329168796539307, -4.0772552490234375, -3.8253421783447266, -3.5734286308288574, -3.3215150833129883, -3.0696017742156982, -2.817688465118408, -2.565774917602539, -2.31386137008667, -2.06194806098938, -1.8100346326828003, -1.5581212043762207, -1.3062077760696411, -1.0542943477630615, -0.8023809194564819, -0.5504665374755859, -0.29855310916900635, -0.04663968086242676, 0.20527374744415283, 0.4571871757507324, 0.709100604057312, 0.9610140323638916, 1.2129274606704712, 1.4648408889770508, 1.7167543172836304, 1.96866774559021, 2.2205810546875, 2.472494602203369, 2.7244081497192383, 2.9763214588165283, 3.2282347679138184, 3.4801483154296875, 3.7320618629455566, 3.9839751720428467, 4.235888481140137, 4.487802028656006, 4.739715576171875, 4.991628646850586, 5.243542194366455, 5.495455741882324, 5.747369289398193, 5.9992828369140625, 6.251195907592773, 6.503109455108643, 6.755023002624512, 7.006936073303223, 7.258849620819092, 7.510763168334961]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 14.0, 14.0, 22.0, 42.0, 66.0, 91.0, 141.0, 237.0, 382.0, 593.0, 1034.0, 1679.0, 2764.0, 4631.0, 7998.0, 13780.0, 23854.0, 41219.0, 71186.0, 120326.0, 184046.0, 206753.0, 148300.0, 91918.0, 53890.0, 30775.0, 17784.0, 10203.0, 6030.0, 3532.0, 2093.0, 1224.0, 733.0, 454.0, 257.0, 168.0, 126.0, 76.0, 42.0, 24.0, 17.0, 19.0, 11.0, 7.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.048828125, -1.01031494140625, -0.9718017578125, -0.93328857421875, -0.894775390625, -0.85626220703125, -0.8177490234375, -0.77923583984375, -0.74072265625, -0.70220947265625, -0.6636962890625, -0.62518310546875, -0.586669921875, -0.54815673828125, -0.5096435546875, -0.47113037109375, -0.4326171875, -0.39410400390625, -0.3555908203125, -0.31707763671875, -0.278564453125, -0.24005126953125, -0.2015380859375, -0.16302490234375, -0.12451171875, -0.08599853515625, -0.0474853515625, -0.00897216796875, 0.029541015625, 0.06805419921875, 0.1065673828125, 0.14508056640625, 0.18359375, 0.22210693359375, 0.2606201171875, 0.29913330078125, 0.337646484375, 0.37615966796875, 0.4146728515625, 0.45318603515625, 0.49169921875, 0.53021240234375, 0.5687255859375, 0.60723876953125, 0.645751953125, 0.68426513671875, 0.7227783203125, 0.76129150390625, 0.7998046875, 0.83831787109375, 0.8768310546875, 0.91534423828125, 0.953857421875, 0.99237060546875, 1.0308837890625, 1.06939697265625, 1.10791015625, 1.14642333984375, 1.1849365234375, 1.22344970703125, 1.261962890625, 1.30047607421875, 1.3389892578125, 1.37750244140625, 1.416015625]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 9.0, 5.0, 4.0, 10.0, 4.0, 8.0, 19.0, 20.0, 17.0, 20.0, 27.0, 21.0, 39.0, 29.0, 32.0, 24.0, 31.0, 50.0, 46.0, 57.0, 41.0, 46.0, 42.0, 39.0, 38.0, 37.0, 45.0, 30.0, 25.0, 28.0, 30.0, 17.0, 17.0, 18.0, 15.0, 10.0, 9.0, 13.0, 7.0, 6.0, 6.0, 5.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-8.6171875, -8.3546142578125, -8.092041015625, -7.8294677734375, -7.56689453125, -7.3043212890625, -7.041748046875, -6.7791748046875, -6.5166015625, -6.2540283203125, -5.991455078125, -5.7288818359375, -5.46630859375, -5.2037353515625, -4.941162109375, -4.6785888671875, -4.416015625, -4.1534423828125, -3.890869140625, -3.6282958984375, -3.36572265625, -3.1031494140625, -2.840576171875, -2.5780029296875, -2.3154296875, -2.0528564453125, -1.790283203125, -1.5277099609375, -1.26513671875, -1.0025634765625, -0.739990234375, -0.4774169921875, -0.21484375, 0.0477294921875, 0.310302734375, 0.5728759765625, 0.83544921875, 1.0980224609375, 1.360595703125, 1.6231689453125, 1.8857421875, 2.1483154296875, 2.410888671875, 2.6734619140625, 2.93603515625, 3.1986083984375, 3.461181640625, 3.7237548828125, 3.986328125, 4.2489013671875, 4.511474609375, 4.7740478515625, 5.03662109375, 5.2991943359375, 5.561767578125, 5.8243408203125, 6.0869140625, 6.3494873046875, 6.612060546875, 6.8746337890625, 7.13720703125, 7.3997802734375, 7.662353515625, 7.9249267578125, 8.1875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 4.0, 4.0, 10.0, 12.0, 15.0, 32.0, 29.0, 34.0, 61.0, 95.0, 159.0, 222.0, 331.0, 520.0, 790.0, 1268.0, 1942.0, 2883.0, 4655.0, 7261.0, 11377.0, 17893.0, 28767.0, 45513.0, 71613.0, 109596.0, 155975.0, 176002.0, 142692.0, 97165.0, 62987.0, 39952.0, 25057.0, 15595.0, 10069.0, 6428.0, 4042.0, 2683.0, 1658.0, 1055.0, 713.0, 472.0, 309.0, 206.0, 134.0, 99.0, 60.0, 44.0, 26.0, 12.0, 15.0, 15.0, 4.0, 10.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.087890625, -1.053192138671875, -1.01849365234375, -0.983795166015625, -0.9490966796875, -0.914398193359375, -0.87969970703125, -0.845001220703125, -0.810302734375, -0.775604248046875, -0.74090576171875, -0.706207275390625, -0.6715087890625, -0.636810302734375, -0.60211181640625, -0.567413330078125, -0.53271484375, -0.498016357421875, -0.46331787109375, -0.428619384765625, -0.3939208984375, -0.359222412109375, -0.32452392578125, -0.289825439453125, -0.255126953125, -0.220428466796875, -0.18572998046875, -0.151031494140625, -0.1163330078125, -0.081634521484375, -0.04693603515625, -0.012237548828125, 0.0224609375, 0.057159423828125, 0.09185791015625, 0.126556396484375, 0.1612548828125, 0.195953369140625, 0.23065185546875, 0.265350341796875, 0.300048828125, 0.334747314453125, 0.36944580078125, 0.404144287109375, 0.4388427734375, 0.473541259765625, 0.50823974609375, 0.542938232421875, 0.57763671875, 0.612335205078125, 0.64703369140625, 0.681732177734375, 0.7164306640625, 0.751129150390625, 0.78582763671875, 0.820526123046875, 0.855224609375, 0.889923095703125, 0.92462158203125, 0.959320068359375, 0.9940185546875, 1.028717041015625, 1.06341552734375, 1.098114013671875, 1.1328125]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 4.0, 2.0, 9.0, 5.0, 8.0, 8.0, 17.0, 19.0, 23.0, 16.0, 24.0, 35.0, 31.0, 27.0, 30.0, 43.0, 35.0, 35.0, 48.0, 43.0, 32.0, 36.0, 43.0, 51.0, 33.0, 31.0, 38.0, 37.0, 32.0, 25.0, 29.0, 27.0, 29.0, 21.0, 14.0, 8.0, 12.0, 8.0, 8.0, 8.0, 5.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-5.37890625, -5.2154541015625, -5.052001953125, -4.8885498046875, -4.72509765625, -4.5616455078125, -4.398193359375, -4.2347412109375, -4.0712890625, -3.9078369140625, -3.744384765625, -3.5809326171875, -3.41748046875, -3.2540283203125, -3.090576171875, -2.9271240234375, -2.763671875, -2.6002197265625, -2.436767578125, -2.2733154296875, -2.10986328125, -1.9464111328125, -1.782958984375, -1.6195068359375, -1.4560546875, -1.2926025390625, -1.129150390625, -0.9656982421875, -0.80224609375, -0.6387939453125, -0.475341796875, -0.3118896484375, -0.1484375, 0.0150146484375, 0.178466796875, 0.3419189453125, 0.50537109375, 0.6688232421875, 0.832275390625, 0.9957275390625, 1.1591796875, 1.3226318359375, 1.486083984375, 1.6495361328125, 1.81298828125, 1.9764404296875, 2.139892578125, 2.3033447265625, 2.466796875, 2.6302490234375, 2.793701171875, 2.9571533203125, 3.12060546875, 3.2840576171875, 3.447509765625, 3.6109619140625, 3.7744140625, 3.9378662109375, 4.101318359375, 4.2647705078125, 4.42822265625, 4.5916748046875, 4.755126953125, 4.9185791015625, 5.08203125]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 9.0, 4.0, 7.0, 10.0, 8.0, 14.0, 24.0, 40.0, 49.0, 108.0, 137.0, 223.0, 373.0, 634.0, 1315.0, 2487.0, 5449.0, 12043.0, 29898.0, 78930.0, 225944.0, 408326.0, 175891.0, 62841.0, 24490.0, 9973.0, 4620.0, 2131.0, 1143.0, 551.0, 321.0, 191.0, 120.0, 84.0, 58.0, 35.0, 29.0, 14.0, 6.0, 9.0, 6.0, 5.0, 8.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.150146484375, -0.14564895629882812, -0.14115142822265625, -0.13665390014648438, -0.1321563720703125, -0.12765884399414062, -0.12316131591796875, -0.11866378784179688, -0.114166259765625, -0.10966873168945312, -0.10517120361328125, -0.10067367553710938, -0.0961761474609375, -0.09167861938476562, -0.08718109130859375, -0.08268356323242188, -0.07818603515625, -0.07368850708007812, -0.06919097900390625, -0.06469345092773438, -0.0601959228515625, -0.055698394775390625, -0.05120086669921875, -0.046703338623046875, -0.042205810546875, -0.037708282470703125, -0.03321075439453125, -0.028713226318359375, -0.0242156982421875, -0.019718170166015625, -0.01522064208984375, -0.010723114013671875, -0.0062255859375, -0.001728057861328125, 0.00276947021484375, 0.007266998291015625, 0.0117645263671875, 0.016262054443359375, 0.02075958251953125, 0.025257110595703125, 0.029754638671875, 0.034252166748046875, 0.03874969482421875, 0.043247222900390625, 0.0477447509765625, 0.052242279052734375, 0.05673980712890625, 0.061237335205078125, 0.06573486328125, 0.07023239135742188, 0.07472991943359375, 0.07922744750976562, 0.0837249755859375, 0.08822250366210938, 0.09272003173828125, 0.09721755981445312, 0.101715087890625, 0.10621261596679688, 0.11071014404296875, 0.11520767211914062, 0.1197052001953125, 0.12420272827148438, 0.12870025634765625, 0.13319778442382812, 0.1376953125]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 5.0, 5.0, 9.0, 7.0, 10.0, 7.0, 13.0, 13.0, 19.0, 17.0, 20.0, 26.0, 23.0, 37.0, 45.0, 43.0, 43.0, 45.0, 52.0, 44.0, 51.0, 44.0, 59.0, 48.0, 45.0, 38.0, 39.0, 42.0, 22.0, 27.0, 20.0, 20.0, 14.0, 9.0, 9.0, 4.0, 5.0, 4.0, 8.0, 5.0, 6.0, 1.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1444091796875e-05, -1.1081807315349579e-05, -1.0719522833824158e-05, -1.0357238352298737e-05, -9.994953870773315e-06, -9.632669389247894e-06, -9.270384907722473e-06, -8.908100426197052e-06, -8.545815944671631e-06, -8.18353146314621e-06, -7.821246981620789e-06, -7.4589625000953674e-06, -7.096678018569946e-06, -6.734393537044525e-06, -6.372109055519104e-06, -6.009824573993683e-06, -5.647540092468262e-06, -5.2852556109428406e-06, -4.9229711294174194e-06, -4.560686647891998e-06, -4.198402166366577e-06, -3.836117684841156e-06, -3.473833203315735e-06, -3.1115487217903137e-06, -2.7492642402648926e-06, -2.3869797587394714e-06, -2.0246952772140503e-06, -1.6624107956886292e-06, -1.300126314163208e-06, -9.378418326377869e-07, -5.755573511123657e-07, -2.1327286958694458e-07, 1.4901161193847656e-07, 5.112960934638977e-07, 8.735805749893188e-07, 1.23586505651474e-06, 1.5981495380401611e-06, 1.9604340195655823e-06, 2.3227185010910034e-06, 2.6850029826164246e-06, 3.0472874641418457e-06, 3.409571945667267e-06, 3.771856427192688e-06, 4.134140908718109e-06, 4.49642539024353e-06, 4.858709871768951e-06, 5.2209943532943726e-06, 5.583278834819794e-06, 5.945563316345215e-06, 6.307847797870636e-06, 6.670132279396057e-06, 7.032416760921478e-06, 7.394701242446899e-06, 7.75698572397232e-06, 8.119270205497742e-06, 8.481554687023163e-06, 8.843839168548584e-06, 9.206123650074005e-06, 9.568408131599426e-06, 9.930692613124847e-06, 1.0292977094650269e-05, 1.065526157617569e-05, 1.101754605770111e-05, 1.1379830539226532e-05, 1.1742115020751953e-05]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 7.0, 7.0, 10.0, 9.0, 19.0, 24.0, 27.0, 58.0, 57.0, 86.0, 121.0, 202.0, 259.0, 362.0, 523.0, 846.0, 1242.0, 1885.0, 2895.0, 4493.0, 7051.0, 11239.0, 18519.0, 30211.0, 52008.0, 91546.0, 161165.0, 238176.0, 177908.0, 101484.0, 58089.0, 33536.0, 20217.0, 12411.0, 7767.0, 4781.0, 3144.0, 2045.0, 1360.0, 865.0, 565.0, 399.0, 291.0, 198.0, 132.0, 107.0, 67.0, 43.0, 45.0, 23.0, 18.0, 11.0, 3.0, 8.0, 2.0, 3.0, 0.0, 2.0], "bins": [-0.11126708984375, -0.1079549789428711, -0.10464286804199219, -0.10133075714111328, -0.09801864624023438, -0.09470653533935547, -0.09139442443847656, -0.08808231353759766, -0.08477020263671875, -0.08145809173583984, -0.07814598083496094, -0.07483386993408203, -0.07152175903320312, -0.06820964813232422, -0.06489753723144531, -0.061585426330566406, -0.0582733154296875, -0.054961204528808594, -0.05164909362792969, -0.04833698272705078, -0.045024871826171875, -0.04171276092529297, -0.03840065002441406, -0.035088539123535156, -0.03177642822265625, -0.028464317321777344, -0.025152206420898438, -0.02184009552001953, -0.018527984619140625, -0.015215873718261719, -0.011903762817382812, -0.008591651916503906, -0.005279541015625, -0.0019674301147460938, 0.0013446807861328125, 0.004656791687011719, 0.007968902587890625, 0.011281013488769531, 0.014593124389648438, 0.017905235290527344, 0.02121734619140625, 0.024529457092285156, 0.027841567993164062, 0.03115367889404297, 0.034465789794921875, 0.03777790069580078, 0.04109001159667969, 0.044402122497558594, 0.0477142333984375, 0.051026344299316406, 0.05433845520019531, 0.05765056610107422, 0.060962677001953125, 0.06427478790283203, 0.06758689880371094, 0.07089900970458984, 0.07421112060546875, 0.07752323150634766, 0.08083534240722656, 0.08414745330810547, 0.08745956420898438, 0.09077167510986328, 0.09408378601074219, 0.0973958969116211, 0.1007080078125]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 0.0, 1.0, 4.0, 5.0, 5.0, 3.0, 5.0, 8.0, 12.0, 14.0, 18.0, 22.0, 24.0, 29.0, 45.0, 47.0, 70.0, 94.0, 88.0, 87.0, 74.0, 79.0, 55.0, 45.0, 34.0, 29.0, 24.0, 13.0, 16.0, 17.0, 12.0, 9.0, 5.0, 2.0, 6.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.051605224609375, -0.050080299377441406, -0.04855537414550781, -0.04703044891357422, -0.045505523681640625, -0.04398059844970703, -0.04245567321777344, -0.040930747985839844, -0.03940582275390625, -0.037880897521972656, -0.03635597229003906, -0.03483104705810547, -0.033306121826171875, -0.03178119659423828, -0.030256271362304688, -0.028731346130371094, -0.0272064208984375, -0.025681495666503906, -0.024156570434570312, -0.02263164520263672, -0.021106719970703125, -0.01958179473876953, -0.018056869506835938, -0.016531944274902344, -0.01500701904296875, -0.013482093811035156, -0.011957168579101562, -0.010432243347167969, -0.008907318115234375, -0.007382392883300781, -0.0058574676513671875, -0.004332542419433594, -0.0028076171875, -0.0012826919555664062, 0.0002422332763671875, 0.0017671585083007812, 0.003292083740234375, 0.004817008972167969, 0.0063419342041015625, 0.007866859436035156, 0.00939178466796875, 0.010916709899902344, 0.012441635131835938, 0.013966560363769531, 0.015491485595703125, 0.01701641082763672, 0.018541336059570312, 0.020066261291503906, 0.0215911865234375, 0.023116111755371094, 0.024641036987304688, 0.02616596221923828, 0.027690887451171875, 0.02921581268310547, 0.030740737915039062, 0.032265663146972656, 0.03379058837890625, 0.035315513610839844, 0.03684043884277344, 0.03836536407470703, 0.039890289306640625, 0.04141521453857422, 0.04294013977050781, 0.044465065002441406, 0.045989990234375]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 11.0, 6.0, 10.0, 12.0, 17.0, 19.0, 23.0, 21.0, 35.0, 46.0, 55.0, 64.0, 56.0, 70.0, 66.0, 70.0, 66.0, 69.0, 51.0, 40.0, 45.0, 32.0, 23.0, 17.0, 16.0, 23.0, 8.0, 6.0, 10.0, 5.0, 3.0, 4.0, 3.0, 5.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.38602352142334, -10.060490608215332, -9.734957695007324, -9.409423828125, -9.083890914916992, -8.758358001708984, -8.432825088500977, -8.107292175292969, -7.7817583084106445, -7.456225395202637, -7.130692005157471, -6.805159091949463, -6.479625701904297, -6.154092788696289, -5.828559875488281, -5.503026485443115, -5.177493572235107, -4.8519606590271, -4.526427268981934, -4.200894355773926, -3.8753609657287598, -3.549828052520752, -3.224294900894165, -2.898761749267578, -2.573228597640991, -2.2476954460144043, -1.9221622943878174, -1.59662926197052, -1.271096110343933, -0.9455629587173462, -0.6200299263000488, -0.2944967746734619, 0.031036376953125, 0.3565694987773895, 0.682102620601654, 1.0076357126235962, 1.333168864250183, 1.65870201587677, 1.9842350482940674, 2.3097681999206543, 2.635301351547241, 2.960834503173828, 3.286367654800415, 3.611900806427002, 3.9374337196350098, 4.262967109680176, 4.588500022888184, 4.914032936096191, 5.239566326141357, 5.565099239349365, 5.890632629394531, 6.216165542602539, 6.541698932647705, 6.867231845855713, 7.192765235900879, 7.518298149108887, 7.8438310623168945, 8.169363975524902, 8.49489688873291, 8.820430755615234, 9.145963668823242, 9.47149658203125, 9.797029495239258, 10.122562408447266, 10.44809627532959]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 7.0, 4.0, 12.0, 9.0, 15.0, 14.0, 11.0, 12.0, 22.0, 17.0, 26.0, 30.0, 26.0, 29.0, 39.0, 40.0, 49.0, 46.0, 45.0, 51.0, 53.0, 41.0, 40.0, 23.0, 38.0, 41.0, 32.0, 32.0, 23.0, 30.0, 23.0, 18.0, 21.0, 15.0, 12.0, 13.0, 11.0, 8.0, 7.0, 7.0, 3.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-8.618572235107422, -8.366349220275879, -8.11412525177002, -7.861902236938477, -7.609678745269775, -7.357455253601074, -7.105231761932373, -6.853008270263672, -6.600785255432129, -6.348561763763428, -6.096338272094727, -5.844115257263184, -5.591891765594482, -5.339668273925781, -5.08744478225708, -4.835221290588379, -4.582997798919678, -4.330774307250977, -4.078550815582275, -3.8263275623321533, -3.5741043090820312, -3.32188081741333, -3.069657325744629, -2.8174338340759277, -2.5652105808258057, -2.3129870891571045, -2.0607638359069824, -1.8085403442382812, -1.5563169717788696, -1.304093599319458, -1.0518701076507568, -0.7996467351913452, -0.5474233627319336, -0.2951999604701996, -0.042976558208465576, 0.20924687385559082, 0.46147024631500244, 0.7136936187744141, 0.9659171104431152, 1.2181404829025269, 1.4703638553619385, 1.72258722782135, 1.9748106002807617, 2.227034091949463, 2.479257583618164, 2.731480836868286, 2.9837043285369873, 3.2359275817871094, 3.4881510734558105, 3.7403745651245117, 3.992597818374634, 4.244821548461914, 4.497044563293457, 4.749268054962158, 5.001491546630859, 5.2537150382995605, 5.505938529968262, 5.758162021636963, 6.010385513305664, 6.262608528137207, 6.514832019805908, 6.767055511474609, 7.0192790031433105, 7.271502494812012, 7.523725509643555]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 8.0, 4.0, 11.0, 21.0, 22.0, 57.0, 55.0, 86.0, 143.0, 177.0, 283.0, 379.0, 642.0, 884.0, 1226.0, 1850.0, 2762.0, 4179.0, 6183.0, 9078.0, 13426.0, 19354.0, 28252.0, 39401.0, 54075.0, 70759.0, 89029.0, 102913.0, 110501.0, 107174.0, 95124.0, 78995.0, 61152.0, 45758.0, 32739.0, 23018.0, 15844.0, 10744.0, 7219.0, 4949.0, 3315.0, 2212.0, 1470.0, 950.0, 701.0, 425.0, 346.0, 213.0, 146.0, 116.0, 65.0, 48.0, 35.0, 22.0, 14.0, 7.0, 4.0, 7.0], "bins": [-4.44140625, -4.3134765625, -4.185546875, -4.0576171875, -3.9296875, -3.8017578125, -3.673828125, -3.5458984375, -3.41796875, -3.2900390625, -3.162109375, -3.0341796875, -2.90625, -2.7783203125, -2.650390625, -2.5224609375, -2.39453125, -2.2666015625, -2.138671875, -2.0107421875, -1.8828125, -1.7548828125, -1.626953125, -1.4990234375, -1.37109375, -1.2431640625, -1.115234375, -0.9873046875, -0.859375, -0.7314453125, -0.603515625, -0.4755859375, -0.34765625, -0.2197265625, -0.091796875, 0.0361328125, 0.1640625, 0.2919921875, 0.419921875, 0.5478515625, 0.67578125, 0.8037109375, 0.931640625, 1.0595703125, 1.1875, 1.3154296875, 1.443359375, 1.5712890625, 1.69921875, 1.8271484375, 1.955078125, 2.0830078125, 2.2109375, 2.3388671875, 2.466796875, 2.5947265625, 2.72265625, 2.8505859375, 2.978515625, 3.1064453125, 3.234375, 3.3623046875, 3.490234375, 3.6181640625, 3.74609375]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 1.0, 7.0, 5.0, 7.0, 12.0, 12.0, 10.0, 13.0, 16.0, 23.0, 20.0, 12.0, 17.0, 22.0, 19.0, 35.0, 37.0, 44.0, 40.0, 53.0, 42.0, 42.0, 37.0, 45.0, 49.0, 19.0, 24.0, 27.0, 31.0, 38.0, 31.0, 27.0, 23.0, 23.0, 18.0, 28.0, 11.0, 15.0, 9.0, 14.0, 8.0, 8.0, 5.0, 6.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0], "bins": [-7.1484375, -6.91522216796875, -6.6820068359375, -6.44879150390625, -6.215576171875, -5.98236083984375, -5.7491455078125, -5.51593017578125, -5.28271484375, -5.04949951171875, -4.8162841796875, -4.58306884765625, -4.349853515625, -4.11663818359375, -3.8834228515625, -3.65020751953125, -3.4169921875, -3.18377685546875, -2.9505615234375, -2.71734619140625, -2.484130859375, -2.25091552734375, -2.0177001953125, -1.78448486328125, -1.55126953125, -1.31805419921875, -1.0848388671875, -0.85162353515625, -0.618408203125, -0.38519287109375, -0.1519775390625, 0.08123779296875, 0.314453125, 0.54766845703125, 0.7808837890625, 1.01409912109375, 1.247314453125, 1.48052978515625, 1.7137451171875, 1.94696044921875, 2.18017578125, 2.41339111328125, 2.6466064453125, 2.87982177734375, 3.113037109375, 3.34625244140625, 3.5794677734375, 3.81268310546875, 4.0458984375, 4.27911376953125, 4.5123291015625, 4.74554443359375, 4.978759765625, 5.21197509765625, 5.4451904296875, 5.67840576171875, 5.91162109375, 6.14483642578125, 6.3780517578125, 6.61126708984375, 6.844482421875, 7.07769775390625, 7.3109130859375, 7.54412841796875, 7.77734375]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 7.0, 3.0, 4.0, 11.0, 14.0, 28.0, 42.0, 63.0, 96.0, 163.0, 245.0, 414.0, 633.0, 986.0, 1505.0, 2414.0, 3640.0, 5361.0, 8211.0, 12475.0, 18697.0, 27441.0, 39391.0, 54680.0, 72774.0, 91234.0, 106769.0, 113444.0, 109466.0, 97527.0, 80247.0, 60878.0, 44515.0, 31343.0, 21446.0, 14525.0, 9621.0, 6362.0, 4133.0, 2790.0, 1765.0, 1195.0, 705.0, 474.0, 314.0, 175.0, 114.0, 84.0, 47.0, 39.0, 27.0, 11.0, 8.0, 8.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.939453125, -3.806732177734375, -3.67401123046875, -3.541290283203125, -3.4085693359375, -3.275848388671875, -3.14312744140625, -3.010406494140625, -2.877685546875, -2.744964599609375, -2.61224365234375, -2.479522705078125, -2.3468017578125, -2.214080810546875, -2.08135986328125, -1.948638916015625, -1.81591796875, -1.683197021484375, -1.55047607421875, -1.417755126953125, -1.2850341796875, -1.152313232421875, -1.01959228515625, -0.886871337890625, -0.754150390625, -0.621429443359375, -0.48870849609375, -0.355987548828125, -0.2232666015625, -0.090545654296875, 0.04217529296875, 0.174896240234375, 0.3076171875, 0.440338134765625, 0.57305908203125, 0.705780029296875, 0.8385009765625, 0.971221923828125, 1.10394287109375, 1.236663818359375, 1.369384765625, 1.502105712890625, 1.63482666015625, 1.767547607421875, 1.9002685546875, 2.032989501953125, 2.16571044921875, 2.298431396484375, 2.43115234375, 2.563873291015625, 2.69659423828125, 2.829315185546875, 2.9620361328125, 3.094757080078125, 3.22747802734375, 3.360198974609375, 3.492919921875, 3.625640869140625, 3.75836181640625, 3.891082763671875, 4.0238037109375, 4.156524658203125, 4.28924560546875, 4.421966552734375, 4.5546875]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 9.0, 5.0, 7.0, 4.0, 11.0, 10.0, 8.0, 19.0, 13.0, 15.0, 16.0, 15.0, 20.0, 31.0, 33.0, 33.0, 36.0, 37.0, 30.0, 38.0, 43.0, 42.0, 45.0, 45.0, 42.0, 36.0, 44.0, 27.0, 27.0, 34.0, 19.0, 23.0, 33.0, 21.0, 15.0, 20.0, 23.0, 13.0, 19.0, 9.0, 16.0, 7.0, 5.0, 6.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.6484375, -4.50140380859375, -4.3543701171875, -4.20733642578125, -4.060302734375, -3.91326904296875, -3.7662353515625, -3.61920166015625, -3.47216796875, -3.32513427734375, -3.1781005859375, -3.03106689453125, -2.884033203125, -2.73699951171875, -2.5899658203125, -2.44293212890625, -2.2958984375, -2.14886474609375, -2.0018310546875, -1.85479736328125, -1.707763671875, -1.56072998046875, -1.4136962890625, -1.26666259765625, -1.11962890625, -0.97259521484375, -0.8255615234375, -0.67852783203125, -0.531494140625, -0.38446044921875, -0.2374267578125, -0.09039306640625, 0.056640625, 0.20367431640625, 0.3507080078125, 0.49774169921875, 0.644775390625, 0.79180908203125, 0.9388427734375, 1.08587646484375, 1.23291015625, 1.37994384765625, 1.5269775390625, 1.67401123046875, 1.821044921875, 1.96807861328125, 2.1151123046875, 2.26214599609375, 2.4091796875, 2.55621337890625, 2.7032470703125, 2.85028076171875, 2.997314453125, 3.14434814453125, 3.2913818359375, 3.43841552734375, 3.58544921875, 3.73248291015625, 3.8795166015625, 4.02655029296875, 4.173583984375, 4.32061767578125, 4.4676513671875, 4.61468505859375, 4.76171875]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 3.0, 5.0, 11.0, 12.0, 12.0, 13.0, 26.0, 31.0, 83.0, 111.0, 165.0, 242.0, 381.0, 595.0, 903.0, 1393.0, 2118.0, 3294.0, 5142.0, 7784.0, 11664.0, 17706.0, 26138.0, 38528.0, 54796.0, 73726.0, 92124.0, 108467.0, 115646.0, 111804.0, 98635.0, 81060.0, 61199.0, 44034.0, 30313.0, 20876.0, 13820.0, 8842.0, 5732.0, 3938.0, 2518.0, 1607.0, 1080.0, 691.0, 469.0, 299.0, 181.0, 120.0, 81.0, 47.0, 35.0, 24.0, 13.0, 18.0, 8.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.49609375, -1.4456939697265625, -1.395294189453125, -1.3448944091796875, -1.29449462890625, -1.2440948486328125, -1.193695068359375, -1.1432952880859375, -1.0928955078125, -1.0424957275390625, -0.992095947265625, -0.9416961669921875, -0.89129638671875, -0.8408966064453125, -0.790496826171875, -0.7400970458984375, -0.689697265625, -0.6392974853515625, -0.588897705078125, -0.5384979248046875, -0.48809814453125, -0.4376983642578125, -0.387298583984375, -0.3368988037109375, -0.2864990234375, -0.2360992431640625, -0.185699462890625, -0.1352996826171875, -0.08489990234375, -0.0345001220703125, 0.015899658203125, 0.0662994384765625, 0.11669921875, 0.1670989990234375, 0.217498779296875, 0.2678985595703125, 0.31829833984375, 0.3686981201171875, 0.419097900390625, 0.4694976806640625, 0.5198974609375, 0.5702972412109375, 0.620697021484375, 0.6710968017578125, 0.72149658203125, 0.7718963623046875, 0.822296142578125, 0.8726959228515625, 0.923095703125, 0.9734954833984375, 1.023895263671875, 1.0742950439453125, 1.12469482421875, 1.1750946044921875, 1.225494384765625, 1.2758941650390625, 1.3262939453125, 1.3766937255859375, 1.427093505859375, 1.4774932861328125, 1.52789306640625, 1.5782928466796875, 1.628692626953125, 1.6790924072265625, 1.7294921875]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 7.0, 4.0, 5.0, 4.0, 8.0, 14.0, 9.0, 10.0, 11.0, 19.0, 28.0, 34.0, 28.0, 26.0, 30.0, 40.0, 49.0, 46.0, 38.0, 38.0, 46.0, 46.0, 42.0, 47.0, 55.0, 31.0, 36.0, 41.0, 32.0, 28.0, 28.0, 18.0, 16.0, 14.0, 11.0, 15.0, 12.0, 7.0, 6.0, 10.0, 3.0, 4.0, 5.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001608133316040039, -0.00015539862215518951, -0.00014998391270637512, -0.00014456920325756073, -0.00013915449380874634, -0.00013373978435993195, -0.00012832507491111755, -0.00012291036546230316, -0.00011749565601348877, -0.00011208094656467438, -0.00010666623711585999, -0.0001012515276670456, -9.58368182182312e-05, -9.042210876941681e-05, -8.500739932060242e-05, -7.959268987178802e-05, -7.417798042297363e-05, -6.876327097415924e-05, -6.334856152534485e-05, -5.7933852076530457e-05, -5.2519142627716064e-05, -4.710443317890167e-05, -4.168972373008728e-05, -3.627501428127289e-05, -3.0860304832458496e-05, -2.5445595383644104e-05, -2.0030885934829712e-05, -1.461617648601532e-05, -9.201467037200928e-06, -3.7867575883865356e-06, 1.6279518604278564e-06, 7.0426613092422485e-06, 1.245737075805664e-05, 1.7872080206871033e-05, 2.3286789655685425e-05, 2.8701499104499817e-05, 3.411620855331421e-05, 3.95309180021286e-05, 4.494562745094299e-05, 5.0360336899757385e-05, 5.577504634857178e-05, 6.118975579738617e-05, 6.660446524620056e-05, 7.201917469501495e-05, 7.743388414382935e-05, 8.284859359264374e-05, 8.826330304145813e-05, 9.367801249027252e-05, 9.909272193908691e-05, 0.0001045074313879013, 0.0001099221408367157, 0.00011533685028553009, 0.00012075155973434448, 0.00012616626918315887, 0.00013158097863197327, 0.00013699568808078766, 0.00014241039752960205, 0.00014782510697841644, 0.00015323981642723083, 0.00015865452587604523, 0.00016406923532485962, 0.000169483944773674, 0.0001748986542224884, 0.0001803133636713028, 0.0001857280731201172]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 5.0, 5.0, 13.0, 13.0, 17.0, 20.0, 34.0, 80.0, 100.0, 172.0, 254.0, 372.0, 568.0, 927.0, 1384.0, 2218.0, 3695.0, 5775.0, 9355.0, 15117.0, 23795.0, 36310.0, 54735.0, 77456.0, 102556.0, 122656.0, 130607.0, 122955.0, 102508.0, 78176.0, 55078.0, 37096.0, 23771.0, 15169.0, 9348.0, 5957.0, 3845.0, 2420.0, 1429.0, 946.0, 568.0, 352.0, 257.0, 179.0, 93.0, 58.0, 51.0, 31.0, 15.0, 12.0, 8.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.79296875, -1.7342071533203125, -1.675445556640625, -1.6166839599609375, -1.55792236328125, -1.4991607666015625, -1.440399169921875, -1.3816375732421875, -1.3228759765625, -1.2641143798828125, -1.205352783203125, -1.1465911865234375, -1.08782958984375, -1.0290679931640625, -0.970306396484375, -0.9115447998046875, -0.852783203125, -0.7940216064453125, -0.735260009765625, -0.6764984130859375, -0.61773681640625, -0.5589752197265625, -0.500213623046875, -0.4414520263671875, -0.3826904296875, -0.3239288330078125, -0.265167236328125, -0.2064056396484375, -0.14764404296875, -0.0888824462890625, -0.030120849609375, 0.0286407470703125, 0.08740234375, 0.1461639404296875, 0.204925537109375, 0.2636871337890625, 0.32244873046875, 0.3812103271484375, 0.439971923828125, 0.4987335205078125, 0.5574951171875, 0.6162567138671875, 0.675018310546875, 0.7337799072265625, 0.79254150390625, 0.8513031005859375, 0.910064697265625, 0.9688262939453125, 1.027587890625, 1.0863494873046875, 1.145111083984375, 1.2038726806640625, 1.26263427734375, 1.3213958740234375, 1.380157470703125, 1.4389190673828125, 1.4976806640625, 1.5564422607421875, 1.615203857421875, 1.6739654541015625, 1.73272705078125, 1.7914886474609375, 1.850250244140625, 1.9090118408203125, 1.9677734375]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 0.0, 5.0, 4.0, 5.0, 4.0, 7.0, 12.0, 11.0, 7.0, 15.0, 12.0, 16.0, 26.0, 19.0, 29.0, 43.0, 36.0, 20.0, 42.0, 51.0, 49.0, 63.0, 45.0, 45.0, 62.0, 43.0, 47.0, 48.0, 33.0, 37.0, 27.0, 29.0, 21.0, 17.0, 14.0, 10.0, 8.0, 11.0, 7.0, 9.0, 3.0, 4.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.8779296875, -0.8516464233398438, -0.8253631591796875, -0.7990798950195312, -0.772796630859375, -0.7465133666992188, -0.7202301025390625, -0.6939468383789062, -0.66766357421875, -0.6413803100585938, -0.6150970458984375, -0.5888137817382812, -0.562530517578125, -0.5362472534179688, -0.5099639892578125, -0.48368072509765625, -0.4573974609375, -0.43111419677734375, -0.4048309326171875, -0.37854766845703125, -0.352264404296875, -0.32598114013671875, -0.2996978759765625, -0.27341461181640625, -0.24713134765625, -0.22084808349609375, -0.1945648193359375, -0.16828155517578125, -0.141998291015625, -0.11571502685546875, -0.0894317626953125, -0.06314849853515625, -0.036865234375, -0.01058197021484375, 0.0157012939453125, 0.04198455810546875, 0.068267822265625, 0.09455108642578125, 0.1208343505859375, 0.14711761474609375, 0.17340087890625, 0.19968414306640625, 0.2259674072265625, 0.25225067138671875, 0.278533935546875, 0.30481719970703125, 0.3311004638671875, 0.35738372802734375, 0.3836669921875, 0.40995025634765625, 0.4362335205078125, 0.46251678466796875, 0.488800048828125, 0.5150833129882812, 0.5413665771484375, 0.5676498413085938, 0.59393310546875, 0.6202163696289062, 0.6464996337890625, 0.6727828979492188, 0.699066162109375, 0.7253494262695312, 0.7516326904296875, 0.7779159545898438, 0.80419921875]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 7.0, 6.0, 7.0, 12.0, 14.0, 22.0, 20.0, 26.0, 27.0, 38.0, 53.0, 53.0, 76.0, 70.0, 72.0, 73.0, 58.0, 73.0, 58.0, 46.0, 48.0, 24.0, 30.0, 17.0, 21.0, 20.0, 10.0, 5.0, 7.0, 2.0, 3.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.807265281677246, -10.46921157836914, -10.131156921386719, -9.793103218078613, -9.455049514770508, -9.116994857788086, -8.77894115447998, -8.440887451171875, -8.102832794189453, -7.7647786140441895, -7.426724433898926, -7.08867073059082, -6.750616550445557, -6.412562370300293, -6.0745086669921875, -5.736454486846924, -5.39840030670166, -5.0603461265563965, -4.722291946411133, -4.384238243103027, -4.046184062957764, -3.7081298828125, -3.3700759410858154, -3.032021999359131, -2.693967819213867, -2.3559136390686035, -2.017859697341919, -1.6798056364059448, -1.3417515754699707, -1.0036975145339966, -0.6656434535980225, -0.3275895118713379, 0.010465621948242188, 0.3485196828842163, 0.6865737438201904, 1.0246278047561646, 1.3626818656921387, 1.7007359266281128, 2.038789987564087, 2.3768439292907715, 2.714898109436035, 3.052952289581299, 3.3910062313079834, 3.729060173034668, 4.067114353179932, 4.405168533325195, 4.743222236633301, 5.0812764167785645, 5.419330596923828, 5.757384777069092, 6.0954389572143555, 6.433492660522461, 6.771546840667725, 7.109601020812988, 7.447654724121094, 7.785708904266357, 8.123763084411621, 8.461816787719727, 8.799871444702148, 9.137925148010254, 9.47597885131836, 9.814033508300781, 10.152087211608887, 10.490140914916992, 10.828195571899414]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 4.0, 7.0, 5.0, 11.0, 12.0, 11.0, 11.0, 10.0, 10.0, 25.0, 20.0, 25.0, 29.0, 23.0, 25.0, 36.0, 35.0, 41.0, 52.0, 35.0, 43.0, 50.0, 44.0, 44.0, 50.0, 41.0, 32.0, 26.0, 24.0, 20.0, 21.0, 22.0, 27.0, 25.0, 22.0, 15.0, 20.0, 10.0, 9.0, 10.0, 5.0, 8.0, 4.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0], "bins": [-8.298343658447266, -8.04475212097168, -7.791159629821777, -7.537567615509033, -7.283975601196289, -7.030383586883545, -6.776791572570801, -6.523199558258057, -6.2696075439453125, -6.016015529632568, -5.762423515319824, -5.50883150100708, -5.255239486694336, -5.001647472381592, -4.748055458068848, -4.4944634437561035, -4.240871429443359, -3.9872794151306152, -3.733687400817871, -3.480095386505127, -3.226503372192383, -2.9729113578796387, -2.7193193435668945, -2.4657273292541504, -2.2121353149414062, -1.958543300628662, -1.704951286315918, -1.4513592720031738, -1.1977672576904297, -0.9441752433776855, -0.6905832290649414, -0.43699121475219727, -0.18339920043945312, 0.07019281387329102, 0.32378482818603516, 0.5773768424987793, 0.8309688568115234, 1.0845608711242676, 1.3381528854370117, 1.5917448997497559, 1.8453369140625, 2.098928928375244, 2.3525209426879883, 2.6061129570007324, 2.8597049713134766, 3.1132969856262207, 3.366888999938965, 3.620481014251709, 3.874073028564453, 4.127665042877197, 4.381257057189941, 4.6348490715026855, 4.88844108581543, 5.142033100128174, 5.395625114440918, 5.649217128753662, 5.902809143066406, 6.15640115737915, 6.4099931716918945, 6.663585186004639, 6.917177200317383, 7.170769214630127, 7.424361228942871, 7.677953243255615, 7.931545257568359]}, "gradients/decoder.bert.encoder.layer.3.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 8.0, 3.0, 8.0, 8.0, 10.0, 29.0, 56.0, 64.0, 97.0, 163.0, 260.0, 344.0, 549.0, 893.0, 1295.0, 2021.0, 3179.0, 4804.0, 7623.0, 11789.0, 18676.0, 29400.0, 47207.0, 75269.0, 119330.0, 185981.0, 280904.0, 398181.0, 514038.0, 575105.0, 547109.0, 444442.0, 325044.0, 219116.0, 141891.0, 89218.0, 56486.0, 35024.0, 21606.0, 13809.0, 8607.0, 5262.0, 3355.0, 2158.0, 1379.0, 900.0, 578.0, 368.0, 225.0, 168.0, 85.0, 65.0, 35.0, 31.0, 14.0, 10.0, 7.0, 7.0, 3.0, 1.0], "bins": [-6.9765625, -6.76959228515625, -6.5626220703125, -6.35565185546875, -6.148681640625, -5.94171142578125, -5.7347412109375, -5.52777099609375, -5.32080078125, -5.11383056640625, -4.9068603515625, -4.69989013671875, -4.492919921875, -4.28594970703125, -4.0789794921875, -3.87200927734375, -3.6650390625, -3.45806884765625, -3.2510986328125, -3.04412841796875, -2.837158203125, -2.63018798828125, -2.4232177734375, -2.21624755859375, -2.00927734375, -1.80230712890625, -1.5953369140625, -1.38836669921875, -1.181396484375, -0.97442626953125, -0.7674560546875, -0.56048583984375, -0.353515625, -0.14654541015625, 0.0604248046875, 0.26739501953125, 0.474365234375, 0.68133544921875, 0.8883056640625, 1.09527587890625, 1.30224609375, 1.50921630859375, 1.7161865234375, 1.92315673828125, 2.130126953125, 2.33709716796875, 2.5440673828125, 2.75103759765625, 2.9580078125, 3.16497802734375, 3.3719482421875, 3.57891845703125, 3.785888671875, 3.99285888671875, 4.1998291015625, 4.40679931640625, 4.61376953125, 4.82073974609375, 5.0277099609375, 5.23468017578125, 5.441650390625, 5.64862060546875, 5.8555908203125, 6.06256103515625, 6.26953125]}, "gradients/decoder.bert.encoder.layer.3.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 6.0, 4.0, 7.0, 7.0, 6.0, 12.0, 9.0, 11.0, 12.0, 23.0, 16.0, 19.0, 23.0, 23.0, 31.0, 26.0, 32.0, 29.0, 43.0, 41.0, 40.0, 45.0, 41.0, 51.0, 46.0, 42.0, 35.0, 38.0, 29.0, 23.0, 29.0, 26.0, 21.0, 17.0, 27.0, 20.0, 17.0, 16.0, 17.0, 11.0, 9.0, 10.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 3.0, 1.0, 1.0, 2.0], "bins": [-6.42578125, -6.23114013671875, -6.0364990234375, -5.84185791015625, -5.647216796875, -5.45257568359375, -5.2579345703125, -5.06329345703125, -4.86865234375, -4.67401123046875, -4.4793701171875, -4.28472900390625, -4.090087890625, -3.89544677734375, -3.7008056640625, -3.50616455078125, -3.3115234375, -3.11688232421875, -2.9222412109375, -2.72760009765625, -2.532958984375, -2.33831787109375, -2.1436767578125, -1.94903564453125, -1.75439453125, -1.55975341796875, -1.3651123046875, -1.17047119140625, -0.975830078125, -0.78118896484375, -0.5865478515625, -0.39190673828125, -0.197265625, -0.00262451171875, 0.1920166015625, 0.38665771484375, 0.581298828125, 0.77593994140625, 0.9705810546875, 1.16522216796875, 1.35986328125, 1.55450439453125, 1.7491455078125, 1.94378662109375, 2.138427734375, 2.33306884765625, 2.5277099609375, 2.72235107421875, 2.9169921875, 3.11163330078125, 3.3062744140625, 3.50091552734375, 3.695556640625, 3.89019775390625, 4.0848388671875, 4.27947998046875, 4.47412109375, 4.66876220703125, 4.8634033203125, 5.05804443359375, 5.252685546875, 5.44732666015625, 5.6419677734375, 5.83660888671875, 6.03125]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 4.0, 6.0, 10.0, 15.0, 20.0, 28.0, 42.0, 83.0, 152.0, 250.0, 361.0, 616.0, 1050.0, 1725.0, 2880.0, 4741.0, 8173.0, 13794.0, 22778.0, 39035.0, 64141.0, 104956.0, 168767.0, 255070.0, 365082.0, 474907.0, 549370.0, 550349.0, 481957.0, 372673.0, 263378.0, 173231.0, 109170.0, 66299.0, 40140.0, 24039.0, 14286.0, 8485.0, 4845.0, 2892.0, 1786.0, 1063.0, 611.0, 384.0, 239.0, 169.0, 101.0, 65.0, 25.0, 21.0, 15.0, 4.0, 3.0, 6.0, 2.0, 2.0, 0.0, 1.0], "bins": [-7.73046875, -7.4964599609375, -7.262451171875, -7.0284423828125, -6.79443359375, -6.5604248046875, -6.326416015625, -6.0924072265625, -5.8583984375, -5.6243896484375, -5.390380859375, -5.1563720703125, -4.92236328125, -4.6883544921875, -4.454345703125, -4.2203369140625, -3.986328125, -3.7523193359375, -3.518310546875, -3.2843017578125, -3.05029296875, -2.8162841796875, -2.582275390625, -2.3482666015625, -2.1142578125, -1.8802490234375, -1.646240234375, -1.4122314453125, -1.17822265625, -0.9442138671875, -0.710205078125, -0.4761962890625, -0.2421875, -0.0081787109375, 0.225830078125, 0.4598388671875, 0.69384765625, 0.9278564453125, 1.161865234375, 1.3958740234375, 1.6298828125, 1.8638916015625, 2.097900390625, 2.3319091796875, 2.56591796875, 2.7999267578125, 3.033935546875, 3.2679443359375, 3.501953125, 3.7359619140625, 3.969970703125, 4.2039794921875, 4.43798828125, 4.6719970703125, 4.906005859375, 5.1400146484375, 5.3740234375, 5.6080322265625, 5.842041015625, 6.0760498046875, 6.31005859375, 6.5440673828125, 6.778076171875, 7.0120849609375, 7.24609375]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 3.0, 2.0, 12.0, 15.0, 16.0, 22.0, 19.0, 35.0, 46.0, 52.0, 71.0, 91.0, 99.0, 127.0, 135.0, 141.0, 166.0, 209.0, 205.0, 235.0, 209.0, 252.0, 195.0, 214.0, 212.0, 210.0, 155.0, 160.0, 121.0, 123.0, 78.0, 78.0, 81.0, 67.0, 46.0, 45.0, 23.0, 26.0, 23.0, 11.0, 14.0, 7.0, 10.0, 3.0, 6.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-3.66796875, -3.559112548828125, -3.45025634765625, -3.341400146484375, -3.2325439453125, -3.123687744140625, -3.01483154296875, -2.905975341796875, -2.797119140625, -2.688262939453125, -2.57940673828125, -2.470550537109375, -2.3616943359375, -2.252838134765625, -2.14398193359375, -2.035125732421875, -1.92626953125, -1.817413330078125, -1.70855712890625, -1.599700927734375, -1.4908447265625, -1.381988525390625, -1.27313232421875, -1.164276123046875, -1.055419921875, -0.946563720703125, -0.83770751953125, -0.728851318359375, -0.6199951171875, -0.511138916015625, -0.40228271484375, -0.293426513671875, -0.1845703125, -0.075714111328125, 0.03314208984375, 0.141998291015625, 0.2508544921875, 0.359710693359375, 0.46856689453125, 0.577423095703125, 0.686279296875, 0.795135498046875, 0.90399169921875, 1.012847900390625, 1.1217041015625, 1.230560302734375, 1.33941650390625, 1.448272705078125, 1.55712890625, 1.665985107421875, 1.77484130859375, 1.883697509765625, 1.9925537109375, 2.101409912109375, 2.21026611328125, 2.319122314453125, 2.427978515625, 2.536834716796875, 2.64569091796875, 2.754547119140625, 2.8634033203125, 2.972259521484375, 3.08111572265625, 3.189971923828125, 3.298828125]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 8.0, 3.0, 4.0, 7.0, 7.0, 14.0, 20.0, 14.0, 22.0, 27.0, 33.0, 30.0, 36.0, 28.0, 60.0, 51.0, 40.0, 43.0, 41.0, 49.0, 52.0, 56.0, 47.0, 43.0, 32.0, 43.0, 40.0, 33.0, 12.0, 14.0, 14.0, 15.0, 26.0, 9.0, 7.0, 6.0, 3.0, 1.0, 4.0, 1.0, 2.0, 5.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.248176574707031, -8.941280364990234, -8.634384155273438, -8.32748794555664, -8.020591735839844, -7.713695526123047, -7.40679931640625, -7.099903106689453, -6.793006896972656, -6.486110687255859, -6.1792144775390625, -5.872318267822266, -5.565422058105469, -5.258525848388672, -4.951629638671875, -4.644733428955078, -4.3378376960754395, -4.030941486358643, -3.7240452766418457, -3.417149066925049, -3.110252857208252, -2.803356647491455, -2.4964606761932373, -2.1895644664764404, -1.8826682567596436, -1.5757720470428467, -1.2688758373260498, -0.9619797468185425, -0.6550835371017456, -0.34818732738494873, -0.041291236877441406, 0.26560497283935547, 0.5725011825561523, 0.8793973922729492, 1.186293601989746, 1.4931896924972534, 1.8000859022140503, 2.1069822311401367, 2.4138782024383545, 2.7207744121551514, 3.0276706218719482, 3.334566831588745, 3.641463041305542, 3.9483590126037598, 4.255255222320557, 4.5621514320373535, 4.86904764175415, 5.175943851470947, 5.482840061187744, 5.789736270904541, 6.096632480621338, 6.403528690338135, 6.710424900054932, 7.0173211097717285, 7.324216842651367, 7.631113052368164, 7.938009262084961, 8.244905471801758, 8.551801681518555, 8.858697891235352, 9.165594100952148, 9.472490310668945, 9.779386520385742, 10.086282730102539, 10.393178939819336]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 1.0, 3.0, 1.0, 8.0, 6.0, 9.0, 13.0, 15.0, 14.0, 18.0, 18.0, 11.0, 25.0, 25.0, 23.0, 26.0, 42.0, 47.0, 46.0, 29.0, 47.0, 42.0, 37.0, 37.0, 46.0, 48.0, 44.0, 33.0, 34.0, 35.0, 36.0, 24.0, 24.0, 24.0, 21.0, 18.0, 11.0, 25.0, 11.0, 6.0, 2.0, 4.0, 1.0, 3.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-10.251880645751953, -9.955938339233398, -9.659996032714844, -9.364054679870605, -9.06811237335205, -8.772170066833496, -8.476227760314941, -8.180285453796387, -7.88434362411499, -7.5884013175964355, -7.292459487915039, -6.996517181396484, -6.70057487487793, -6.404633045196533, -6.1086907386779785, -5.812748908996582, -5.516806602478027, -5.220864295959473, -4.924922466278076, -4.6289801597595215, -4.333038330078125, -4.03709602355957, -3.7411537170410156, -3.44521164894104, -3.1492695808410645, -2.853327512741089, -2.5573854446411133, -2.2614431381225586, -1.965501070022583, -1.6695590019226074, -1.3736168146133423, -1.0776746273040771, -0.7817325592041016, -0.4857904314994812, -0.18984830379486084, 0.10609382390975952, 0.4020359516143799, 0.6979780197143555, 0.9939202070236206, 1.2898623943328857, 1.5858044624328613, 1.881746530532837, 2.1776885986328125, 2.473630905151367, 2.7695729732513428, 3.0655150413513184, 3.361457347869873, 3.6573994159698486, 3.953341484069824, 4.249283790588379, 4.545225620269775, 4.84116792678833, 5.137109756469727, 5.433052062988281, 5.728994369506836, 6.024936676025391, 6.320878505706787, 6.616820812225342, 6.912762641906738, 7.208704948425293, 7.504647254943848, 7.800589084625244, 8.09653091430664, 8.392473220825195, 8.68841552734375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 2.0, 5.0, 11.0, 15.0, 17.0, 20.0, 32.0, 61.0, 79.0, 125.0, 197.0, 260.0, 381.0, 548.0, 904.0, 1318.0, 1975.0, 3107.0, 4726.0, 7263.0, 11244.0, 17472.0, 27286.0, 43038.0, 67894.0, 105552.0, 152112.0, 179637.0, 146598.0, 99516.0, 63897.0, 40248.0, 25630.0, 16537.0, 10619.0, 6873.0, 4619.0, 3010.0, 1894.0, 1289.0, 859.0, 572.0, 350.0, 248.0, 153.0, 113.0, 79.0, 54.0, 42.0, 25.0, 18.0, 13.0, 11.0, 5.0, 9.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.177734375, -1.1390380859375, -1.100341796875, -1.0616455078125, -1.02294921875, -0.9842529296875, -0.945556640625, -0.9068603515625, -0.8681640625, -0.8294677734375, -0.790771484375, -0.7520751953125, -0.71337890625, -0.6746826171875, -0.635986328125, -0.5972900390625, -0.55859375, -0.5198974609375, -0.481201171875, -0.4425048828125, -0.40380859375, -0.3651123046875, -0.326416015625, -0.2877197265625, -0.2490234375, -0.2103271484375, -0.171630859375, -0.1329345703125, -0.09423828125, -0.0555419921875, -0.016845703125, 0.0218505859375, 0.060546875, 0.0992431640625, 0.137939453125, 0.1766357421875, 0.21533203125, 0.2540283203125, 0.292724609375, 0.3314208984375, 0.3701171875, 0.4088134765625, 0.447509765625, 0.4862060546875, 0.52490234375, 0.5635986328125, 0.602294921875, 0.6409912109375, 0.6796875, 0.7183837890625, 0.757080078125, 0.7957763671875, 0.83447265625, 0.8731689453125, 0.911865234375, 0.9505615234375, 0.9892578125, 1.0279541015625, 1.066650390625, 1.1053466796875, 1.14404296875, 1.1827392578125, 1.221435546875, 1.2601318359375, 1.298828125]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 6.0, 2.0, 4.0, 8.0, 3.0, 6.0, 9.0, 2.0, 18.0, 8.0, 27.0, 24.0, 24.0, 29.0, 34.0, 38.0, 37.0, 38.0, 50.0, 38.0, 50.0, 44.0, 37.0, 49.0, 43.0, 36.0, 42.0, 49.0, 37.0, 32.0, 32.0, 17.0, 22.0, 18.0, 22.0, 19.0, 13.0, 12.0, 8.0, 6.0, 6.0, 2.0, 5.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.578125, -10.2496337890625, -9.921142578125, -9.5926513671875, -9.26416015625, -8.9356689453125, -8.607177734375, -8.2786865234375, -7.9501953125, -7.6217041015625, -7.293212890625, -6.9647216796875, -6.63623046875, -6.3077392578125, -5.979248046875, -5.6507568359375, -5.322265625, -4.9937744140625, -4.665283203125, -4.3367919921875, -4.00830078125, -3.6798095703125, -3.351318359375, -3.0228271484375, -2.6943359375, -2.3658447265625, -2.037353515625, -1.7088623046875, -1.38037109375, -1.0518798828125, -0.723388671875, -0.3948974609375, -0.06640625, 0.2620849609375, 0.590576171875, 0.9190673828125, 1.24755859375, 1.5760498046875, 1.904541015625, 2.2330322265625, 2.5615234375, 2.8900146484375, 3.218505859375, 3.5469970703125, 3.87548828125, 4.2039794921875, 4.532470703125, 4.8609619140625, 5.189453125, 5.5179443359375, 5.846435546875, 6.1749267578125, 6.50341796875, 6.8319091796875, 7.160400390625, 7.4888916015625, 7.8173828125, 8.1458740234375, 8.474365234375, 8.8028564453125, 9.13134765625, 9.4598388671875, 9.788330078125, 10.1168212890625, 10.4453125]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 5.0, 9.0, 17.0, 18.0, 49.0, 68.0, 81.0, 146.0, 234.0, 312.0, 525.0, 772.0, 1285.0, 2144.0, 3267.0, 5198.0, 8055.0, 12422.0, 19740.0, 31061.0, 49708.0, 77646.0, 120244.0, 170979.0, 178071.0, 131108.0, 85909.0, 54296.0, 34686.0, 22063.0, 13780.0, 8755.0, 5695.0, 3681.0, 2339.0, 1539.0, 968.0, 611.0, 373.0, 268.0, 155.0, 96.0, 66.0, 45.0, 25.0, 19.0, 7.0, 3.0, 7.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3349609375, -1.2920379638671875, -1.249114990234375, -1.2061920166015625, -1.16326904296875, -1.1203460693359375, -1.077423095703125, -1.0345001220703125, -0.9915771484375, -0.9486541748046875, -0.905731201171875, -0.8628082275390625, -0.81988525390625, -0.7769622802734375, -0.734039306640625, -0.6911163330078125, -0.648193359375, -0.6052703857421875, -0.562347412109375, -0.5194244384765625, -0.47650146484375, -0.4335784912109375, -0.390655517578125, -0.3477325439453125, -0.3048095703125, -0.2618865966796875, -0.218963623046875, -0.1760406494140625, -0.13311767578125, -0.0901947021484375, -0.047271728515625, -0.0043487548828125, 0.03857421875, 0.0814971923828125, 0.124420166015625, 0.1673431396484375, 0.21026611328125, 0.2531890869140625, 0.296112060546875, 0.3390350341796875, 0.3819580078125, 0.4248809814453125, 0.467803955078125, 0.5107269287109375, 0.55364990234375, 0.5965728759765625, 0.639495849609375, 0.6824188232421875, 0.725341796875, 0.7682647705078125, 0.811187744140625, 0.8541107177734375, 0.89703369140625, 0.9399566650390625, 0.982879638671875, 1.0258026123046875, 1.0687255859375, 1.1116485595703125, 1.154571533203125, 1.1974945068359375, 1.24041748046875, 1.2833404541015625, 1.326263427734375, 1.3691864013671875, 1.412109375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 4.0, 9.0, 13.0, 15.0, 15.0, 23.0, 20.0, 20.0, 28.0, 28.0, 33.0, 39.0, 40.0, 31.0, 40.0, 51.0, 47.0, 44.0, 43.0, 41.0, 66.0, 47.0, 33.0, 35.0, 34.0, 35.0, 23.0, 22.0, 26.0, 15.0, 23.0, 13.0, 9.0, 8.0, 7.0, 8.0, 1.0, 3.0, 6.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.44140625, -5.23028564453125, -5.0191650390625, -4.80804443359375, -4.596923828125, -4.38580322265625, -4.1746826171875, -3.96356201171875, -3.75244140625, -3.54132080078125, -3.3302001953125, -3.11907958984375, -2.907958984375, -2.69683837890625, -2.4857177734375, -2.27459716796875, -2.0634765625, -1.85235595703125, -1.6412353515625, -1.43011474609375, -1.218994140625, -1.00787353515625, -0.7967529296875, -0.58563232421875, -0.37451171875, -0.16339111328125, 0.0477294921875, 0.25885009765625, 0.469970703125, 0.68109130859375, 0.8922119140625, 1.10333251953125, 1.314453125, 1.52557373046875, 1.7366943359375, 1.94781494140625, 2.158935546875, 2.37005615234375, 2.5811767578125, 2.79229736328125, 3.00341796875, 3.21453857421875, 3.4256591796875, 3.63677978515625, 3.847900390625, 4.05902099609375, 4.2701416015625, 4.48126220703125, 4.6923828125, 4.90350341796875, 5.1146240234375, 5.32574462890625, 5.536865234375, 5.74798583984375, 5.9591064453125, 6.17022705078125, 6.38134765625, 6.59246826171875, 6.8035888671875, 7.01470947265625, 7.225830078125, 7.43695068359375, 7.6480712890625, 7.85919189453125, 8.0703125]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 5.0, 7.0, 16.0, 15.0, 22.0, 41.0, 69.0, 94.0, 131.0, 246.0, 466.0, 850.0, 1709.0, 3492.0, 7775.0, 18473.0, 47834.0, 137690.0, 386643.0, 286641.0, 95995.0, 34869.0, 13789.0, 6002.0, 2692.0, 1376.0, 661.0, 351.0, 216.0, 131.0, 77.0, 63.0, 36.0, 27.0, 13.0, 8.0, 8.0, 3.0, 5.0, 3.0, 7.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.19189453125, -0.1860504150390625, -0.180206298828125, -0.1743621826171875, -0.16851806640625, -0.1626739501953125, -0.156829833984375, -0.1509857177734375, -0.1451416015625, -0.1392974853515625, -0.133453369140625, -0.1276092529296875, -0.12176513671875, -0.1159210205078125, -0.110076904296875, -0.1042327880859375, -0.098388671875, -0.0925445556640625, -0.086700439453125, -0.0808563232421875, -0.07501220703125, -0.0691680908203125, -0.063323974609375, -0.0574798583984375, -0.0516357421875, -0.0457916259765625, -0.039947509765625, -0.0341033935546875, -0.02825927734375, -0.0224151611328125, -0.016571044921875, -0.0107269287109375, -0.0048828125, 0.0009613037109375, 0.006805419921875, 0.0126495361328125, 0.01849365234375, 0.0243377685546875, 0.030181884765625, 0.0360260009765625, 0.0418701171875, 0.0477142333984375, 0.053558349609375, 0.0594024658203125, 0.06524658203125, 0.0710906982421875, 0.076934814453125, 0.0827789306640625, 0.088623046875, 0.0944671630859375, 0.100311279296875, 0.1061553955078125, 0.11199951171875, 0.1178436279296875, 0.123687744140625, 0.1295318603515625, 0.1353759765625, 0.1412200927734375, 0.147064208984375, 0.1529083251953125, 0.15875244140625, 0.1645965576171875, 0.170440673828125, 0.1762847900390625, 0.18212890625]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 5.0, 8.0, 7.0, 7.0, 14.0, 6.0, 15.0, 22.0, 17.0, 18.0, 23.0, 22.0, 32.0, 34.0, 50.0, 26.0, 43.0, 41.0, 39.0, 47.0, 47.0, 44.0, 49.0, 28.0, 44.0, 44.0, 28.0, 24.0, 35.0, 24.0, 28.0, 20.0, 22.0, 9.0, 15.0, 14.0, 7.0, 12.0, 6.0, 5.0, 5.0, 7.0, 3.0, 1.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1861324310302734e-05, -1.1473894119262695e-05, -1.1086463928222656e-05, -1.0699033737182617e-05, -1.0311603546142578e-05, -9.924173355102539e-06, -9.5367431640625e-06, -9.149312973022461e-06, -8.761882781982422e-06, -8.374452590942383e-06, -7.987022399902344e-06, -7.599592208862305e-06, -7.212162017822266e-06, -6.8247318267822266e-06, -6.4373016357421875e-06, -6.0498714447021484e-06, -5.662441253662109e-06, -5.27501106262207e-06, -4.887580871582031e-06, -4.500150680541992e-06, -4.112720489501953e-06, -3.725290298461914e-06, -3.337860107421875e-06, -2.950429916381836e-06, -2.562999725341797e-06, -2.175569534301758e-06, -1.7881393432617188e-06, -1.4007091522216797e-06, -1.0132789611816406e-06, -6.258487701416016e-07, -2.384185791015625e-07, 1.4901161193847656e-07, 5.364418029785156e-07, 9.238719940185547e-07, 1.3113021850585938e-06, 1.6987323760986328e-06, 2.086162567138672e-06, 2.473592758178711e-06, 2.86102294921875e-06, 3.248453140258789e-06, 3.635883331298828e-06, 4.023313522338867e-06, 4.410743713378906e-06, 4.798173904418945e-06, 5.185604095458984e-06, 5.5730342864990234e-06, 5.9604644775390625e-06, 6.3478946685791016e-06, 6.735324859619141e-06, 7.12275505065918e-06, 7.510185241699219e-06, 7.897615432739258e-06, 8.285045623779297e-06, 8.672475814819336e-06, 9.059906005859375e-06, 9.447336196899414e-06, 9.834766387939453e-06, 1.0222196578979492e-05, 1.0609626770019531e-05, 1.099705696105957e-05, 1.138448715209961e-05, 1.1771917343139648e-05, 1.2159347534179688e-05, 1.2546777725219727e-05, 1.2934207916259766e-05]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 7.0, 10.0, 3.0, 12.0, 17.0, 17.0, 31.0, 40.0, 62.0, 109.0, 176.0, 259.0, 392.0, 611.0, 1054.0, 1610.0, 2948.0, 5337.0, 10757.0, 23206.0, 54317.0, 143772.0, 361886.0, 268167.0, 98861.0, 39330.0, 17262.0, 8069.0, 4167.0, 2388.0, 1336.0, 885.0, 549.0, 307.0, 193.0, 129.0, 100.0, 55.0, 46.0, 31.0, 23.0, 8.0, 5.0, 3.0, 5.0, 8.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2296142578125, -0.22216224670410156, -0.21471023559570312, -0.2072582244873047, -0.19980621337890625, -0.1923542022705078, -0.18490219116210938, -0.17745018005371094, -0.1699981689453125, -0.16254615783691406, -0.15509414672851562, -0.1476421356201172, -0.14019012451171875, -0.1327381134033203, -0.12528610229492188, -0.11783409118652344, -0.110382080078125, -0.10293006896972656, -0.09547805786132812, -0.08802604675292969, -0.08057403564453125, -0.07312202453613281, -0.06567001342773438, -0.05821800231933594, -0.0507659912109375, -0.04331398010253906, -0.035861968994140625, -0.028409957885742188, -0.02095794677734375, -0.013505935668945312, -0.006053924560546875, 0.0013980865478515625, 0.00885009765625, 0.016302108764648438, 0.023754119873046875, 0.031206130981445312, 0.03865814208984375, 0.04611015319824219, 0.053562164306640625, 0.06101417541503906, 0.0684661865234375, 0.07591819763183594, 0.08337020874023438, 0.09082221984863281, 0.09827423095703125, 0.10572624206542969, 0.11317825317382812, 0.12063026428222656, 0.128082275390625, 0.13553428649902344, 0.14298629760742188, 0.1504383087158203, 0.15789031982421875, 0.1653423309326172, 0.17279434204101562, 0.18024635314941406, 0.1876983642578125, 0.19515037536621094, 0.20260238647460938, 0.2100543975830078, 0.21750640869140625, 0.2249584197998047, 0.23241043090820312, 0.23986244201660156, 0.247314453125]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 9.0, 2.0, 5.0, 4.0, 10.0, 8.0, 8.0, 17.0, 15.0, 31.0, 27.0, 39.0, 35.0, 45.0, 63.0, 85.0, 97.0, 102.0, 82.0, 62.0, 55.0, 37.0, 38.0, 30.0, 17.0, 22.0, 15.0, 15.0, 10.0, 5.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.095947265625, -0.09334373474121094, -0.09074020385742188, -0.08813667297363281, -0.08553314208984375, -0.08292961120605469, -0.08032608032226562, -0.07772254943847656, -0.0751190185546875, -0.07251548767089844, -0.06991195678710938, -0.06730842590332031, -0.06470489501953125, -0.06210136413574219, -0.059497833251953125, -0.05689430236816406, -0.054290771484375, -0.05168724060058594, -0.049083709716796875, -0.04648017883300781, -0.04387664794921875, -0.04127311706542969, -0.038669586181640625, -0.03606605529785156, -0.0334625244140625, -0.030858993530273438, -0.028255462646484375, -0.025651931762695312, -0.02304840087890625, -0.020444869995117188, -0.017841339111328125, -0.015237808227539062, -0.01263427734375, -0.010030746459960938, -0.007427215576171875, -0.0048236846923828125, -0.00222015380859375, 0.0003833770751953125, 0.002986907958984375, 0.0055904388427734375, 0.0081939697265625, 0.010797500610351562, 0.013401031494140625, 0.016004562377929688, 0.01860809326171875, 0.021211624145507812, 0.023815155029296875, 0.026418685913085938, 0.029022216796875, 0.03162574768066406, 0.034229278564453125, 0.03683280944824219, 0.03943634033203125, 0.04203987121582031, 0.044643402099609375, 0.04724693298339844, 0.0498504638671875, 0.05245399475097656, 0.055057525634765625, 0.05766105651855469, 0.06026458740234375, 0.06286811828613281, 0.06547164916992188, 0.06807518005371094, 0.0706787109375]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 6.0, 4.0, 5.0, 8.0, 3.0, 9.0, 15.0, 20.0, 18.0, 21.0, 30.0, 32.0, 26.0, 34.0, 35.0, 59.0, 42.0, 44.0, 47.0, 40.0, 38.0, 59.0, 59.0, 45.0, 33.0, 43.0, 37.0, 40.0, 34.0, 11.0, 15.0, 14.0, 13.0, 25.0, 10.0, 9.0, 3.0, 5.0, 1.0, 2.0, 2.0, 4.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-9.292303085327148, -8.992376327514648, -8.692448616027832, -8.392521858215332, -8.092595100402832, -7.792667388916016, -7.492740631103516, -7.192813396453857, -6.892886161804199, -6.592958927154541, -6.293032169342041, -5.993104934692383, -5.693177700042725, -5.393250465393066, -5.093323707580566, -4.793396472930908, -4.493469715118408, -4.19354248046875, -3.893615484237671, -3.593688488006592, -3.2937612533569336, -2.9938342571258545, -2.6939072608947754, -2.393980026245117, -2.094053030014038, -1.7941259145736694, -1.4941987991333008, -1.1942718029022217, -0.894344687461853, -0.5944175720214844, -0.2944905757904053, 0.00543665885925293, 0.30536365509033203, 0.6052907705307007, 0.9052178263664246, 1.2051448822021484, 1.505071997642517, 1.8049991130828857, 2.104926109313965, 2.404853343963623, 2.704780340194702, 3.0047073364257812, 3.3046345710754395, 3.6045615673065186, 3.9044885635375977, 4.204415798187256, 4.504343032836914, 4.804269790649414, 5.104197025299072, 5.4041242599487305, 5.7040510177612305, 6.003978252410889, 6.303905487060547, 6.603832244873047, 6.903759479522705, 7.203686714172363, 7.503613471984863, 7.8035407066345215, 8.10346794128418, 8.40339469909668, 8.70332145690918, 9.003249168395996, 9.303175926208496, 9.603103637695312, 9.903030395507812]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 2.0, 3.0, 1.0, 7.0, 7.0, 8.0, 14.0, 13.0, 16.0, 16.0, 20.0, 10.0, 24.0, 26.0, 24.0, 25.0, 42.0, 46.0, 47.0, 30.0, 47.0, 43.0, 39.0, 35.0, 46.0, 47.0, 46.0, 35.0, 30.0, 38.0, 32.0, 26.0, 25.0, 22.0, 21.0, 19.0, 13.0, 22.0, 11.0, 5.0, 4.0, 3.0, 1.0, 3.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-10.280278205871582, -9.983506202697754, -9.686734199523926, -9.389962196350098, -9.09319019317627, -8.796418190002441, -8.499646186828613, -8.202873229980469, -7.906101703643799, -7.609329700469971, -7.312557697296143, -7.0157856941223145, -6.719013214111328, -6.4222412109375, -6.125469207763672, -5.828697204589844, -5.531925201416016, -5.2351531982421875, -4.938381195068359, -4.641609191894531, -4.344837188720703, -4.048065185546875, -3.7512927055358887, -3.4545207023620605, -3.1577486991882324, -2.8609766960144043, -2.564204692840576, -2.267432451248169, -1.9706604480743408, -1.6738884449005127, -1.377116322517395, -1.0803442001342773, -0.7835721969604492, -0.4868001341819763, -0.19002807140350342, 0.10674399137496948, 0.4035160541534424, 0.7002880573272705, 0.9970601797103882, 1.2938323020935059, 1.590604305267334, 1.887376308441162, 2.1841483116149902, 2.4809205532073975, 2.7776925563812256, 3.0744645595550537, 3.371236801147461, 3.668008804321289, 3.964780807495117, 4.261552810668945, 4.558324813842773, 4.855096817016602, 5.15186882019043, 5.448640823364258, 5.745413303375244, 6.042185306549072, 6.3389573097229, 6.6357293128967285, 6.932501316070557, 7.229273319244385, 7.526045799255371, 7.822817802429199, 8.119589805603027, 8.416361808776855, 8.713133811950684]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 5.0, 4.0, 12.0, 11.0, 24.0, 24.0, 38.0, 62.0, 108.0, 173.0, 264.0, 431.0, 698.0, 1108.0, 1713.0, 2729.0, 4476.0, 7121.0, 11474.0, 18131.0, 28628.0, 43725.0, 63738.0, 87176.0, 111495.0, 127105.0, 128988.0, 115922.0, 92884.0, 68319.0, 47381.0, 31482.0, 19732.0, 12623.0, 7710.0, 4889.0, 2995.0, 1859.0, 1245.0, 728.0, 467.0, 311.0, 209.0, 145.0, 69.0, 45.0, 23.0, 23.0, 20.0, 12.0, 6.0, 6.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.33203125, -5.1549072265625, -4.977783203125, -4.8006591796875, -4.62353515625, -4.4464111328125, -4.269287109375, -4.0921630859375, -3.9150390625, -3.7379150390625, -3.560791015625, -3.3836669921875, -3.20654296875, -3.0294189453125, -2.852294921875, -2.6751708984375, -2.498046875, -2.3209228515625, -2.143798828125, -1.9666748046875, -1.78955078125, -1.6124267578125, -1.435302734375, -1.2581787109375, -1.0810546875, -0.9039306640625, -0.726806640625, -0.5496826171875, -0.37255859375, -0.1954345703125, -0.018310546875, 0.1588134765625, 0.3359375, 0.5130615234375, 0.690185546875, 0.8673095703125, 1.04443359375, 1.2215576171875, 1.398681640625, 1.5758056640625, 1.7529296875, 1.9300537109375, 2.107177734375, 2.2843017578125, 2.46142578125, 2.6385498046875, 2.815673828125, 2.9927978515625, 3.169921875, 3.3470458984375, 3.524169921875, 3.7012939453125, 3.87841796875, 4.0555419921875, 4.232666015625, 4.4097900390625, 4.5869140625, 4.7640380859375, 4.941162109375, 5.1182861328125, 5.29541015625, 5.4725341796875, 5.649658203125, 5.8267822265625, 6.00390625]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 1.0, 2.0, 10.0, 8.0, 8.0, 15.0, 14.0, 13.0, 17.0, 17.0, 23.0, 16.0, 23.0, 41.0, 33.0, 34.0, 34.0, 38.0, 42.0, 44.0, 40.0, 56.0, 53.0, 46.0, 42.0, 46.0, 30.0, 33.0, 28.0, 33.0, 24.0, 35.0, 22.0, 18.0, 15.0, 9.0, 11.0, 10.0, 6.0, 7.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-11.1953125, -10.876953125, -10.55859375, -10.240234375, -9.921875, -9.603515625, -9.28515625, -8.966796875, -8.6484375, -8.330078125, -8.01171875, -7.693359375, -7.375, -7.056640625, -6.73828125, -6.419921875, -6.1015625, -5.783203125, -5.46484375, -5.146484375, -4.828125, -4.509765625, -4.19140625, -3.873046875, -3.5546875, -3.236328125, -2.91796875, -2.599609375, -2.28125, -1.962890625, -1.64453125, -1.326171875, -1.0078125, -0.689453125, -0.37109375, -0.052734375, 0.265625, 0.583984375, 0.90234375, 1.220703125, 1.5390625, 1.857421875, 2.17578125, 2.494140625, 2.8125, 3.130859375, 3.44921875, 3.767578125, 4.0859375, 4.404296875, 4.72265625, 5.041015625, 5.359375, 5.677734375, 5.99609375, 6.314453125, 6.6328125, 6.951171875, 7.26953125, 7.587890625, 7.90625, 8.224609375, 8.54296875, 8.861328125, 9.1796875]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 6.0, 7.0, 9.0, 9.0, 14.0, 28.0, 44.0, 72.0, 125.0, 169.0, 325.0, 518.0, 890.0, 1418.0, 2461.0, 4228.0, 6887.0, 11375.0, 18397.0, 28983.0, 44565.0, 65864.0, 91157.0, 114175.0, 130120.0, 130162.0, 115291.0, 91821.0, 67321.0, 45641.0, 29230.0, 18413.0, 11399.0, 6745.0, 4279.0, 2485.0, 1531.0, 921.0, 574.0, 328.0, 233.0, 127.0, 73.0, 50.0, 36.0, 24.0, 19.0, 7.0, 5.0, 1.0, 2.0, 1.0, 1.0, 3.0], "bins": [-6.34765625, -6.1663818359375, -5.985107421875, -5.8038330078125, -5.62255859375, -5.4412841796875, -5.260009765625, -5.0787353515625, -4.8974609375, -4.7161865234375, -4.534912109375, -4.3536376953125, -4.17236328125, -3.9910888671875, -3.809814453125, -3.6285400390625, -3.447265625, -3.2659912109375, -3.084716796875, -2.9034423828125, -2.72216796875, -2.5408935546875, -2.359619140625, -2.1783447265625, -1.9970703125, -1.8157958984375, -1.634521484375, -1.4532470703125, -1.27197265625, -1.0906982421875, -0.909423828125, -0.7281494140625, -0.546875, -0.3656005859375, -0.184326171875, -0.0030517578125, 0.17822265625, 0.3594970703125, 0.540771484375, 0.7220458984375, 0.9033203125, 1.0845947265625, 1.265869140625, 1.4471435546875, 1.62841796875, 1.8096923828125, 1.990966796875, 2.1722412109375, 2.353515625, 2.5347900390625, 2.716064453125, 2.8973388671875, 3.07861328125, 3.2598876953125, 3.441162109375, 3.6224365234375, 3.8037109375, 3.9849853515625, 4.166259765625, 4.3475341796875, 4.52880859375, 4.7100830078125, 4.891357421875, 5.0726318359375, 5.25390625]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 2.0, 4.0, 13.0, 13.0, 10.0, 13.0, 9.0, 18.0, 19.0, 30.0, 24.0, 29.0, 42.0, 44.0, 35.0, 36.0, 49.0, 42.0, 43.0, 39.0, 40.0, 36.0, 44.0, 35.0, 36.0, 29.0, 35.0, 35.0, 34.0, 22.0, 26.0, 17.0, 14.0, 20.0, 12.0, 10.0, 11.0, 8.0, 5.0, 6.0, 9.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-6.71484375, -6.52337646484375, -6.3319091796875, -6.14044189453125, -5.948974609375, -5.75750732421875, -5.5660400390625, -5.37457275390625, -5.18310546875, -4.99163818359375, -4.8001708984375, -4.60870361328125, -4.417236328125, -4.22576904296875, -4.0343017578125, -3.84283447265625, -3.6513671875, -3.45989990234375, -3.2684326171875, -3.07696533203125, -2.885498046875, -2.69403076171875, -2.5025634765625, -2.31109619140625, -2.11962890625, -1.92816162109375, -1.7366943359375, -1.54522705078125, -1.353759765625, -1.16229248046875, -0.9708251953125, -0.77935791015625, -0.587890625, -0.39642333984375, -0.2049560546875, -0.01348876953125, 0.177978515625, 0.36944580078125, 0.5609130859375, 0.75238037109375, 0.94384765625, 1.13531494140625, 1.3267822265625, 1.51824951171875, 1.709716796875, 1.90118408203125, 2.0926513671875, 2.28411865234375, 2.4755859375, 2.66705322265625, 2.8585205078125, 3.04998779296875, 3.241455078125, 3.43292236328125, 3.6243896484375, 3.81585693359375, 4.00732421875, 4.19879150390625, 4.3902587890625, 4.58172607421875, 4.773193359375, 4.96466064453125, 5.1561279296875, 5.34759521484375, 5.5390625]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 3.0, 6.0, 17.0, 16.0, 23.0, 49.0, 82.0, 100.0, 157.0, 260.0, 408.0, 658.0, 1017.0, 1713.0, 2751.0, 4582.0, 7596.0, 12434.0, 20421.0, 32223.0, 49417.0, 71808.0, 96927.0, 119181.0, 130887.0, 128161.0, 110972.0, 85613.0, 61678.0, 41276.0, 25968.0, 16368.0, 10108.0, 6069.0, 3641.0, 2272.0, 1374.0, 876.0, 516.0, 332.0, 227.0, 147.0, 82.0, 48.0, 38.0, 26.0, 11.0, 10.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0], "bins": [-2.216796875, -2.149169921875, -2.08154296875, -2.013916015625, -1.9462890625, -1.878662109375, -1.81103515625, -1.743408203125, -1.67578125, -1.608154296875, -1.54052734375, -1.472900390625, -1.4052734375, -1.337646484375, -1.27001953125, -1.202392578125, -1.134765625, -1.067138671875, -0.99951171875, -0.931884765625, -0.8642578125, -0.796630859375, -0.72900390625, -0.661376953125, -0.59375, -0.526123046875, -0.45849609375, -0.390869140625, -0.3232421875, -0.255615234375, -0.18798828125, -0.120361328125, -0.052734375, 0.014892578125, 0.08251953125, 0.150146484375, 0.2177734375, 0.285400390625, 0.35302734375, 0.420654296875, 0.48828125, 0.555908203125, 0.62353515625, 0.691162109375, 0.7587890625, 0.826416015625, 0.89404296875, 0.961669921875, 1.029296875, 1.096923828125, 1.16455078125, 1.232177734375, 1.2998046875, 1.367431640625, 1.43505859375, 1.502685546875, 1.5703125, 1.637939453125, 1.70556640625, 1.773193359375, 1.8408203125, 1.908447265625, 1.97607421875, 2.043701171875, 2.111328125]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 3.0, 0.0, 6.0, 8.0, 5.0, 7.0, 17.0, 14.0, 19.0, 21.0, 15.0, 16.0, 27.0, 22.0, 45.0, 47.0, 54.0, 48.0, 42.0, 51.0, 56.0, 57.0, 51.0, 43.0, 43.0, 47.0, 48.0, 30.0, 21.0, 33.0, 18.0, 17.0, 18.0, 10.0, 12.0, 6.0, 4.0, 5.0, 4.0, 6.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00021779537200927734, -0.00021044351160526276, -0.00020309165120124817, -0.00019573979079723358, -0.000188387930393219, -0.0001810360699892044, -0.00017368420958518982, -0.00016633234918117523, -0.00015898048877716064, -0.00015162862837314606, -0.00014427676796913147, -0.00013692490756511688, -0.0001295730471611023, -0.0001222211867570877, -0.00011486932635307312, -0.00010751746594905853, -0.00010016560554504395, -9.281374514102936e-05, -8.546188473701477e-05, -7.811002433300018e-05, -7.07581639289856e-05, -6.340630352497101e-05, -5.605444312095642e-05, -4.8702582716941833e-05, -4.1350722312927246e-05, -3.399886190891266e-05, -2.664700150489807e-05, -1.9295141100883484e-05, -1.1943280696868896e-05, -4.591420292854309e-06, 2.7604401111602783e-06, 1.0112300515174866e-05, 1.7464160919189453e-05, 2.481602132320404e-05, 3.216788172721863e-05, 3.9519742131233215e-05, 4.68716025352478e-05, 5.422346293926239e-05, 6.157532334327698e-05, 6.892718374729156e-05, 7.627904415130615e-05, 8.363090455532074e-05, 9.098276495933533e-05, 9.833462536334991e-05, 0.0001056864857673645, 0.00011303834617137909, 0.00012039020657539368, 0.00012774206697940826, 0.00013509392738342285, 0.00014244578778743744, 0.00014979764819145203, 0.00015714950859546661, 0.0001645013689994812, 0.0001718532294034958, 0.00017920508980751038, 0.00018655695021152496, 0.00019390881061553955, 0.00020126067101955414, 0.00020861253142356873, 0.0002159643918275833, 0.0002233162522315979, 0.0002306681126356125, 0.00023801997303962708, 0.00024537183344364166, 0.00025272369384765625]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 9.0, 7.0, 11.0, 17.0, 27.0, 55.0, 78.0, 103.0, 180.0, 272.0, 412.0, 698.0, 1001.0, 1715.0, 2675.0, 4603.0, 7459.0, 12202.0, 20358.0, 33460.0, 54272.0, 80234.0, 110196.0, 134914.0, 143537.0, 131374.0, 104952.0, 75088.0, 49671.0, 31191.0, 18817.0, 11137.0, 6833.0, 4246.0, 2530.0, 1532.0, 991.0, 615.0, 362.0, 256.0, 168.0, 100.0, 66.0, 46.0, 34.0, 16.0, 16.0, 9.0, 5.0, 7.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.451171875, -2.37554931640625, -2.2999267578125, -2.22430419921875, -2.148681640625, -2.07305908203125, -1.9974365234375, -1.92181396484375, -1.84619140625, -1.77056884765625, -1.6949462890625, -1.61932373046875, -1.543701171875, -1.46807861328125, -1.3924560546875, -1.31683349609375, -1.2412109375, -1.16558837890625, -1.0899658203125, -1.01434326171875, -0.938720703125, -0.86309814453125, -0.7874755859375, -0.71185302734375, -0.63623046875, -0.56060791015625, -0.4849853515625, -0.40936279296875, -0.333740234375, -0.25811767578125, -0.1824951171875, -0.10687255859375, -0.03125, 0.04437255859375, 0.1199951171875, 0.19561767578125, 0.271240234375, 0.34686279296875, 0.4224853515625, 0.49810791015625, 0.57373046875, 0.64935302734375, 0.7249755859375, 0.80059814453125, 0.876220703125, 0.95184326171875, 1.0274658203125, 1.10308837890625, 1.1787109375, 1.25433349609375, 1.3299560546875, 1.40557861328125, 1.481201171875, 1.55682373046875, 1.6324462890625, 1.70806884765625, 1.78369140625, 1.85931396484375, 1.9349365234375, 2.01055908203125, 2.086181640625, 2.16180419921875, 2.2374267578125, 2.31304931640625, 2.388671875]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 7.0, 8.0, 6.0, 5.0, 7.0, 11.0, 17.0, 16.0, 23.0, 22.0, 29.0, 31.0, 26.0, 25.0, 37.0, 50.0, 46.0, 48.0, 41.0, 37.0, 55.0, 49.0, 46.0, 46.0, 44.0, 42.0, 40.0, 30.0, 28.0, 20.0, 14.0, 16.0, 9.0, 10.0, 13.0, 12.0, 5.0, 2.0, 7.0, 7.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.79345703125, -0.7685775756835938, -0.7436981201171875, -0.7188186645507812, -0.693939208984375, -0.6690597534179688, -0.6441802978515625, -0.6193008422851562, -0.59442138671875, -0.5695419311523438, -0.5446624755859375, -0.5197830200195312, -0.494903564453125, -0.47002410888671875, -0.4451446533203125, -0.42026519775390625, -0.3953857421875, -0.37050628662109375, -0.3456268310546875, -0.32074737548828125, -0.295867919921875, -0.27098846435546875, -0.2461090087890625, -0.22122955322265625, -0.19635009765625, -0.17147064208984375, -0.1465911865234375, -0.12171173095703125, -0.096832275390625, -0.07195281982421875, -0.0470733642578125, -0.02219390869140625, 0.002685546875, 0.02756500244140625, 0.0524444580078125, 0.07732391357421875, 0.102203369140625, 0.12708282470703125, 0.1519622802734375, 0.17684173583984375, 0.20172119140625, 0.22660064697265625, 0.2514801025390625, 0.27635955810546875, 0.301239013671875, 0.32611846923828125, 0.3509979248046875, 0.37587738037109375, 0.4007568359375, 0.42563629150390625, 0.4505157470703125, 0.47539520263671875, 0.500274658203125, 0.5251541137695312, 0.5500335693359375, 0.5749130249023438, 0.59979248046875, 0.6246719360351562, 0.6495513916015625, 0.6744308471679688, 0.699310302734375, 0.7241897583007812, 0.7490692138671875, 0.7739486694335938, 0.798828125]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 2.0, 6.0, 10.0, 11.0, 5.0, 11.0, 17.0, 24.0, 21.0, 28.0, 26.0, 40.0, 31.0, 41.0, 47.0, 43.0, 49.0, 45.0, 59.0, 39.0, 50.0, 44.0, 43.0, 42.0, 33.0, 27.0, 43.0, 34.0, 24.0, 17.0, 13.0, 14.0, 12.0, 7.0, 11.0, 9.0, 2.0, 6.0, 2.0, 6.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-9.194305419921875, -8.895365715026855, -8.596426963806152, -8.297487258911133, -7.99854850769043, -7.69960880279541, -7.400669574737549, -7.1017303466796875, -6.802791118621826, -6.503851890563965, -6.2049126625061035, -5.905973434448242, -5.607033729553223, -5.3080949783325195, -5.0091552734375, -4.710216045379639, -4.411276817321777, -4.112337589263916, -3.8133983612060547, -3.5144588947296143, -3.215519666671753, -2.9165804386138916, -2.617640972137451, -2.31870174407959, -2.0197625160217285, -1.7208232879638672, -1.4218839406967163, -1.1229445934295654, -0.8240053653717041, -0.5250661373138428, -0.2261267900466919, 0.07281255722045898, 0.3717527389526367, 0.6706920266151428, 0.9696313142776489, 1.2685706615447998, 1.5675098896026611, 1.8664491176605225, 2.165388584136963, 2.464327812194824, 2.7632670402526855, 3.062206268310547, 3.361145496368408, 3.6600849628448486, 3.95902419090271, 4.257963180541992, 4.556902885437012, 4.855842113494873, 5.154781341552734, 5.453720569610596, 5.752659797668457, 6.051599025726318, 6.35053825378418, 6.649477958679199, 6.9484171867370605, 7.247356414794922, 7.546295642852783, 7.8452348709106445, 8.144174575805664, 8.443113327026367, 8.742053031921387, 9.04099178314209, 9.33993148803711, 9.638870239257812, 9.937809944152832]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 4.0, 4.0, 6.0, 4.0, 10.0, 8.0, 8.0, 16.0, 9.0, 12.0, 21.0, 19.0, 28.0, 35.0, 36.0, 33.0, 51.0, 43.0, 44.0, 52.0, 40.0, 44.0, 45.0, 42.0, 36.0, 47.0, 32.0, 40.0, 33.0, 28.0, 29.0, 20.0, 33.0, 24.0, 7.0, 11.0, 17.0, 12.0, 4.0, 2.0, 9.0, 1.0, 3.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.42290210723877, -11.090110778808594, -10.757320404052734, -10.424529075622559, -10.091737747192383, -9.758947372436523, -9.426156044006348, -9.093364715576172, -8.760574340820312, -8.427783012390137, -8.094992637634277, -7.762201309204102, -7.429410457611084, -7.096619606018066, -6.763828277587891, -6.431037425994873, -6.0982465744018555, -5.765455722808838, -5.43266487121582, -5.0998735427856445, -4.767082691192627, -4.434291839599609, -4.101500511169434, -3.768709659576416, -3.4359188079833984, -3.103127956390381, -2.770336866378784, -2.4375457763671875, -2.10475492477417, -1.7719639539718628, -1.4391729831695557, -1.106381893157959, -0.7735910415649414, -0.4408000707626343, -0.10800909996032715, 0.22478187084197998, 0.5575728416442871, 0.8903638124465942, 1.2231547832489014, 1.555945873260498, 1.8887367248535156, 2.221527576446533, 2.55431866645813, 2.8871097564697266, 3.219900608062744, 3.5526914596557617, 3.8854825496673584, 4.218273639678955, 4.551064491271973, 4.88385534286499, 5.216646194458008, 5.549437522888184, 5.882228374481201, 6.215019226074219, 6.5478105545043945, 6.880601406097412, 7.21339225769043, 7.546183109283447, 7.878973960876465, 8.21176528930664, 8.5445556640625, 8.877346992492676, 9.210138320922852, 9.542928695678711, 9.875720024108887]}, "gradients/decoder.bert.encoder.layer.2.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 6.0, 5.0, 14.0, 19.0, 30.0, 56.0, 84.0, 129.0, 195.0, 319.0, 515.0, 925.0, 1415.0, 2426.0, 3815.0, 6463.0, 10896.0, 18625.0, 31347.0, 52706.0, 88678.0, 147961.0, 237452.0, 360811.0, 501075.0, 604000.0, 609511.0, 512391.0, 372910.0, 246958.0, 154641.0, 93272.0, 55612.0, 32236.0, 18977.0, 11245.0, 6734.0, 3899.0, 2279.0, 1385.0, 905.0, 527.0, 323.0, 201.0, 123.0, 67.0, 57.0, 21.0, 19.0, 19.0, 7.0, 2.0, 0.0, 1.0, 0.0, 3.0], "bins": [-9.6953125, -9.410400390625, -9.12548828125, -8.840576171875, -8.5556640625, -8.270751953125, -7.98583984375, -7.700927734375, -7.416015625, -7.131103515625, -6.84619140625, -6.561279296875, -6.2763671875, -5.991455078125, -5.70654296875, -5.421630859375, -5.13671875, -4.851806640625, -4.56689453125, -4.281982421875, -3.9970703125, -3.712158203125, -3.42724609375, -3.142333984375, -2.857421875, -2.572509765625, -2.28759765625, -2.002685546875, -1.7177734375, -1.432861328125, -1.14794921875, -0.863037109375, -0.578125, -0.293212890625, -0.00830078125, 0.276611328125, 0.5615234375, 0.846435546875, 1.13134765625, 1.416259765625, 1.701171875, 1.986083984375, 2.27099609375, 2.555908203125, 2.8408203125, 3.125732421875, 3.41064453125, 3.695556640625, 3.98046875, 4.265380859375, 4.55029296875, 4.835205078125, 5.1201171875, 5.405029296875, 5.68994140625, 5.974853515625, 6.259765625, 6.544677734375, 6.82958984375, 7.114501953125, 7.3994140625, 7.684326171875, 7.96923828125, 8.254150390625, 8.5390625]}, "gradients/decoder.bert.encoder.layer.2.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 4.0, 3.0, 8.0, 4.0, 6.0, 5.0, 13.0, 15.0, 21.0, 14.0, 17.0, 23.0, 29.0, 31.0, 33.0, 36.0, 39.0, 48.0, 42.0, 45.0, 45.0, 41.0, 50.0, 39.0, 44.0, 46.0, 31.0, 39.0, 22.0, 36.0, 26.0, 25.0, 23.0, 15.0, 22.0, 22.0, 9.0, 13.0, 4.0, 3.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-9.5703125, -9.2998046875, -9.029296875, -8.7587890625, -8.48828125, -8.2177734375, -7.947265625, -7.6767578125, -7.40625, -7.1357421875, -6.865234375, -6.5947265625, -6.32421875, -6.0537109375, -5.783203125, -5.5126953125, -5.2421875, -4.9716796875, -4.701171875, -4.4306640625, -4.16015625, -3.8896484375, -3.619140625, -3.3486328125, -3.078125, -2.8076171875, -2.537109375, -2.2666015625, -1.99609375, -1.7255859375, -1.455078125, -1.1845703125, -0.9140625, -0.6435546875, -0.373046875, -0.1025390625, 0.16796875, 0.4384765625, 0.708984375, 0.9794921875, 1.25, 1.5205078125, 1.791015625, 2.0615234375, 2.33203125, 2.6025390625, 2.873046875, 3.1435546875, 3.4140625, 3.6845703125, 3.955078125, 4.2255859375, 4.49609375, 4.7666015625, 5.037109375, 5.3076171875, 5.578125, 5.8486328125, 6.119140625, 6.3896484375, 6.66015625, 6.9306640625, 7.201171875, 7.4716796875, 7.7421875]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 3.0, 7.0, 10.0, 14.0, 20.0, 22.0, 53.0, 90.0, 156.0, 194.0, 320.0, 480.0, 876.0, 1451.0, 2320.0, 3665.0, 6111.0, 9872.0, 15836.0, 25455.0, 40752.0, 63320.0, 98805.0, 148293.0, 215564.0, 300073.0, 387085.0, 459618.0, 494062.0, 474540.0, 411468.0, 324535.0, 238285.0, 166605.0, 110511.0, 71962.0, 45767.0, 28838.0, 17962.0, 11405.0, 6831.0, 4311.0, 2576.0, 1529.0, 1016.0, 612.0, 405.0, 226.0, 149.0, 79.0, 63.0, 31.0, 21.0, 12.0, 8.0, 8.0, 2.0, 5.0, 2.0, 4.0], "bins": [-8.96875, -8.6939697265625, -8.419189453125, -8.1444091796875, -7.86962890625, -7.5948486328125, -7.320068359375, -7.0452880859375, -6.7705078125, -6.4957275390625, -6.220947265625, -5.9461669921875, -5.67138671875, -5.3966064453125, -5.121826171875, -4.8470458984375, -4.572265625, -4.2974853515625, -4.022705078125, -3.7479248046875, -3.47314453125, -3.1983642578125, -2.923583984375, -2.6488037109375, -2.3740234375, -2.0992431640625, -1.824462890625, -1.5496826171875, -1.27490234375, -1.0001220703125, -0.725341796875, -0.4505615234375, -0.17578125, 0.0989990234375, 0.373779296875, 0.6485595703125, 0.92333984375, 1.1981201171875, 1.472900390625, 1.7476806640625, 2.0224609375, 2.2972412109375, 2.572021484375, 2.8468017578125, 3.12158203125, 3.3963623046875, 3.671142578125, 3.9459228515625, 4.220703125, 4.4954833984375, 4.770263671875, 5.0450439453125, 5.31982421875, 5.5946044921875, 5.869384765625, 6.1441650390625, 6.4189453125, 6.6937255859375, 6.968505859375, 7.2432861328125, 7.51806640625, 7.7928466796875, 8.067626953125, 8.3424072265625, 8.6171875]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 9.0, 5.0, 2.0, 8.0, 5.0, 18.0, 21.0, 19.0, 31.0, 28.0, 50.0, 52.0, 68.0, 67.0, 100.0, 126.0, 130.0, 169.0, 163.0, 173.0, 174.0, 215.0, 204.0, 247.0, 243.0, 212.0, 185.0, 203.0, 171.0, 151.0, 123.0, 118.0, 111.0, 103.0, 59.0, 61.0, 57.0, 47.0, 35.0, 27.0, 21.0, 17.0, 15.0, 9.0, 11.0, 6.0, 4.0, 1.0, 4.0, 4.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-4.19140625, -4.05609130859375, -3.9207763671875, -3.78546142578125, -3.650146484375, -3.51483154296875, -3.3795166015625, -3.24420166015625, -3.10888671875, -2.97357177734375, -2.8382568359375, -2.70294189453125, -2.567626953125, -2.43231201171875, -2.2969970703125, -2.16168212890625, -2.0263671875, -1.89105224609375, -1.7557373046875, -1.62042236328125, -1.485107421875, -1.34979248046875, -1.2144775390625, -1.07916259765625, -0.94384765625, -0.80853271484375, -0.6732177734375, -0.53790283203125, -0.402587890625, -0.26727294921875, -0.1319580078125, 0.00335693359375, 0.138671875, 0.27398681640625, 0.4093017578125, 0.54461669921875, 0.679931640625, 0.81524658203125, 0.9505615234375, 1.08587646484375, 1.22119140625, 1.35650634765625, 1.4918212890625, 1.62713623046875, 1.762451171875, 1.89776611328125, 2.0330810546875, 2.16839599609375, 2.3037109375, 2.43902587890625, 2.5743408203125, 2.70965576171875, 2.844970703125, 2.98028564453125, 3.1156005859375, 3.25091552734375, 3.38623046875, 3.52154541015625, 3.6568603515625, 3.79217529296875, 3.927490234375, 4.06280517578125, 4.1981201171875, 4.33343505859375, 4.46875]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 5.0, 4.0, 1.0, 4.0, 2.0, 4.0, 9.0, 7.0, 8.0, 16.0, 11.0, 22.0, 28.0, 27.0, 22.0, 32.0, 29.0, 38.0, 48.0, 42.0, 48.0, 58.0, 56.0, 48.0, 65.0, 43.0, 44.0, 40.0, 40.0, 42.0, 32.0, 26.0, 19.0, 17.0, 17.0, 9.0, 9.0, 10.0, 6.0, 3.0, 9.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.580362319946289, -13.16423511505127, -12.74810791015625, -12.331981658935547, -11.915854454040527, -11.499727249145508, -11.083600044250488, -10.667472839355469, -10.251346588134766, -9.835219383239746, -9.419092178344727, -9.002965927124023, -8.586838722229004, -8.170711517333984, -7.754584312438965, -7.3384575843811035, -6.922330379486084, -6.5062031745910645, -6.090076446533203, -5.673949241638184, -5.257822513580322, -4.841695308685303, -4.425568580627441, -4.009441375732422, -3.5933144092559814, -3.177187442779541, -2.7610604763031006, -2.34493350982666, -1.9288064241409302, -1.5126793384552002, -1.0965523719787598, -0.6804254055023193, -0.2642984390258789, 0.1518285572528839, 0.5679555535316467, 0.9840825796127319, 1.4002095460891724, 1.8163366317749023, 2.2324635982513428, 2.648590564727783, 3.0647175312042236, 3.480844497680664, 3.8969714641571045, 4.313098430633545, 4.7292256355285645, 5.145352363586426, 5.561479568481445, 5.977606773376465, 6.393733501434326, 6.809860706329346, 7.225987434387207, 7.642114639282227, 8.058241844177246, 8.474369049072266, 8.890495300292969, 9.306622505187988, 9.722749710083008, 10.138876914978027, 10.555004119873047, 10.97113037109375, 11.38725757598877, 11.803384780883789, 12.219511985778809, 12.635639190673828, 13.051765441894531]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 7.0, 4.0, 4.0, 7.0, 11.0, 9.0, 18.0, 16.0, 22.0, 32.0, 25.0, 32.0, 41.0, 23.0, 30.0, 47.0, 45.0, 45.0, 41.0, 60.0, 46.0, 45.0, 52.0, 39.0, 41.0, 39.0, 39.0, 31.0, 31.0, 24.0, 20.0, 20.0, 16.0, 9.0, 10.0, 6.0, 6.0, 1.0, 8.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-14.955738067626953, -14.543953895568848, -14.132169723510742, -13.720385551452637, -13.308601379394531, -12.896817207336426, -12.48503303527832, -12.073248863220215, -11.66146469116211, -11.249680519104004, -10.837896347045898, -10.426112174987793, -10.014328002929688, -9.602543830871582, -9.190759658813477, -8.778975486755371, -8.367191314697266, -7.95540714263916, -7.543622970581055, -7.131838798522949, -6.720054626464844, -6.308270454406738, -5.896486282348633, -5.484702110290527, -5.072917938232422, -4.661133766174316, -4.249349594116211, -3.8375654220581055, -3.42578125, -3.0139970779418945, -2.602212905883789, -2.1904287338256836, -1.7786445617675781, -1.3668603897094727, -0.9550762176513672, -0.5432920455932617, -0.13150787353515625, 0.2802762985229492, 0.6920604705810547, 1.1038446426391602, 1.5156288146972656, 1.927412986755371, 2.3391971588134766, 2.750981330871582, 3.1627655029296875, 3.574549674987793, 3.9863338470458984, 4.398118019104004, 4.809902191162109, 5.221686363220215, 5.63347053527832, 6.045254707336426, 6.457038879394531, 6.868823051452637, 7.280607223510742, 7.692391395568848, 8.104175567626953, 8.515959739685059, 8.927743911743164, 9.33952808380127, 9.751312255859375, 10.16309642791748, 10.574880599975586, 10.986664772033691, 11.398448944091797]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 3.0, 6.0, 16.0, 12.0, 12.0, 46.0, 60.0, 73.0, 152.0, 249.0, 386.0, 672.0, 1234.0, 1933.0, 3251.0, 5534.0, 9637.0, 16424.0, 29033.0, 51398.0, 90882.0, 158039.0, 230182.0, 188878.0, 112136.0, 63678.0, 35692.0, 20490.0, 11595.0, 6831.0, 4058.0, 2406.0, 1439.0, 789.0, 511.0, 301.0, 196.0, 113.0, 84.0, 43.0, 33.0, 24.0, 12.0, 11.0, 5.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5908203125, -1.5288848876953125, -1.466949462890625, -1.4050140380859375, -1.34307861328125, -1.2811431884765625, -1.219207763671875, -1.1572723388671875, -1.0953369140625, -1.0334014892578125, -0.971466064453125, -0.9095306396484375, -0.84759521484375, -0.7856597900390625, -0.723724365234375, -0.6617889404296875, -0.599853515625, -0.5379180908203125, -0.475982666015625, -0.4140472412109375, -0.35211181640625, -0.2901763916015625, -0.228240966796875, -0.1663055419921875, -0.1043701171875, -0.0424346923828125, 0.019500732421875, 0.0814361572265625, 0.14337158203125, 0.2053070068359375, 0.267242431640625, 0.3291778564453125, 0.39111328125, 0.4530487060546875, 0.514984130859375, 0.5769195556640625, 0.63885498046875, 0.7007904052734375, 0.762725830078125, 0.8246612548828125, 0.8865966796875, 0.9485321044921875, 1.010467529296875, 1.0724029541015625, 1.13433837890625, 1.1962738037109375, 1.258209228515625, 1.3201446533203125, 1.382080078125, 1.4440155029296875, 1.505950927734375, 1.5678863525390625, 1.62982177734375, 1.6917572021484375, 1.753692626953125, 1.8156280517578125, 1.8775634765625, 1.9394989013671875, 2.001434326171875, 2.0633697509765625, 2.12530517578125, 2.1872406005859375, 2.249176025390625, 2.3111114501953125, 2.373046875]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 1.0, 5.0, 6.0, 2.0, 3.0, 8.0, 6.0, 13.0, 13.0, 17.0, 19.0, 26.0, 25.0, 16.0, 34.0, 30.0, 34.0, 31.0, 30.0, 45.0, 38.0, 51.0, 44.0, 33.0, 49.0, 40.0, 40.0, 42.0, 34.0, 36.0, 34.0, 36.0, 21.0, 22.0, 18.0, 27.0, 11.0, 15.0, 8.0, 17.0, 9.0, 2.0, 3.0, 6.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.4453125, -12.0567626953125, -11.668212890625, -11.2796630859375, -10.89111328125, -10.5025634765625, -10.114013671875, -9.7254638671875, -9.3369140625, -8.9483642578125, -8.559814453125, -8.1712646484375, -7.78271484375, -7.3941650390625, -7.005615234375, -6.6170654296875, -6.228515625, -5.8399658203125, -5.451416015625, -5.0628662109375, -4.67431640625, -4.2857666015625, -3.897216796875, -3.5086669921875, -3.1201171875, -2.7315673828125, -2.343017578125, -1.9544677734375, -1.56591796875, -1.1773681640625, -0.788818359375, -0.4002685546875, -0.01171875, 0.3768310546875, 0.765380859375, 1.1539306640625, 1.54248046875, 1.9310302734375, 2.319580078125, 2.7081298828125, 3.0966796875, 3.4852294921875, 3.873779296875, 4.2623291015625, 4.65087890625, 5.0394287109375, 5.427978515625, 5.8165283203125, 6.205078125, 6.5936279296875, 6.982177734375, 7.3707275390625, 7.75927734375, 8.1478271484375, 8.536376953125, 8.9249267578125, 9.3134765625, 9.7020263671875, 10.090576171875, 10.4791259765625, 10.86767578125, 11.2562255859375, 11.644775390625, 12.0333251953125, 12.421875]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 10.0, 5.0, 11.0, 14.0, 30.0, 40.0, 45.0, 119.0, 173.0, 208.0, 389.0, 533.0, 839.0, 1300.0, 1907.0, 3020.0, 4583.0, 7107.0, 11182.0, 17520.0, 27018.0, 42537.0, 65360.0, 99848.0, 144665.0, 176113.0, 148812.0, 103594.0, 67852.0, 44043.0, 28348.0, 18226.0, 11722.0, 7489.0, 4836.0, 3194.0, 2030.0, 1338.0, 923.0, 547.0, 323.0, 274.0, 137.0, 98.0, 69.0, 41.0, 36.0, 21.0, 16.0, 6.0, 7.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0], "bins": [-1.6826171875, -1.63092041015625, -1.5792236328125, -1.52752685546875, -1.475830078125, -1.42413330078125, -1.3724365234375, -1.32073974609375, -1.26904296875, -1.21734619140625, -1.1656494140625, -1.11395263671875, -1.062255859375, -1.01055908203125, -0.9588623046875, -0.90716552734375, -0.85546875, -0.80377197265625, -0.7520751953125, -0.70037841796875, -0.648681640625, -0.59698486328125, -0.5452880859375, -0.49359130859375, -0.44189453125, -0.39019775390625, -0.3385009765625, -0.28680419921875, -0.235107421875, -0.18341064453125, -0.1317138671875, -0.08001708984375, -0.0283203125, 0.02337646484375, 0.0750732421875, 0.12677001953125, 0.178466796875, 0.23016357421875, 0.2818603515625, 0.33355712890625, 0.38525390625, 0.43695068359375, 0.4886474609375, 0.54034423828125, 0.592041015625, 0.64373779296875, 0.6954345703125, 0.74713134765625, 0.798828125, 0.85052490234375, 0.9022216796875, 0.95391845703125, 1.005615234375, 1.05731201171875, 1.1090087890625, 1.16070556640625, 1.21240234375, 1.26409912109375, 1.3157958984375, 1.36749267578125, 1.419189453125, 1.47088623046875, 1.5225830078125, 1.57427978515625, 1.6259765625]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 1.0, 5.0, 4.0, 4.0, 15.0, 7.0, 11.0, 14.0, 5.0, 13.0, 13.0, 22.0, 24.0, 22.0, 36.0, 29.0, 34.0, 37.0, 36.0, 34.0, 49.0, 39.0, 44.0, 28.0, 44.0, 31.0, 35.0, 35.0, 32.0, 31.0, 29.0, 40.0, 30.0, 30.0, 24.0, 24.0, 13.0, 22.0, 7.0, 13.0, 7.0, 2.0, 7.0, 4.0, 8.0, 8.0, 4.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0], "bins": [-7.796875, -7.56964111328125, -7.3424072265625, -7.11517333984375, -6.887939453125, -6.66070556640625, -6.4334716796875, -6.20623779296875, -5.97900390625, -5.75177001953125, -5.5245361328125, -5.29730224609375, -5.070068359375, -4.84283447265625, -4.6156005859375, -4.38836669921875, -4.1611328125, -3.93389892578125, -3.7066650390625, -3.47943115234375, -3.252197265625, -3.02496337890625, -2.7977294921875, -2.57049560546875, -2.34326171875, -2.11602783203125, -1.8887939453125, -1.66156005859375, -1.434326171875, -1.20709228515625, -0.9798583984375, -0.75262451171875, -0.525390625, -0.29815673828125, -0.0709228515625, 0.15631103515625, 0.383544921875, 0.61077880859375, 0.8380126953125, 1.06524658203125, 1.29248046875, 1.51971435546875, 1.7469482421875, 1.97418212890625, 2.201416015625, 2.42864990234375, 2.6558837890625, 2.88311767578125, 3.1103515625, 3.33758544921875, 3.5648193359375, 3.79205322265625, 4.019287109375, 4.24652099609375, 4.4737548828125, 4.70098876953125, 4.92822265625, 5.15545654296875, 5.3826904296875, 5.60992431640625, 5.837158203125, 6.06439208984375, 6.2916259765625, 6.51885986328125, 6.74609375]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 7.0, 3.0, 10.0, 15.0, 13.0, 14.0, 23.0, 52.0, 61.0, 81.0, 151.0, 219.0, 299.0, 439.0, 787.0, 1193.0, 2052.0, 3412.0, 6198.0, 11858.0, 24446.0, 54235.0, 124841.0, 291286.0, 293388.0, 126880.0, 54781.0, 24989.0, 11847.0, 6119.0, 3477.0, 1995.0, 1222.0, 780.0, 457.0, 289.0, 224.0, 132.0, 93.0, 67.0, 38.0, 24.0, 22.0, 12.0, 10.0, 10.0, 6.0, 3.0, 0.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1854248046875, -0.1792449951171875, -0.173065185546875, -0.1668853759765625, -0.16070556640625, -0.1545257568359375, -0.148345947265625, -0.1421661376953125, -0.135986328125, -0.1298065185546875, -0.123626708984375, -0.1174468994140625, -0.11126708984375, -0.1050872802734375, -0.098907470703125, -0.0927276611328125, -0.0865478515625, -0.0803680419921875, -0.074188232421875, -0.0680084228515625, -0.06182861328125, -0.0556488037109375, -0.049468994140625, -0.0432891845703125, -0.037109375, -0.0309295654296875, -0.024749755859375, -0.0185699462890625, -0.01239013671875, -0.0062103271484375, -3.0517578125e-05, 0.0061492919921875, 0.0123291015625, 0.0185089111328125, 0.024688720703125, 0.0308685302734375, 0.03704833984375, 0.0432281494140625, 0.049407958984375, 0.0555877685546875, 0.061767578125, 0.0679473876953125, 0.074127197265625, 0.0803070068359375, 0.08648681640625, 0.0926666259765625, 0.098846435546875, 0.1050262451171875, 0.1112060546875, 0.1173858642578125, 0.123565673828125, 0.1297454833984375, 0.13592529296875, 0.1421051025390625, 0.148284912109375, 0.1544647216796875, 0.16064453125, 0.1668243408203125, 0.173004150390625, 0.1791839599609375, 0.18536376953125, 0.1915435791015625, 0.197723388671875, 0.2039031982421875, 0.2100830078125]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 0.0, 3.0, 4.0, 3.0, 5.0, 8.0, 7.0, 3.0, 15.0, 16.0, 24.0, 12.0, 34.0, 35.0, 33.0, 32.0, 39.0, 32.0, 40.0, 37.0, 57.0, 42.0, 35.0, 28.0, 42.0, 34.0, 38.0, 43.0, 34.0, 29.0, 34.0, 21.0, 26.0, 23.0, 27.0, 20.0, 17.0, 16.0, 13.0, 9.0, 9.0, 5.0, 6.0, 7.0, 1.0, 4.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.3947486877441406e-05, -1.3501383364200592e-05, -1.3055279850959778e-05, -1.2609176337718964e-05, -1.216307282447815e-05, -1.1716969311237335e-05, -1.1270865797996521e-05, -1.0824762284755707e-05, -1.0378658771514893e-05, -9.932555258274078e-06, -9.486451745033264e-06, -9.04034823179245e-06, -8.594244718551636e-06, -8.148141205310822e-06, -7.702037692070007e-06, -7.255934178829193e-06, -6.809830665588379e-06, -6.363727152347565e-06, -5.9176236391067505e-06, -5.471520125865936e-06, -5.025416612625122e-06, -4.579313099384308e-06, -4.133209586143494e-06, -3.6871060729026794e-06, -3.2410025596618652e-06, -2.794899046421051e-06, -2.348795533180237e-06, -1.9026920199394226e-06, -1.4565885066986084e-06, -1.0104849934577942e-06, -5.6438148021698e-07, -1.1827796697616577e-07, 3.2782554626464844e-07, 7.739290595054626e-07, 1.2200325727462769e-06, 1.666136085987091e-06, 2.1122395992279053e-06, 2.5583431124687195e-06, 3.0044466257095337e-06, 3.450550138950348e-06, 3.896653652191162e-06, 4.342757165431976e-06, 4.7888606786727905e-06, 5.234964191913605e-06, 5.681067705154419e-06, 6.127171218395233e-06, 6.573274731636047e-06, 7.0193782448768616e-06, 7.465481758117676e-06, 7.91158527135849e-06, 8.357688784599304e-06, 8.803792297840118e-06, 9.249895811080933e-06, 9.695999324321747e-06, 1.0142102837562561e-05, 1.0588206350803375e-05, 1.103430986404419e-05, 1.1480413377285004e-05, 1.1926516890525818e-05, 1.2372620403766632e-05, 1.2818723917007446e-05, 1.326482743024826e-05, 1.3710930943489075e-05, 1.4157034456729889e-05, 1.4603137969970703e-05]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 6.0, 10.0, 8.0, 9.0, 21.0, 26.0, 36.0, 57.0, 119.0, 165.0, 220.0, 372.0, 577.0, 927.0, 1461.0, 2461.0, 3966.0, 7124.0, 13133.0, 24992.0, 51051.0, 110291.0, 253022.0, 308232.0, 139910.0, 63119.0, 30597.0, 15769.0, 8646.0, 4814.0, 2787.0, 1696.0, 1075.0, 653.0, 420.0, 274.0, 175.0, 114.0, 74.0, 53.0, 27.0, 27.0, 14.0, 8.0, 4.0, 5.0, 6.0, 4.0, 1.0, 2.0, 2.0], "bins": [-0.33203125, -0.322845458984375, -0.31365966796875, -0.304473876953125, -0.2952880859375, -0.286102294921875, -0.27691650390625, -0.267730712890625, -0.258544921875, -0.249359130859375, -0.24017333984375, -0.230987548828125, -0.2218017578125, -0.212615966796875, -0.20343017578125, -0.194244384765625, -0.18505859375, -0.175872802734375, -0.16668701171875, -0.157501220703125, -0.1483154296875, -0.139129638671875, -0.12994384765625, -0.120758056640625, -0.111572265625, -0.102386474609375, -0.09320068359375, -0.084014892578125, -0.0748291015625, -0.065643310546875, -0.05645751953125, -0.047271728515625, -0.0380859375, -0.028900146484375, -0.01971435546875, -0.010528564453125, -0.0013427734375, 0.007843017578125, 0.01702880859375, 0.026214599609375, 0.035400390625, 0.044586181640625, 0.05377197265625, 0.062957763671875, 0.0721435546875, 0.081329345703125, 0.09051513671875, 0.099700927734375, 0.10888671875, 0.118072509765625, 0.12725830078125, 0.136444091796875, 0.1456298828125, 0.154815673828125, 0.16400146484375, 0.173187255859375, 0.182373046875, 0.191558837890625, 0.20074462890625, 0.209930419921875, 0.2191162109375, 0.228302001953125, 0.23748779296875, 0.246673583984375, 0.255859375]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 4.0, 3.0, 4.0, 3.0, 3.0, 5.0, 2.0, 11.0, 14.0, 18.0, 22.0, 32.0, 47.0, 64.0, 72.0, 93.0, 114.0, 123.0, 79.0, 65.0, 50.0, 46.0, 33.0, 21.0, 16.0, 10.0, 14.0, 11.0, 11.0, 2.0, 1.0, 2.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07275390625, -0.06995391845703125, -0.0671539306640625, -0.06435394287109375, -0.061553955078125, -0.05875396728515625, -0.0559539794921875, -0.05315399169921875, -0.05035400390625, -0.04755401611328125, -0.0447540283203125, -0.04195404052734375, -0.039154052734375, -0.03635406494140625, -0.0335540771484375, -0.03075408935546875, -0.0279541015625, -0.02515411376953125, -0.0223541259765625, -0.01955413818359375, -0.016754150390625, -0.01395416259765625, -0.0111541748046875, -0.00835418701171875, -0.00555419921875, -0.00275421142578125, 4.57763671875e-05, 0.00284576416015625, 0.005645751953125, 0.00844573974609375, 0.0112457275390625, 0.01404571533203125, 0.016845703125, 0.01964569091796875, 0.0224456787109375, 0.02524566650390625, 0.028045654296875, 0.03084564208984375, 0.0336456298828125, 0.03644561767578125, 0.03924560546875, 0.04204559326171875, 0.0448455810546875, 0.04764556884765625, 0.050445556640625, 0.05324554443359375, 0.0560455322265625, 0.05884552001953125, 0.0616455078125, 0.06444549560546875, 0.0672454833984375, 0.07004547119140625, 0.072845458984375, 0.07564544677734375, 0.0784454345703125, 0.08124542236328125, 0.08404541015625, 0.08684539794921875, 0.0896453857421875, 0.09244537353515625, 0.095245361328125, 0.09804534912109375, 0.1008453369140625, 0.10364532470703125, 0.1064453125]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 3.0, 2.0, 3.0, 3.0, 9.0, 8.0, 9.0, 10.0, 13.0, 14.0, 27.0, 23.0, 34.0, 22.0, 36.0, 40.0, 45.0, 49.0, 38.0, 54.0, 56.0, 43.0, 71.0, 48.0, 53.0, 33.0, 44.0, 37.0, 36.0, 26.0, 20.0, 14.0, 22.0, 11.0, 7.0, 12.0, 4.0, 3.0, 8.0, 4.0, 5.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-13.771561622619629, -13.352483749389648, -12.933406829833984, -12.514328956604004, -12.095251083374023, -11.67617416381836, -11.257096290588379, -10.838018417358398, -10.418941497802734, -9.999863624572754, -9.58078670501709, -9.16170883178711, -8.742631912231445, -8.323554039001465, -7.904476165771484, -7.485398769378662, -7.06632137298584, -6.647243976593018, -6.228166580200195, -5.809088706970215, -5.390011310577393, -4.97093391418457, -4.55185604095459, -4.132778644561768, -3.7137012481689453, -3.294623851776123, -2.8755462169647217, -2.4564685821533203, -2.037391185760498, -1.6183137893676758, -1.1992361545562744, -0.780158519744873, -0.3610811233520508, 0.057996392250061035, 0.47707390785217285, 0.8961514234542847, 1.3152289390563965, 1.7343063354492188, 2.15338397026062, 2.5724616050720215, 2.9915390014648438, 3.410616397857666, 3.8296940326690674, 4.248771667480469, 4.667849063873291, 5.086926460266113, 5.506004333496094, 5.925081729888916, 6.344159126281738, 6.7632365226745605, 7.182313919067383, 7.601391792297363, 8.020469665527344, 8.439546585083008, 8.858624458312988, 9.277702331542969, 9.696779251098633, 10.115857124328613, 10.534934043884277, 10.954011917114258, 11.373088836669922, 11.792166709899902, 12.211244583129883, 12.630321502685547, 13.049399375915527]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 7.0, 5.0, 3.0, 7.0, 11.0, 11.0, 16.0, 16.0, 21.0, 32.0, 26.0, 32.0, 40.0, 25.0, 28.0, 48.0, 44.0, 48.0, 40.0, 60.0, 46.0, 46.0, 50.0, 38.0, 44.0, 37.0, 38.0, 31.0, 32.0, 24.0, 20.0, 21.0, 15.0, 8.0, 12.0, 5.0, 6.0, 1.0, 8.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-14.978402137756348, -14.56612491607666, -14.153846740722656, -13.741569519042969, -13.329291343688965, -12.917014122009277, -12.504735946655273, -12.092458724975586, -11.680181503295898, -11.267904281616211, -10.855626106262207, -10.44334888458252, -10.031070709228516, -9.618793487548828, -9.20651626586914, -8.794238090515137, -8.381959915161133, -7.969682216644287, -7.557404518127441, -7.145127296447754, -6.73284912109375, -6.3205718994140625, -5.908294200897217, -5.496016502380371, -5.083738803863525, -4.67146110534668, -4.259183406829834, -3.8469059467315674, -3.4346282482147217, -3.022350549697876, -2.6100730895996094, -2.1977953910827637, -1.7855167388916016, -1.3732390403747559, -0.9609614610671997, -0.5486838817596436, -0.13640618324279785, 0.27587151527404785, 0.6881489753723145, 1.1004266738891602, 1.5127043724060059, 1.9249820709228516, 2.3372597694396973, 2.749537229537964, 3.1618149280548096, 3.5740926265716553, 3.986370086669922, 4.398647785186768, 4.810925483703613, 5.223203182220459, 5.635480880737305, 6.047758102416992, 6.460036277770996, 6.872313499450684, 7.284591197967529, 7.696868896484375, 8.109146118164062, 8.52142333984375, 8.933701515197754, 9.345978736877441, 9.758256912231445, 10.170534133911133, 10.58281135559082, 10.995089530944824, 11.407367706298828]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 10.0, 10.0, 9.0, 10.0, 20.0, 33.0, 46.0, 101.0, 129.0, 215.0, 311.0, 493.0, 722.0, 1125.0, 1709.0, 2754.0, 4301.0, 6678.0, 10593.0, 15865.0, 24599.0, 36772.0, 54441.0, 75413.0, 97759.0, 116430.0, 124934.0, 118906.0, 101534.0, 79121.0, 57678.0, 39915.0, 26755.0, 17502.0, 11357.0, 7201.0, 4665.0, 3035.0, 1912.0, 1216.0, 805.0, 490.0, 366.0, 208.0, 148.0, 89.0, 69.0, 44.0, 23.0, 14.0, 9.0, 8.0, 7.0, 1.0, 5.0, 1.0, 1.0], "bins": [-7.09375, -6.882568359375, -6.67138671875, -6.460205078125, -6.2490234375, -6.037841796875, -5.82666015625, -5.615478515625, -5.404296875, -5.193115234375, -4.98193359375, -4.770751953125, -4.5595703125, -4.348388671875, -4.13720703125, -3.926025390625, -3.71484375, -3.503662109375, -3.29248046875, -3.081298828125, -2.8701171875, -2.658935546875, -2.44775390625, -2.236572265625, -2.025390625, -1.814208984375, -1.60302734375, -1.391845703125, -1.1806640625, -0.969482421875, -0.75830078125, -0.547119140625, -0.3359375, -0.124755859375, 0.08642578125, 0.297607421875, 0.5087890625, 0.719970703125, 0.93115234375, 1.142333984375, 1.353515625, 1.564697265625, 1.77587890625, 1.987060546875, 2.1982421875, 2.409423828125, 2.62060546875, 2.831787109375, 3.04296875, 3.254150390625, 3.46533203125, 3.676513671875, 3.8876953125, 4.098876953125, 4.31005859375, 4.521240234375, 4.732421875, 4.943603515625, 5.15478515625, 5.365966796875, 5.5771484375, 5.788330078125, 5.99951171875, 6.210693359375, 6.421875]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 5.0, 3.0, 6.0, 8.0, 8.0, 7.0, 12.0, 17.0, 13.0, 27.0, 22.0, 24.0, 21.0, 25.0, 28.0, 36.0, 49.0, 34.0, 37.0, 47.0, 46.0, 49.0, 39.0, 46.0, 49.0, 40.0, 40.0, 40.0, 33.0, 36.0, 24.0, 23.0, 24.0, 18.0, 12.0, 14.0, 14.0, 7.0, 3.0, 3.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-13.59375, -13.197265625, -12.80078125, -12.404296875, -12.0078125, -11.611328125, -11.21484375, -10.818359375, -10.421875, -10.025390625, -9.62890625, -9.232421875, -8.8359375, -8.439453125, -8.04296875, -7.646484375, -7.25, -6.853515625, -6.45703125, -6.060546875, -5.6640625, -5.267578125, -4.87109375, -4.474609375, -4.078125, -3.681640625, -3.28515625, -2.888671875, -2.4921875, -2.095703125, -1.69921875, -1.302734375, -0.90625, -0.509765625, -0.11328125, 0.283203125, 0.6796875, 1.076171875, 1.47265625, 1.869140625, 2.265625, 2.662109375, 3.05859375, 3.455078125, 3.8515625, 4.248046875, 4.64453125, 5.041015625, 5.4375, 5.833984375, 6.23046875, 6.626953125, 7.0234375, 7.419921875, 7.81640625, 8.212890625, 8.609375, 9.005859375, 9.40234375, 9.798828125, 10.1953125, 10.591796875, 10.98828125, 11.384765625, 11.78125]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 5.0, 9.0, 15.0, 19.0, 25.0, 38.0, 44.0, 97.0, 147.0, 209.0, 292.0, 416.0, 657.0, 989.0, 1466.0, 2262.0, 3520.0, 5349.0, 8044.0, 12232.0, 18083.0, 27788.0, 39768.0, 56174.0, 75652.0, 93474.0, 108931.0, 114978.0, 110481.0, 96520.0, 78805.0, 59730.0, 43418.0, 30142.0, 20073.0, 13395.0, 8752.0, 5649.0, 3592.0, 2497.0, 1676.0, 1058.0, 735.0, 435.0, 292.0, 207.0, 127.0, 98.0, 73.0, 38.0, 35.0, 21.0, 12.0, 10.0, 3.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0], "bins": [-6.01953125, -5.82281494140625, -5.6260986328125, -5.42938232421875, -5.232666015625, -5.03594970703125, -4.8392333984375, -4.64251708984375, -4.44580078125, -4.24908447265625, -4.0523681640625, -3.85565185546875, -3.658935546875, -3.46221923828125, -3.2655029296875, -3.06878662109375, -2.8720703125, -2.67535400390625, -2.4786376953125, -2.28192138671875, -2.085205078125, -1.88848876953125, -1.6917724609375, -1.49505615234375, -1.29833984375, -1.10162353515625, -0.9049072265625, -0.70819091796875, -0.511474609375, -0.31475830078125, -0.1180419921875, 0.07867431640625, 0.275390625, 0.47210693359375, 0.6688232421875, 0.86553955078125, 1.062255859375, 1.25897216796875, 1.4556884765625, 1.65240478515625, 1.84912109375, 2.04583740234375, 2.2425537109375, 2.43927001953125, 2.635986328125, 2.83270263671875, 3.0294189453125, 3.22613525390625, 3.4228515625, 3.61956787109375, 3.8162841796875, 4.01300048828125, 4.209716796875, 4.40643310546875, 4.6031494140625, 4.79986572265625, 4.99658203125, 5.19329833984375, 5.3900146484375, 5.58673095703125, 5.783447265625, 5.98016357421875, 6.1768798828125, 6.37359619140625, 6.5703125]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 4.0, 1.0, 6.0, 10.0, 8.0, 11.0, 12.0, 9.0, 15.0, 23.0, 17.0, 24.0, 17.0, 28.0, 28.0, 40.0, 46.0, 43.0, 39.0, 43.0, 37.0, 41.0, 41.0, 58.0, 28.0, 39.0, 46.0, 36.0, 40.0, 38.0, 19.0, 22.0, 20.0, 18.0, 13.0, 20.0, 11.0, 10.0, 12.0, 5.0, 7.0, 4.0, 9.0, 2.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-7.359375, -7.12957763671875, -6.8997802734375, -6.66998291015625, -6.440185546875, -6.21038818359375, -5.9805908203125, -5.75079345703125, -5.52099609375, -5.29119873046875, -5.0614013671875, -4.83160400390625, -4.601806640625, -4.37200927734375, -4.1422119140625, -3.91241455078125, -3.6826171875, -3.45281982421875, -3.2230224609375, -2.99322509765625, -2.763427734375, -2.53363037109375, -2.3038330078125, -2.07403564453125, -1.84423828125, -1.61444091796875, -1.3846435546875, -1.15484619140625, -0.925048828125, -0.69525146484375, -0.4654541015625, -0.23565673828125, -0.005859375, 0.22393798828125, 0.4537353515625, 0.68353271484375, 0.913330078125, 1.14312744140625, 1.3729248046875, 1.60272216796875, 1.83251953125, 2.06231689453125, 2.2921142578125, 2.52191162109375, 2.751708984375, 2.98150634765625, 3.2113037109375, 3.44110107421875, 3.6708984375, 3.90069580078125, 4.1304931640625, 4.36029052734375, 4.590087890625, 4.81988525390625, 5.0496826171875, 5.27947998046875, 5.50927734375, 5.73907470703125, 5.9688720703125, 6.19866943359375, 6.428466796875, 6.65826416015625, 6.8880615234375, 7.11785888671875, 7.34765625]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 10.0, 10.0, 15.0, 31.0, 31.0, 49.0, 81.0, 116.0, 150.0, 198.0, 307.0, 453.0, 645.0, 981.0, 1546.0, 2593.0, 4678.0, 8983.0, 18162.0, 37123.0, 72130.0, 124215.0, 176949.0, 196243.0, 166100.0, 110697.0, 61599.0, 31181.0, 15243.0, 7612.0, 4050.0, 2199.0, 1445.0, 919.0, 596.0, 344.0, 263.0, 166.0, 147.0, 88.0, 70.0, 39.0, 28.0, 17.0, 20.0, 11.0, 12.0, 4.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.94921875, -3.8192138671875, -3.689208984375, -3.5592041015625, -3.42919921875, -3.2991943359375, -3.169189453125, -3.0391845703125, -2.9091796875, -2.7791748046875, -2.649169921875, -2.5191650390625, -2.38916015625, -2.2591552734375, -2.129150390625, -1.9991455078125, -1.869140625, -1.7391357421875, -1.609130859375, -1.4791259765625, -1.34912109375, -1.2191162109375, -1.089111328125, -0.9591064453125, -0.8291015625, -0.6990966796875, -0.569091796875, -0.4390869140625, -0.30908203125, -0.1790771484375, -0.049072265625, 0.0809326171875, 0.2109375, 0.3409423828125, 0.470947265625, 0.6009521484375, 0.73095703125, 0.8609619140625, 0.990966796875, 1.1209716796875, 1.2509765625, 1.3809814453125, 1.510986328125, 1.6409912109375, 1.77099609375, 1.9010009765625, 2.031005859375, 2.1610107421875, 2.291015625, 2.4210205078125, 2.551025390625, 2.6810302734375, 2.81103515625, 2.9410400390625, 3.071044921875, 3.2010498046875, 3.3310546875, 3.4610595703125, 3.591064453125, 3.7210693359375, 3.85107421875, 3.9810791015625, 4.111083984375, 4.2410888671875, 4.37109375]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 3.0, 5.0, 6.0, 2.0, 15.0, 13.0, 14.0, 20.0, 31.0, 50.0, 49.0, 68.0, 71.0, 63.0, 66.0, 63.0, 88.0, 58.0, 54.0, 54.0, 47.0, 37.0, 33.0, 29.0, 18.0, 17.0, 6.0, 3.0, 7.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00045108795166015625, -0.00043720006942749023, -0.0004233121871948242, -0.0004094243049621582, -0.0003955364227294922, -0.00038164854049682617, -0.00036776065826416016, -0.00035387277603149414, -0.0003399848937988281, -0.0003260970115661621, -0.0003122091293334961, -0.0002983212471008301, -0.00028443336486816406, -0.00027054548263549805, -0.00025665760040283203, -0.00024276971817016602, -0.0002288818359375, -0.00021499395370483398, -0.00020110607147216797, -0.00018721818923950195, -0.00017333030700683594, -0.00015944242477416992, -0.0001455545425415039, -0.0001316666603088379, -0.00011777877807617188, -0.00010389089584350586, -9.000301361083984e-05, -7.611513137817383e-05, -6.222724914550781e-05, -4.83393669128418e-05, -3.445148468017578e-05, -2.0563602447509766e-05, -6.67572021484375e-06, 7.212162017822266e-06, 2.110004425048828e-05, 3.49879264831543e-05, 4.887580871582031e-05, 6.276369094848633e-05, 7.665157318115234e-05, 9.053945541381836e-05, 0.00010442733764648438, 0.00011831521987915039, 0.0001322031021118164, 0.00014609098434448242, 0.00015997886657714844, 0.00017386674880981445, 0.00018775463104248047, 0.00020164251327514648, 0.0002155303955078125, 0.00022941827774047852, 0.00024330615997314453, 0.00025719404220581055, 0.00027108192443847656, 0.0002849698066711426, 0.0002988576889038086, 0.0003127455711364746, 0.0003266334533691406, 0.00034052133560180664, 0.00035440921783447266, 0.00036829710006713867, 0.0003821849822998047, 0.0003960728645324707, 0.0004099607467651367, 0.00042384862899780273, 0.00043773651123046875]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 8.0, 10.0, 15.0, 12.0, 26.0, 24.0, 47.0, 71.0, 110.0, 186.0, 291.0, 434.0, 788.0, 1351.0, 2565.0, 5393.0, 13263.0, 36303.0, 101268.0, 219936.0, 292902.0, 216030.0, 98195.0, 35352.0, 12898.0, 5317.0, 2519.0, 1294.0, 741.0, 420.0, 279.0, 144.0, 97.0, 68.0, 53.0, 49.0, 19.0, 24.0, 11.0, 11.0, 10.0, 6.0, 3.0, 6.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.6796875, -6.47406005859375, -6.2684326171875, -6.06280517578125, -5.857177734375, -5.65155029296875, -5.4459228515625, -5.24029541015625, -5.03466796875, -4.82904052734375, -4.6234130859375, -4.41778564453125, -4.212158203125, -4.00653076171875, -3.8009033203125, -3.59527587890625, -3.3896484375, -3.18402099609375, -2.9783935546875, -2.77276611328125, -2.567138671875, -2.36151123046875, -2.1558837890625, -1.95025634765625, -1.74462890625, -1.53900146484375, -1.3333740234375, -1.12774658203125, -0.922119140625, -0.71649169921875, -0.5108642578125, -0.30523681640625, -0.099609375, 0.10601806640625, 0.3116455078125, 0.51727294921875, 0.722900390625, 0.92852783203125, 1.1341552734375, 1.33978271484375, 1.54541015625, 1.75103759765625, 1.9566650390625, 2.16229248046875, 2.367919921875, 2.57354736328125, 2.7791748046875, 2.98480224609375, 3.1904296875, 3.39605712890625, 3.6016845703125, 3.80731201171875, 4.012939453125, 4.21856689453125, 4.4241943359375, 4.62982177734375, 4.83544921875, 5.04107666015625, 5.2467041015625, 5.45233154296875, 5.657958984375, 5.86358642578125, 6.0692138671875, 6.27484130859375, 6.48046875]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 8.0, 6.0, 9.0, 5.0, 15.0, 21.0, 18.0, 24.0, 33.0, 43.0, 73.0, 69.0, 72.0, 80.0, 74.0, 81.0, 73.0, 62.0, 44.0, 43.0, 39.0, 25.0, 21.0, 12.0, 14.0, 6.0, 7.0, 5.0, 9.0, 6.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.431640625, -1.381103515625, -1.33056640625, -1.280029296875, -1.2294921875, -1.178955078125, -1.12841796875, -1.077880859375, -1.02734375, -0.976806640625, -0.92626953125, -0.875732421875, -0.8251953125, -0.774658203125, -0.72412109375, -0.673583984375, -0.623046875, -0.572509765625, -0.52197265625, -0.471435546875, -0.4208984375, -0.370361328125, -0.31982421875, -0.269287109375, -0.21875, -0.168212890625, -0.11767578125, -0.067138671875, -0.0166015625, 0.033935546875, 0.08447265625, 0.135009765625, 0.185546875, 0.236083984375, 0.28662109375, 0.337158203125, 0.3876953125, 0.438232421875, 0.48876953125, 0.539306640625, 0.58984375, 0.640380859375, 0.69091796875, 0.741455078125, 0.7919921875, 0.842529296875, 0.89306640625, 0.943603515625, 0.994140625, 1.044677734375, 1.09521484375, 1.145751953125, 1.1962890625, 1.246826171875, 1.29736328125, 1.347900390625, 1.3984375, 1.448974609375, 1.49951171875, 1.550048828125, 1.6005859375, 1.651123046875, 1.70166015625, 1.752197265625, 1.802734375]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 6.0, 5.0, 4.0, 9.0, 11.0, 10.0, 17.0, 20.0, 18.0, 25.0, 21.0, 22.0, 30.0, 33.0, 40.0, 41.0, 48.0, 47.0, 44.0, 54.0, 44.0, 54.0, 44.0, 50.0, 51.0, 31.0, 33.0, 34.0, 24.0, 25.0, 16.0, 19.0, 10.0, 17.0, 9.0, 9.0, 5.0, 4.0, 4.0, 4.0, 1.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-13.322610855102539, -12.925789833068848, -12.528968811035156, -12.132147789001465, -11.735326766967773, -11.338505744934082, -10.94168472290039, -10.544864654541016, -10.148042678833008, -9.751221656799316, -9.354400634765625, -8.957579612731934, -8.560758590698242, -8.16393756866455, -7.767117023468018, -7.370296001434326, -6.973475456237793, -6.576654434204102, -6.17983341217041, -5.783012390136719, -5.386191368103027, -4.989370346069336, -4.592549800872803, -4.195728778839111, -3.79890775680542, -3.4020867347717285, -3.005265712738037, -2.608444929122925, -2.2116239070892334, -1.814802885055542, -1.4179821014404297, -1.0211610794067383, -0.6243410110473633, -0.22752004861831665, 0.16930091381072998, 0.5661218166351318, 0.9629428386688232, 1.3597638607025146, 1.756584644317627, 2.1534056663513184, 2.5502266883850098, 2.947047710418701, 3.3438687324523926, 3.740689516067505, 4.137510299682617, 4.534331321716309, 4.93115234375, 5.327973365783691, 5.724794387817383, 6.121615409851074, 6.518436431884766, 6.915257453918457, 7.312078475952148, 7.70889949798584, 8.105720520019531, 8.502540588378906, 8.899362564086914, 9.296183586120605, 9.693004608154297, 10.089825630187988, 10.48664665222168, 10.883467674255371, 11.280288696289062, 11.677108764648438, 12.073929786682129]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 5.0, 4.0, 4.0, 7.0, 9.0, 18.0, 13.0, 14.0, 17.0, 19.0, 25.0, 40.0, 20.0, 31.0, 27.0, 41.0, 39.0, 47.0, 44.0, 46.0, 38.0, 31.0, 36.0, 40.0, 52.0, 41.0, 33.0, 32.0, 40.0, 37.0, 18.0, 18.0, 21.0, 20.0, 17.0, 13.0, 12.0, 10.0, 6.0, 4.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-13.985101699829102, -13.58392333984375, -13.182744979858398, -12.781566619873047, -12.380388259887695, -11.979209899902344, -11.578031539916992, -11.17685317993164, -10.775674819946289, -10.374496459960938, -9.973318099975586, -9.572139739990234, -9.170961380004883, -8.769783020019531, -8.36860466003418, -7.967426300048828, -7.566247463226318, -7.165069103240967, -6.763890743255615, -6.362712383270264, -5.961534023284912, -5.560355186462402, -5.159176826477051, -4.757998466491699, -4.356820106506348, -3.955641746520996, -3.5544633865356445, -3.153285026550293, -2.7521066665649414, -2.3509280681610107, -1.9497497081756592, -1.5485713481903076, -1.1473932266235352, -0.7462148666381836, -0.34503644704818726, 0.05614197254180908, 0.45732033252716064, 0.8584988117218018, 1.2596771717071533, 1.6608555316925049, 2.0620338916778564, 2.463212251663208, 2.8643906116485596, 3.2655692100524902, 3.666747570037842, 4.067925930023193, 4.469104290008545, 4.8702826499938965, 5.271461009979248, 5.6726393699646, 6.073817729949951, 6.474996089935303, 6.876174449920654, 7.277353286743164, 7.678531646728516, 8.079710006713867, 8.480888366699219, 8.88206672668457, 9.283245086669922, 9.684423446655273, 10.085601806640625, 10.486780166625977, 10.887958526611328, 11.28913688659668, 11.690315246582031]}, "gradients/decoder.bert.encoder.layer.1.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 9.0, 11.0, 15.0, 35.0, 52.0, 76.0, 127.0, 190.0, 293.0, 468.0, 753.0, 1119.0, 1700.0, 2693.0, 4189.0, 6599.0, 10667.0, 17152.0, 27362.0, 43502.0, 68392.0, 107464.0, 168876.0, 252580.0, 363911.0, 480447.0, 559396.0, 555946.0, 474862.0, 355669.0, 247929.0, 163950.0, 105256.0, 65896.0, 41374.0, 25253.0, 15558.0, 9420.0, 5827.0, 3548.0, 2225.0, 1352.0, 835.0, 490.0, 288.0, 206.0, 124.0, 70.0, 45.0, 32.0, 23.0, 18.0, 7.0, 2.0, 2.0, 3.0, 5.0, 2.0], "bins": [-11.9140625, -11.552490234375, -11.19091796875, -10.829345703125, -10.4677734375, -10.106201171875, -9.74462890625, -9.383056640625, -9.021484375, -8.659912109375, -8.29833984375, -7.936767578125, -7.5751953125, -7.213623046875, -6.85205078125, -6.490478515625, -6.12890625, -5.767333984375, -5.40576171875, -5.044189453125, -4.6826171875, -4.321044921875, -3.95947265625, -3.597900390625, -3.236328125, -2.874755859375, -2.51318359375, -2.151611328125, -1.7900390625, -1.428466796875, -1.06689453125, -0.705322265625, -0.34375, 0.017822265625, 0.37939453125, 0.740966796875, 1.1025390625, 1.464111328125, 1.82568359375, 2.187255859375, 2.548828125, 2.910400390625, 3.27197265625, 3.633544921875, 3.9951171875, 4.356689453125, 4.71826171875, 5.079833984375, 5.44140625, 5.802978515625, 6.16455078125, 6.526123046875, 6.8876953125, 7.249267578125, 7.61083984375, 7.972412109375, 8.333984375, 8.695556640625, 9.05712890625, 9.418701171875, 9.7802734375, 10.141845703125, 10.50341796875, 10.864990234375, 11.2265625]}, "gradients/decoder.bert.encoder.layer.1.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 6.0, 2.0, 2.0, 6.0, 6.0, 6.0, 4.0, 6.0, 12.0, 12.0, 17.0, 19.0, 18.0, 20.0, 26.0, 25.0, 20.0, 30.0, 31.0, 33.0, 29.0, 39.0, 37.0, 44.0, 37.0, 46.0, 36.0, 44.0, 32.0, 23.0, 31.0, 39.0, 49.0, 26.0, 24.0, 21.0, 29.0, 20.0, 22.0, 16.0, 17.0, 6.0, 11.0, 10.0, 3.0, 5.0, 3.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.3828125, -10.0517578125, -9.720703125, -9.3896484375, -9.05859375, -8.7275390625, -8.396484375, -8.0654296875, -7.734375, -7.4033203125, -7.072265625, -6.7412109375, -6.41015625, -6.0791015625, -5.748046875, -5.4169921875, -5.0859375, -4.7548828125, -4.423828125, -4.0927734375, -3.76171875, -3.4306640625, -3.099609375, -2.7685546875, -2.4375, -2.1064453125, -1.775390625, -1.4443359375, -1.11328125, -0.7822265625, -0.451171875, -0.1201171875, 0.2109375, 0.5419921875, 0.873046875, 1.2041015625, 1.53515625, 1.8662109375, 2.197265625, 2.5283203125, 2.859375, 3.1904296875, 3.521484375, 3.8525390625, 4.18359375, 4.5146484375, 4.845703125, 5.1767578125, 5.5078125, 5.8388671875, 6.169921875, 6.5009765625, 6.83203125, 7.1630859375, 7.494140625, 7.8251953125, 8.15625, 8.4873046875, 8.818359375, 9.1494140625, 9.48046875, 9.8115234375, 10.142578125, 10.4736328125, 10.8046875]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 4.0, 8.0, 9.0, 27.0, 45.0, 50.0, 81.0, 146.0, 228.0, 335.0, 577.0, 987.0, 1657.0, 2712.0, 4535.0, 7831.0, 12777.0, 21370.0, 35914.0, 60184.0, 99138.0, 159183.0, 243529.0, 351957.0, 466404.0, 550423.0, 561055.0, 493337.0, 384826.0, 271325.0, 178435.0, 113092.0, 69333.0, 41362.0, 25108.0, 14472.0, 8616.0, 5274.0, 3112.0, 1939.0, 1081.0, 694.0, 408.0, 273.0, 172.0, 100.0, 65.0, 32.0, 29.0, 17.0, 12.0, 2.0, 5.0, 2.0, 0.0, 1.0, 2.0], "bins": [-14.9375, -14.4866943359375, -14.035888671875, -13.5850830078125, -13.13427734375, -12.6834716796875, -12.232666015625, -11.7818603515625, -11.3310546875, -10.8802490234375, -10.429443359375, -9.9786376953125, -9.52783203125, -9.0770263671875, -8.626220703125, -8.1754150390625, -7.724609375, -7.2738037109375, -6.822998046875, -6.3721923828125, -5.92138671875, -5.4705810546875, -5.019775390625, -4.5689697265625, -4.1181640625, -3.6673583984375, -3.216552734375, -2.7657470703125, -2.31494140625, -1.8641357421875, -1.413330078125, -0.9625244140625, -0.51171875, -0.0609130859375, 0.389892578125, 0.8406982421875, 1.29150390625, 1.7423095703125, 2.193115234375, 2.6439208984375, 3.0947265625, 3.5455322265625, 3.996337890625, 4.4471435546875, 4.89794921875, 5.3487548828125, 5.799560546875, 6.2503662109375, 6.701171875, 7.1519775390625, 7.602783203125, 8.0535888671875, 8.50439453125, 8.9552001953125, 9.406005859375, 9.8568115234375, 10.3076171875, 10.7584228515625, 11.209228515625, 11.6600341796875, 12.11083984375, 12.5616455078125, 13.012451171875, 13.4632568359375, 13.9140625]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 8.0, 10.0, 18.0, 15.0, 31.0, 34.0, 44.0, 57.0, 74.0, 102.0, 105.0, 156.0, 167.0, 210.0, 214.0, 263.0, 263.0, 279.0, 265.0, 271.0, 218.0, 225.0, 215.0, 156.0, 126.0, 135.0, 109.0, 69.0, 61.0, 44.0, 29.0, 29.0, 19.0, 14.0, 14.0, 14.0, 9.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.84375, -7.612548828125, -7.38134765625, -7.150146484375, -6.9189453125, -6.687744140625, -6.45654296875, -6.225341796875, -5.994140625, -5.762939453125, -5.53173828125, -5.300537109375, -5.0693359375, -4.838134765625, -4.60693359375, -4.375732421875, -4.14453125, -3.913330078125, -3.68212890625, -3.450927734375, -3.2197265625, -2.988525390625, -2.75732421875, -2.526123046875, -2.294921875, -2.063720703125, -1.83251953125, -1.601318359375, -1.3701171875, -1.138916015625, -0.90771484375, -0.676513671875, -0.4453125, -0.214111328125, 0.01708984375, 0.248291015625, 0.4794921875, 0.710693359375, 0.94189453125, 1.173095703125, 1.404296875, 1.635498046875, 1.86669921875, 2.097900390625, 2.3291015625, 2.560302734375, 2.79150390625, 3.022705078125, 3.25390625, 3.485107421875, 3.71630859375, 3.947509765625, 4.1787109375, 4.409912109375, 4.64111328125, 4.872314453125, 5.103515625, 5.334716796875, 5.56591796875, 5.797119140625, 6.0283203125, 6.259521484375, 6.49072265625, 6.721923828125, 6.953125]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 5.0, 5.0, 5.0, 4.0, 2.0, 7.0, 7.0, 7.0, 6.0, 8.0, 14.0, 19.0, 33.0, 25.0, 28.0, 40.0, 45.0, 53.0, 48.0, 47.0, 53.0, 55.0, 54.0, 44.0, 46.0, 37.0, 42.0, 47.0, 32.0, 33.0, 24.0, 21.0, 23.0, 20.0, 16.0, 5.0, 4.0, 11.0, 8.0, 5.0, 3.0, 3.0, 2.0, 4.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.138803482055664, -16.52672004699707, -15.91463851928711, -15.302555084228516, -14.690472602844238, -14.078390121459961, -13.466306686401367, -12.85422420501709, -12.242141723632812, -11.630059242248535, -11.017976760864258, -10.405893325805664, -9.793810844421387, -9.18172836303711, -8.569644927978516, -7.957562446594238, -7.345479965209961, -6.733397483825684, -6.121314525604248, -5.5092315673828125, -4.897149085998535, -4.285066604614258, -3.6729836463928223, -3.0609006881713867, -2.4488182067871094, -1.836735486984253, -1.2246527671813965, -0.61257004737854, -0.00048732757568359375, 0.6115953922271729, 1.2236781120300293, 1.8357610702514648, 2.4478416442871094, 3.059924364089966, 3.6720070838928223, 4.284090042114258, 4.896172523498535, 5.5082550048828125, 6.120337963104248, 6.732420921325684, 7.344503402709961, 7.956585884094238, 8.568668365478516, 9.18075180053711, 9.792834281921387, 10.404916763305664, 11.017000198364258, 11.629082679748535, 12.241165161132812, 12.85324764251709, 13.465330123901367, 14.077413558959961, 14.689496040344238, 15.301578521728516, 15.91366195678711, 16.525745391845703, 17.137826919555664, 17.749910354614258, 18.36199188232422, 18.974075317382812, 19.586158752441406, 20.198240280151367, 20.81032371520996, 21.422405242919922, 22.034488677978516]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 5.0, 2.0, 8.0, 8.0, 4.0, 12.0, 9.0, 17.0, 14.0, 18.0, 26.0, 19.0, 27.0, 30.0, 26.0, 38.0, 30.0, 34.0, 44.0, 49.0, 41.0, 37.0, 44.0, 33.0, 31.0, 44.0, 48.0, 31.0, 34.0, 35.0, 30.0, 21.0, 24.0, 19.0, 18.0, 21.0, 9.0, 18.0, 14.0, 10.0, 7.0, 4.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-17.245227813720703, -16.741004943847656, -16.23678207397461, -15.732558250427246, -15.228334426879883, -14.724111557006836, -14.219888687133789, -13.715665817260742, -13.211441993713379, -12.707219123840332, -12.202995300292969, -11.698772430419922, -11.194549560546875, -10.690325736999512, -10.186102867126465, -9.681879043579102, -9.177656173706055, -8.673433303833008, -8.169209480285645, -7.664986610412598, -7.160763263702393, -6.6565399169921875, -6.152317047119141, -5.6480937004089355, -5.1438703536987305, -4.639647006988525, -4.13542366027832, -3.6312007904052734, -3.1269774436950684, -2.6227540969848633, -2.1185309886932373, -1.6143078804016113, -1.1100835800170898, -0.6058603525161743, -0.10163712501525879, 0.40258610248565674, 0.9068093299865723, 1.4110326766967773, 1.9152557849884033, 2.4194788932800293, 2.9237022399902344, 3.4279255867004395, 3.9321486949920654, 4.436371803283691, 4.9405951499938965, 5.444818496704102, 5.949041366577148, 6.4532647132873535, 6.957488059997559, 7.461711406707764, 7.965934753417969, 8.470157623291016, 8.974380493164062, 9.478604316711426, 9.982827186584473, 10.487051010131836, 10.991273880004883, 11.49549674987793, 11.999720573425293, 12.50394344329834, 13.008167266845703, 13.51239013671875, 14.016613006591797, 14.520835876464844, 15.025059700012207]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 3.0, 8.0, 11.0, 18.0, 51.0, 61.0, 88.0, 148.0, 223.0, 312.0, 593.0, 911.0, 1466.0, 2480.0, 4136.0, 6800.0, 12080.0, 20987.0, 37870.0, 69307.0, 127068.0, 215487.0, 229899.0, 142432.0, 78100.0, 42140.0, 23552.0, 13325.0, 7680.0, 4461.0, 2619.0, 1573.0, 1052.0, 566.0, 375.0, 238.0, 157.0, 116.0, 57.0, 39.0, 23.0, 21.0, 7.0, 7.0, 3.0, 7.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.001953125, -2.908416748046875, -2.81488037109375, -2.721343994140625, -2.6278076171875, -2.534271240234375, -2.44073486328125, -2.347198486328125, -2.253662109375, -2.160125732421875, -2.06658935546875, -1.973052978515625, -1.8795166015625, -1.785980224609375, -1.69244384765625, -1.598907470703125, -1.50537109375, -1.411834716796875, -1.31829833984375, -1.224761962890625, -1.1312255859375, -1.037689208984375, -0.94415283203125, -0.850616455078125, -0.757080078125, -0.663543701171875, -0.57000732421875, -0.476470947265625, -0.3829345703125, -0.289398193359375, -0.19586181640625, -0.102325439453125, -0.0087890625, 0.084747314453125, 0.17828369140625, 0.271820068359375, 0.3653564453125, 0.458892822265625, 0.55242919921875, 0.645965576171875, 0.739501953125, 0.833038330078125, 0.92657470703125, 1.020111083984375, 1.1136474609375, 1.207183837890625, 1.30072021484375, 1.394256591796875, 1.48779296875, 1.581329345703125, 1.67486572265625, 1.768402099609375, 1.8619384765625, 1.955474853515625, 2.04901123046875, 2.142547607421875, 2.236083984375, 2.329620361328125, 2.42315673828125, 2.516693115234375, 2.6102294921875, 2.703765869140625, 2.79730224609375, 2.890838623046875, 2.984375]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 8.0, 7.0, 6.0, 8.0, 8.0, 15.0, 14.0, 19.0, 18.0, 30.0, 37.0, 36.0, 41.0, 30.0, 27.0, 49.0, 56.0, 45.0, 44.0, 40.0, 45.0, 34.0, 57.0, 44.0, 39.0, 35.0, 22.0, 35.0, 34.0, 30.0, 23.0, 15.0, 8.0, 16.0, 9.0, 7.0, 3.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.671875, -20.0654296875, -19.458984375, -18.8525390625, -18.24609375, -17.6396484375, -17.033203125, -16.4267578125, -15.8203125, -15.2138671875, -14.607421875, -14.0009765625, -13.39453125, -12.7880859375, -12.181640625, -11.5751953125, -10.96875, -10.3623046875, -9.755859375, -9.1494140625, -8.54296875, -7.9365234375, -7.330078125, -6.7236328125, -6.1171875, -5.5107421875, -4.904296875, -4.2978515625, -3.69140625, -3.0849609375, -2.478515625, -1.8720703125, -1.265625, -0.6591796875, -0.052734375, 0.5537109375, 1.16015625, 1.7666015625, 2.373046875, 2.9794921875, 3.5859375, 4.1923828125, 4.798828125, 5.4052734375, 6.01171875, 6.6181640625, 7.224609375, 7.8310546875, 8.4375, 9.0439453125, 9.650390625, 10.2568359375, 10.86328125, 11.4697265625, 12.076171875, 12.6826171875, 13.2890625, 13.8955078125, 14.501953125, 15.1083984375, 15.71484375, 16.3212890625, 16.927734375, 17.5341796875, 18.140625]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 8.0, 10.0, 16.0, 20.0, 34.0, 41.0, 82.0, 90.0, 157.0, 255.0, 383.0, 503.0, 755.0, 1186.0, 1726.0, 2550.0, 3973.0, 5898.0, 9001.0, 13784.0, 21163.0, 32916.0, 50132.0, 77631.0, 117165.0, 164700.0, 171188.0, 127356.0, 85631.0, 55916.0, 36112.0, 23382.0, 15362.0, 10013.0, 6510.0, 4342.0, 2849.0, 1839.0, 1273.0, 843.0, 576.0, 366.0, 281.0, 165.0, 133.0, 83.0, 46.0, 35.0, 26.0, 27.0, 5.0, 9.0, 9.0, 6.0, 2.0, 2.0], "bins": [-2.541015625, -2.466522216796875, -2.39202880859375, -2.317535400390625, -2.2430419921875, -2.168548583984375, -2.09405517578125, -2.019561767578125, -1.945068359375, -1.870574951171875, -1.79608154296875, -1.721588134765625, -1.6470947265625, -1.572601318359375, -1.49810791015625, -1.423614501953125, -1.34912109375, -1.274627685546875, -1.20013427734375, -1.125640869140625, -1.0511474609375, -0.976654052734375, -0.90216064453125, -0.827667236328125, -0.753173828125, -0.678680419921875, -0.60418701171875, -0.529693603515625, -0.4552001953125, -0.380706787109375, -0.30621337890625, -0.231719970703125, -0.1572265625, -0.082733154296875, -0.00823974609375, 0.066253662109375, 0.1407470703125, 0.215240478515625, 0.28973388671875, 0.364227294921875, 0.438720703125, 0.513214111328125, 0.58770751953125, 0.662200927734375, 0.7366943359375, 0.811187744140625, 0.88568115234375, 0.960174560546875, 1.03466796875, 1.109161376953125, 1.18365478515625, 1.258148193359375, 1.3326416015625, 1.407135009765625, 1.48162841796875, 1.556121826171875, 1.630615234375, 1.705108642578125, 1.77960205078125, 1.854095458984375, 1.9285888671875, 2.003082275390625, 2.07757568359375, 2.152069091796875, 2.2265625]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 4.0, 3.0, 8.0, 2.0, 6.0, 13.0, 15.0, 15.0, 16.0, 19.0, 16.0, 40.0, 31.0, 32.0, 43.0, 30.0, 40.0, 42.0, 56.0, 46.0, 48.0, 33.0, 44.0, 50.0, 34.0, 47.0, 27.0, 35.0, 30.0, 27.0, 31.0, 29.0, 15.0, 18.0, 13.0, 9.0, 8.0, 12.0, 6.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-12.609375, -12.24853515625, -11.8876953125, -11.52685546875, -11.166015625, -10.80517578125, -10.4443359375, -10.08349609375, -9.72265625, -9.36181640625, -9.0009765625, -8.64013671875, -8.279296875, -7.91845703125, -7.5576171875, -7.19677734375, -6.8359375, -6.47509765625, -6.1142578125, -5.75341796875, -5.392578125, -5.03173828125, -4.6708984375, -4.31005859375, -3.94921875, -3.58837890625, -3.2275390625, -2.86669921875, -2.505859375, -2.14501953125, -1.7841796875, -1.42333984375, -1.0625, -0.70166015625, -0.3408203125, 0.02001953125, 0.380859375, 0.74169921875, 1.1025390625, 1.46337890625, 1.82421875, 2.18505859375, 2.5458984375, 2.90673828125, 3.267578125, 3.62841796875, 3.9892578125, 4.35009765625, 4.7109375, 5.07177734375, 5.4326171875, 5.79345703125, 6.154296875, 6.51513671875, 6.8759765625, 7.23681640625, 7.59765625, 7.95849609375, 8.3193359375, 8.68017578125, 9.041015625, 9.40185546875, 9.7626953125, 10.12353515625, 10.484375]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 1.0, 3.0, 5.0, 16.0, 11.0, 29.0, 46.0, 60.0, 91.0, 158.0, 251.0, 410.0, 737.0, 1312.0, 2490.0, 4716.0, 9332.0, 18773.0, 38756.0, 82801.0, 177843.0, 312714.0, 208656.0, 98587.0, 45857.0, 22100.0, 10910.0, 5478.0, 2857.0, 1543.0, 854.0, 409.0, 272.0, 168.0, 123.0, 69.0, 40.0, 25.0, 22.0, 11.0, 7.0, 5.0, 2.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2242431640625, -0.21640586853027344, -0.20856857299804688, -0.2007312774658203, -0.19289398193359375, -0.1850566864013672, -0.17721939086914062, -0.16938209533691406, -0.1615447998046875, -0.15370750427246094, -0.14587020874023438, -0.1380329132080078, -0.13019561767578125, -0.12235832214355469, -0.11452102661132812, -0.10668373107910156, -0.098846435546875, -0.09100914001464844, -0.08317184448242188, -0.07533454895019531, -0.06749725341796875, -0.05965995788574219, -0.051822662353515625, -0.04398536682128906, -0.0361480712890625, -0.028310775756835938, -0.020473480224609375, -0.012636184692382812, -0.00479888916015625, 0.0030384063720703125, 0.010875701904296875, 0.018712997436523438, 0.02655029296875, 0.03438758850097656, 0.042224884033203125, 0.05006217956542969, 0.05789947509765625, 0.06573677062988281, 0.07357406616210938, 0.08141136169433594, 0.0892486572265625, 0.09708595275878906, 0.10492324829101562, 0.11276054382324219, 0.12059783935546875, 0.1284351348876953, 0.13627243041992188, 0.14410972595214844, 0.151947021484375, 0.15978431701660156, 0.16762161254882812, 0.1754589080810547, 0.18329620361328125, 0.1911334991455078, 0.19897079467773438, 0.20680809020996094, 0.2146453857421875, 0.22248268127441406, 0.23031997680664062, 0.2381572723388672, 0.24599456787109375, 0.2538318634033203, 0.2616691589355469, 0.26950645446777344, 0.27734375]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 7.0, 2.0, 4.0, 2.0, 10.0, 14.0, 14.0, 14.0, 10.0, 20.0, 27.0, 32.0, 37.0, 36.0, 51.0, 43.0, 35.0, 61.0, 59.0, 72.0, 54.0, 50.0, 54.0, 45.0, 44.0, 40.0, 32.0, 24.0, 24.0, 19.0, 18.0, 14.0, 9.0, 6.0, 6.0, 6.0, 3.0, 7.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.9252300262451172e-05, -1.8544495105743408e-05, -1.7836689949035645e-05, -1.712888479232788e-05, -1.6421079635620117e-05, -1.5713274478912354e-05, -1.500546932220459e-05, -1.4297664165496826e-05, -1.3589859008789062e-05, -1.2882053852081299e-05, -1.2174248695373535e-05, -1.1466443538665771e-05, -1.0758638381958008e-05, -1.0050833225250244e-05, -9.34302806854248e-06, -8.635222911834717e-06, -7.927417755126953e-06, -7.2196125984191895e-06, -6.511807441711426e-06, -5.804002285003662e-06, -5.0961971282958984e-06, -4.388391971588135e-06, -3.680586814880371e-06, -2.9727816581726074e-06, -2.2649765014648438e-06, -1.55717134475708e-06, -8.493661880493164e-07, -1.4156103134155273e-07, 5.662441253662109e-07, 1.2740492820739746e-06, 1.9818544387817383e-06, 2.689659595489502e-06, 3.3974647521972656e-06, 4.105269908905029e-06, 4.813075065612793e-06, 5.520880222320557e-06, 6.22868537902832e-06, 6.936490535736084e-06, 7.644295692443848e-06, 8.352100849151611e-06, 9.059906005859375e-06, 9.767711162567139e-06, 1.0475516319274902e-05, 1.1183321475982666e-05, 1.189112663269043e-05, 1.2598931789398193e-05, 1.3306736946105957e-05, 1.401454210281372e-05, 1.4722347259521484e-05, 1.5430152416229248e-05, 1.6137957572937012e-05, 1.6845762729644775e-05, 1.755356788635254e-05, 1.8261373043060303e-05, 1.8969178199768066e-05, 1.967698335647583e-05, 2.0384788513183594e-05, 2.1092593669891357e-05, 2.180039882659912e-05, 2.2508203983306885e-05, 2.321600914001465e-05, 2.3923814296722412e-05, 2.4631619453430176e-05, 2.533942461013794e-05, 2.6047229766845703e-05]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 7.0, 5.0, 18.0, 26.0, 34.0, 49.0, 82.0, 103.0, 160.0, 257.0, 375.0, 544.0, 821.0, 1280.0, 2102.0, 3239.0, 5211.0, 8562.0, 14030.0, 23066.0, 39365.0, 68944.0, 120150.0, 204577.0, 225235.0, 138558.0, 78405.0, 45302.0, 26263.0, 15865.0, 9740.0, 5883.0, 3666.0, 2349.0, 1525.0, 942.0, 622.0, 408.0, 254.0, 145.0, 126.0, 76.0, 58.0, 46.0, 32.0, 14.0, 16.0, 8.0, 6.0, 6.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.277587890625, -0.26866912841796875, -0.2597503662109375, -0.25083160400390625, -0.241912841796875, -0.23299407958984375, -0.2240753173828125, -0.21515655517578125, -0.20623779296875, -0.19731903076171875, -0.1884002685546875, -0.17948150634765625, -0.170562744140625, -0.16164398193359375, -0.1527252197265625, -0.14380645751953125, -0.1348876953125, -0.12596893310546875, -0.1170501708984375, -0.10813140869140625, -0.099212646484375, -0.09029388427734375, -0.0813751220703125, -0.07245635986328125, -0.06353759765625, -0.05461883544921875, -0.0457000732421875, -0.03678131103515625, -0.027862548828125, -0.01894378662109375, -0.0100250244140625, -0.00110626220703125, 0.0078125, 0.01673126220703125, 0.0256500244140625, 0.03456878662109375, 0.043487548828125, 0.05240631103515625, 0.0613250732421875, 0.07024383544921875, 0.07916259765625, 0.08808135986328125, 0.0970001220703125, 0.10591888427734375, 0.114837646484375, 0.12375640869140625, 0.1326751708984375, 0.14159393310546875, 0.1505126953125, 0.15943145751953125, 0.1683502197265625, 0.17726898193359375, 0.186187744140625, 0.19510650634765625, 0.2040252685546875, 0.21294403076171875, 0.22186279296875, 0.23078155517578125, 0.2397003173828125, 0.24861907958984375, 0.257537841796875, 0.26645660400390625, 0.2753753662109375, 0.28429412841796875, 0.293212890625]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 5.0, 6.0, 7.0, 4.0, 12.0, 12.0, 6.0, 17.0, 20.0, 20.0, 29.0, 24.0, 28.0, 41.0, 45.0, 53.0, 68.0, 105.0, 78.0, 63.0, 49.0, 54.0, 45.0, 29.0, 27.0, 23.0, 21.0, 15.0, 23.0, 13.0, 13.0, 6.0, 7.0, 10.0, 2.0, 6.0, 3.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.109130859375, -0.10571479797363281, -0.10229873657226562, -0.09888267517089844, -0.09546661376953125, -0.09205055236816406, -0.08863449096679688, -0.08521842956542969, -0.0818023681640625, -0.07838630676269531, -0.07497024536132812, -0.07155418395996094, -0.06813812255859375, -0.06472206115722656, -0.061305999755859375, -0.05788993835449219, -0.054473876953125, -0.05105781555175781, -0.047641754150390625, -0.04422569274902344, -0.04080963134765625, -0.03739356994628906, -0.033977508544921875, -0.030561447143554688, -0.0271453857421875, -0.023729324340820312, -0.020313262939453125, -0.016897201538085938, -0.01348114013671875, -0.010065078735351562, -0.006649017333984375, -0.0032329559326171875, 0.00018310546875, 0.0035991668701171875, 0.007015228271484375, 0.010431289672851562, 0.01384735107421875, 0.017263412475585938, 0.020679473876953125, 0.024095535278320312, 0.0275115966796875, 0.030927658081054688, 0.034343719482421875, 0.03775978088378906, 0.04117584228515625, 0.04459190368652344, 0.048007965087890625, 0.05142402648925781, 0.054840087890625, 0.05825614929199219, 0.061672210693359375, 0.06508827209472656, 0.06850433349609375, 0.07192039489746094, 0.07533645629882812, 0.07875251770019531, 0.0821685791015625, 0.08558464050292969, 0.08900070190429688, 0.09241676330566406, 0.09583282470703125, 0.09924888610839844, 0.10266494750976562, 0.10608100891113281, 0.1094970703125]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 9.0, 3.0, 4.0, 5.0, 5.0, 5.0, 9.0, 3.0, 9.0, 10.0, 14.0, 24.0, 28.0, 27.0, 33.0, 42.0, 47.0, 49.0, 47.0, 55.0, 54.0, 51.0, 43.0, 52.0, 47.0, 38.0, 40.0, 41.0, 32.0, 32.0, 18.0, 29.0, 21.0, 20.0, 11.0, 3.0, 7.0, 9.0, 7.0, 6.0, 2.0, 2.0, 3.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.881986618041992, -16.272443771362305, -15.6628999710083, -15.053356170654297, -14.44381332397461, -13.834270477294922, -13.224726676940918, -12.615182876586914, -12.005640029907227, -11.396097183227539, -10.786553382873535, -10.177009582519531, -9.567466735839844, -8.957923889160156, -8.348380088806152, -7.738836765289307, -7.129293441772461, -6.519750118255615, -5.9102067947387695, -5.300663471221924, -4.691120147705078, -4.081576824188232, -3.4720335006713867, -2.862490177154541, -2.2529468536376953, -1.6434035301208496, -1.033860206604004, -0.4243168830871582, 0.1852264404296875, 0.7947697639465332, 1.404313087463379, 2.0138564109802246, 2.6233997344970703, 3.232943058013916, 3.8424863815307617, 4.452029705047607, 5.061573028564453, 5.671116352081299, 6.2806596755981445, 6.89020299911499, 7.499746322631836, 8.109289169311523, 8.718832969665527, 9.328376770019531, 9.937919616699219, 10.547462463378906, 11.15700626373291, 11.766550064086914, 12.376092910766602, 12.985635757446289, 13.595179557800293, 14.204723358154297, 14.814266204833984, 15.423809051513672, 16.03335189819336, 16.64289665222168, 17.252439498901367, 17.861982345581055, 18.471527099609375, 19.081069946289062, 19.69061279296875, 20.300155639648438, 20.909698486328125, 21.519243240356445, 22.128786087036133]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 2.0, 7.0, 8.0, 4.0, 12.0, 10.0, 16.0, 15.0, 17.0, 24.0, 20.0, 28.0, 27.0, 27.0, 42.0, 29.0, 33.0, 39.0, 55.0, 40.0, 37.0, 44.0, 32.0, 32.0, 41.0, 49.0, 33.0, 33.0, 33.0, 32.0, 23.0, 23.0, 20.0, 20.0, 19.0, 10.0, 16.0, 16.0, 9.0, 7.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-17.1890926361084, -16.683774948120117, -16.178455352783203, -15.673136711120605, -15.167818069458008, -14.66249942779541, -14.157180786132812, -13.651863098144531, -13.146543502807617, -12.64122486114502, -12.135906219482422, -11.630587577819824, -11.125268936157227, -10.619950294494629, -10.114631652832031, -9.60931396484375, -9.103995323181152, -8.598676681518555, -8.093358039855957, -7.588039398193359, -7.082720756530762, -6.577402114868164, -6.072083950042725, -5.566765308380127, -5.061446666717529, -4.556128025054932, -4.050809383392334, -3.5454909801483154, -3.0401723384857178, -2.53485369682312, -2.0295352935791016, -1.524216651916504, -1.0188989639282227, -0.5135803818702698, -0.008261799812316895, 0.4970567226409912, 1.0023753643035889, 1.5076940059661865, 2.013012409210205, 2.5183310508728027, 3.0236496925354004, 3.528968334197998, 4.034286975860596, 4.539605140686035, 5.044923782348633, 5.5502424240112305, 6.055561065673828, 6.560879707336426, 7.066198348999023, 7.571516990661621, 8.076835632324219, 8.582154273986816, 9.087472915649414, 9.592791557312012, 10.09811019897461, 10.60342788696289, 11.108747482299805, 11.614066123962402, 12.119384765625, 12.624703407287598, 13.130022048950195, 13.635340690612793, 14.14065933227539, 14.645977020263672, 15.15129566192627]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 2.0, 5.0, 6.0, 5.0, 8.0, 17.0, 27.0, 43.0, 63.0, 84.0, 134.0, 236.0, 347.0, 566.0, 880.0, 1474.0, 2393.0, 4095.0, 6780.0, 11571.0, 19537.0, 33632.0, 55868.0, 87742.0, 124899.0, 153289.0, 157089.0, 132773.0, 97563.0, 63177.0, 38549.0, 22782.0, 13367.0, 7742.0, 4515.0, 2783.0, 1662.0, 1062.0, 655.0, 383.0, 261.0, 170.0, 110.0, 73.0, 48.0, 33.0, 19.0, 16.0, 8.0, 6.0, 9.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-11.0625, -10.6827392578125, -10.302978515625, -9.9232177734375, -9.54345703125, -9.1636962890625, -8.783935546875, -8.4041748046875, -8.0244140625, -7.6446533203125, -7.264892578125, -6.8851318359375, -6.50537109375, -6.1256103515625, -5.745849609375, -5.3660888671875, -4.986328125, -4.6065673828125, -4.226806640625, -3.8470458984375, -3.46728515625, -3.0875244140625, -2.707763671875, -2.3280029296875, -1.9482421875, -1.5684814453125, -1.188720703125, -0.8089599609375, -0.42919921875, -0.0494384765625, 0.330322265625, 0.7100830078125, 1.08984375, 1.4696044921875, 1.849365234375, 2.2291259765625, 2.60888671875, 2.9886474609375, 3.368408203125, 3.7481689453125, 4.1279296875, 4.5076904296875, 4.887451171875, 5.2672119140625, 5.64697265625, 6.0267333984375, 6.406494140625, 6.7862548828125, 7.166015625, 7.5457763671875, 7.925537109375, 8.3052978515625, 8.68505859375, 9.0648193359375, 9.444580078125, 9.8243408203125, 10.2041015625, 10.5838623046875, 10.963623046875, 11.3433837890625, 11.72314453125, 12.1029052734375, 12.482666015625, 12.8624267578125, 13.2421875]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 8.0, 3.0, 3.0, 6.0, 7.0, 11.0, 12.0, 12.0, 18.0, 14.0, 21.0, 26.0, 23.0, 31.0, 36.0, 42.0, 44.0, 46.0, 40.0, 47.0, 48.0, 52.0, 34.0, 45.0, 33.0, 40.0, 53.0, 38.0, 27.0, 33.0, 29.0, 27.0, 22.0, 18.0, 10.0, 15.0, 11.0, 4.0, 8.0, 4.0, 6.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-21.703125, -21.10498046875, -20.5068359375, -19.90869140625, -19.310546875, -18.71240234375, -18.1142578125, -17.51611328125, -16.91796875, -16.31982421875, -15.7216796875, -15.12353515625, -14.525390625, -13.92724609375, -13.3291015625, -12.73095703125, -12.1328125, -11.53466796875, -10.9365234375, -10.33837890625, -9.740234375, -9.14208984375, -8.5439453125, -7.94580078125, -7.34765625, -6.74951171875, -6.1513671875, -5.55322265625, -4.955078125, -4.35693359375, -3.7587890625, -3.16064453125, -2.5625, -1.96435546875, -1.3662109375, -0.76806640625, -0.169921875, 0.42822265625, 1.0263671875, 1.62451171875, 2.22265625, 2.82080078125, 3.4189453125, 4.01708984375, 4.615234375, 5.21337890625, 5.8115234375, 6.40966796875, 7.0078125, 7.60595703125, 8.2041015625, 8.80224609375, 9.400390625, 9.99853515625, 10.5966796875, 11.19482421875, 11.79296875, 12.39111328125, 12.9892578125, 13.58740234375, 14.185546875, 14.78369140625, 15.3818359375, 15.97998046875, 16.578125]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 8.0, 15.0, 21.0, 17.0, 38.0, 45.0, 70.0, 117.0, 169.0, 269.0, 370.0, 589.0, 910.0, 1438.0, 2213.0, 3322.0, 5385.0, 8468.0, 13838.0, 22535.0, 35893.0, 57086.0, 85750.0, 116882.0, 140339.0, 144939.0, 127705.0, 97498.0, 67221.0, 43339.0, 27101.0, 16668.0, 10334.0, 6376.0, 4156.0, 2511.0, 1670.0, 1121.0, 737.0, 478.0, 289.0, 202.0, 150.0, 111.0, 66.0, 33.0, 22.0, 17.0, 13.0, 12.0, 6.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.15625, -11.7900390625, -11.423828125, -11.0576171875, -10.69140625, -10.3251953125, -9.958984375, -9.5927734375, -9.2265625, -8.8603515625, -8.494140625, -8.1279296875, -7.76171875, -7.3955078125, -7.029296875, -6.6630859375, -6.296875, -5.9306640625, -5.564453125, -5.1982421875, -4.83203125, -4.4658203125, -4.099609375, -3.7333984375, -3.3671875, -3.0009765625, -2.634765625, -2.2685546875, -1.90234375, -1.5361328125, -1.169921875, -0.8037109375, -0.4375, -0.0712890625, 0.294921875, 0.6611328125, 1.02734375, 1.3935546875, 1.759765625, 2.1259765625, 2.4921875, 2.8583984375, 3.224609375, 3.5908203125, 3.95703125, 4.3232421875, 4.689453125, 5.0556640625, 5.421875, 5.7880859375, 6.154296875, 6.5205078125, 6.88671875, 7.2529296875, 7.619140625, 7.9853515625, 8.3515625, 8.7177734375, 9.083984375, 9.4501953125, 9.81640625, 10.1826171875, 10.548828125, 10.9150390625, 11.28125]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 5.0, 0.0, 7.0, 9.0, 6.0, 9.0, 16.0, 8.0, 21.0, 17.0, 21.0, 13.0, 28.0, 29.0, 31.0, 35.0, 39.0, 34.0, 38.0, 31.0, 38.0, 43.0, 44.0, 50.0, 34.0, 30.0, 36.0, 41.0, 40.0, 34.0, 25.0, 23.0, 26.0, 17.0, 25.0, 18.0, 18.0, 12.0, 8.0, 13.0, 5.0, 13.0, 6.0, 3.0, 3.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.6171875, -10.295166015625, -9.97314453125, -9.651123046875, -9.3291015625, -9.007080078125, -8.68505859375, -8.363037109375, -8.041015625, -7.718994140625, -7.39697265625, -7.074951171875, -6.7529296875, -6.430908203125, -6.10888671875, -5.786865234375, -5.46484375, -5.142822265625, -4.82080078125, -4.498779296875, -4.1767578125, -3.854736328125, -3.53271484375, -3.210693359375, -2.888671875, -2.566650390625, -2.24462890625, -1.922607421875, -1.6005859375, -1.278564453125, -0.95654296875, -0.634521484375, -0.3125, 0.009521484375, 0.33154296875, 0.653564453125, 0.9755859375, 1.297607421875, 1.61962890625, 1.941650390625, 2.263671875, 2.585693359375, 2.90771484375, 3.229736328125, 3.5517578125, 3.873779296875, 4.19580078125, 4.517822265625, 4.83984375, 5.161865234375, 5.48388671875, 5.805908203125, 6.1279296875, 6.449951171875, 6.77197265625, 7.093994140625, 7.416015625, 7.738037109375, 8.06005859375, 8.382080078125, 8.7041015625, 9.026123046875, 9.34814453125, 9.670166015625, 9.9921875]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 3.0, 8.0, 8.0, 5.0, 9.0, 17.0, 18.0, 26.0, 50.0, 60.0, 109.0, 153.0, 241.0, 362.0, 590.0, 1074.0, 1961.0, 3703.0, 7298.0, 14531.0, 29762.0, 57882.0, 100495.0, 148978.0, 180966.0, 175656.0, 136939.0, 87976.0, 49334.0, 24817.0, 12212.0, 6040.0, 3153.0, 1648.0, 893.0, 531.0, 348.0, 236.0, 163.0, 84.0, 64.0, 48.0, 33.0, 23.0, 14.0, 9.0, 10.0, 6.0, 5.0, 1.0, 6.0, 2.0, 1.0, 1.0, 2.0], "bins": [-5.69140625, -5.52337646484375, -5.3553466796875, -5.18731689453125, -5.019287109375, -4.85125732421875, -4.6832275390625, -4.51519775390625, -4.34716796875, -4.17913818359375, -4.0111083984375, -3.84307861328125, -3.675048828125, -3.50701904296875, -3.3389892578125, -3.17095947265625, -3.0029296875, -2.83489990234375, -2.6668701171875, -2.49884033203125, -2.330810546875, -2.16278076171875, -1.9947509765625, -1.82672119140625, -1.65869140625, -1.49066162109375, -1.3226318359375, -1.15460205078125, -0.986572265625, -0.81854248046875, -0.6505126953125, -0.48248291015625, -0.314453125, -0.14642333984375, 0.0216064453125, 0.18963623046875, 0.357666015625, 0.52569580078125, 0.6937255859375, 0.86175537109375, 1.02978515625, 1.19781494140625, 1.3658447265625, 1.53387451171875, 1.701904296875, 1.86993408203125, 2.0379638671875, 2.20599365234375, 2.3740234375, 2.54205322265625, 2.7100830078125, 2.87811279296875, 3.046142578125, 3.21417236328125, 3.3822021484375, 3.55023193359375, 3.71826171875, 3.88629150390625, 4.0543212890625, 4.22235107421875, 4.390380859375, 4.55841064453125, 4.7264404296875, 4.89447021484375, 5.0625]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 6.0, 5.0, 4.0, 4.0, 9.0, 10.0, 9.0, 11.0, 15.0, 23.0, 34.0, 36.0, 44.0, 29.0, 53.0, 43.0, 37.0, 38.0, 49.0, 54.0, 52.0, 50.0, 45.0, 37.0, 43.0, 38.0, 31.0, 30.0, 34.0, 34.0, 8.0, 23.0, 7.0, 15.0, 7.0, 12.0, 6.0, 5.0, 4.0, 3.0, 2.0, 6.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0004444122314453125, -0.00043026357889175415, -0.0004161149263381958, -0.00040196627378463745, -0.0003878176212310791, -0.00037366896867752075, -0.0003595203161239624, -0.00034537166357040405, -0.0003312230110168457, -0.00031707435846328735, -0.000302925705909729, -0.00028877705335617065, -0.0002746284008026123, -0.00026047974824905396, -0.0002463310956954956, -0.00023218244314193726, -0.0002180337905883789, -0.00020388513803482056, -0.0001897364854812622, -0.00017558783292770386, -0.0001614391803741455, -0.00014729052782058716, -0.0001331418752670288, -0.00011899322271347046, -0.00010484457015991211, -9.069591760635376e-05, -7.654726505279541e-05, -6.239861249923706e-05, -4.824995994567871e-05, -3.410130739212036e-05, -1.9952654838562012e-05, -5.804002285003662e-06, 8.344650268554688e-06, 2.2493302822113037e-05, 3.664195537567139e-05, 5.0790607929229736e-05, 6.493926048278809e-05, 7.908791303634644e-05, 9.323656558990479e-05, 0.00010738521814346313, 0.00012153387069702148, 0.00013568252325057983, 0.00014983117580413818, 0.00016397982835769653, 0.00017812848091125488, 0.00019227713346481323, 0.00020642578601837158, 0.00022057443857192993, 0.00023472309112548828, 0.00024887174367904663, 0.000263020396232605, 0.00027716904878616333, 0.0002913177013397217, 0.00030546635389328003, 0.0003196150064468384, 0.00033376365900039673, 0.0003479123115539551, 0.00036206096410751343, 0.0003762096166610718, 0.0003903582692146301, 0.0004045069217681885, 0.0004186555743217468, 0.0004328042268753052, 0.0004469528794288635, 0.0004611015319824219]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 7.0, 3.0, 6.0, 11.0, 18.0, 18.0, 35.0, 38.0, 72.0, 112.0, 169.0, 235.0, 350.0, 520.0, 825.0, 1340.0, 2180.0, 3889.0, 7313.0, 14153.0, 27024.0, 50817.0, 86958.0, 131690.0, 167032.0, 172223.0, 145533.0, 102361.0, 61666.0, 33654.0, 17591.0, 8820.0, 4870.0, 2608.0, 1561.0, 971.0, 656.0, 418.0, 257.0, 180.0, 121.0, 79.0, 68.0, 43.0, 24.0, 14.0, 12.0, 6.0, 12.0, 1.0, 3.0, 3.0, 1.0], "bins": [-5.9140625, -5.75054931640625, -5.5870361328125, -5.42352294921875, -5.260009765625, -5.09649658203125, -4.9329833984375, -4.76947021484375, -4.60595703125, -4.44244384765625, -4.2789306640625, -4.11541748046875, -3.951904296875, -3.78839111328125, -3.6248779296875, -3.46136474609375, -3.2978515625, -3.13433837890625, -2.9708251953125, -2.80731201171875, -2.643798828125, -2.48028564453125, -2.3167724609375, -2.15325927734375, -1.98974609375, -1.82623291015625, -1.6627197265625, -1.49920654296875, -1.335693359375, -1.17218017578125, -1.0086669921875, -0.84515380859375, -0.681640625, -0.51812744140625, -0.3546142578125, -0.19110107421875, -0.027587890625, 0.13592529296875, 0.2994384765625, 0.46295166015625, 0.62646484375, 0.78997802734375, 0.9534912109375, 1.11700439453125, 1.280517578125, 1.44403076171875, 1.6075439453125, 1.77105712890625, 1.9345703125, 2.09808349609375, 2.2615966796875, 2.42510986328125, 2.588623046875, 2.75213623046875, 2.9156494140625, 3.07916259765625, 3.24267578125, 3.40618896484375, 3.5697021484375, 3.73321533203125, 3.896728515625, 4.06024169921875, 4.2237548828125, 4.38726806640625, 4.55078125]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 4.0, 3.0, 7.0, 10.0, 12.0, 8.0, 14.0, 18.0, 25.0, 29.0, 18.0, 26.0, 39.0, 33.0, 37.0, 43.0, 51.0, 52.0, 47.0, 40.0, 56.0, 43.0, 47.0, 36.0, 40.0, 37.0, 25.0, 42.0, 30.0, 19.0, 22.0, 26.0, 14.0, 14.0, 13.0, 7.0, 5.0, 5.0, 4.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.59375, -1.5487518310546875, -1.503753662109375, -1.4587554931640625, -1.41375732421875, -1.3687591552734375, -1.323760986328125, -1.2787628173828125, -1.2337646484375, -1.1887664794921875, -1.143768310546875, -1.0987701416015625, -1.05377197265625, -1.0087738037109375, -0.963775634765625, -0.9187774658203125, -0.873779296875, -0.8287811279296875, -0.783782958984375, -0.7387847900390625, -0.69378662109375, -0.6487884521484375, -0.603790283203125, -0.5587921142578125, -0.5137939453125, -0.4687957763671875, -0.423797607421875, -0.3787994384765625, -0.33380126953125, -0.2888031005859375, -0.243804931640625, -0.1988067626953125, -0.15380859375, -0.1088104248046875, -0.063812255859375, -0.0188140869140625, 0.02618408203125, 0.0711822509765625, 0.116180419921875, 0.1611785888671875, 0.2061767578125, 0.2511749267578125, 0.296173095703125, 0.3411712646484375, 0.38616943359375, 0.4311676025390625, 0.476165771484375, 0.5211639404296875, 0.566162109375, 0.6111602783203125, 0.656158447265625, 0.7011566162109375, 0.74615478515625, 0.7911529541015625, 0.836151123046875, 0.8811492919921875, 0.9261474609375, 0.9711456298828125, 1.016143798828125, 1.0611419677734375, 1.10614013671875, 1.1511383056640625, 1.196136474609375, 1.2411346435546875, 1.2861328125]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 3.0, 5.0, 2.0, 3.0, 5.0, 1.0, 5.0, 4.0, 2.0, 5.0, 6.0, 8.0, 5.0, 12.0, 11.0, 17.0, 24.0, 22.0, 28.0, 27.0, 40.0, 39.0, 41.0, 52.0, 48.0, 45.0, 52.0, 54.0, 48.0, 40.0, 42.0, 32.0, 32.0, 38.0, 28.0, 27.0, 27.0, 27.0, 27.0, 15.0, 9.0, 6.0, 7.0, 9.0, 10.0, 6.0, 8.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.337387084960938, -15.75629997253418, -15.175212860107422, -14.594124794006348, -14.01303768157959, -13.431950569152832, -12.850862503051758, -12.269775390625, -11.688688278198242, -11.107601165771484, -10.526514053344727, -9.945425987243652, -9.364338874816895, -8.783251762390137, -8.202163696289062, -7.621076583862305, -7.039989471435547, -6.458902359008789, -5.877814769744873, -5.296727180480957, -4.715640068054199, -4.134552955627441, -3.5534653663635254, -2.9723777770996094, -2.3912906646728516, -1.8102033138275146, -1.2291159629821777, -0.6480286121368408, -0.0669412612915039, 0.514146089553833, 1.09523344039917, 1.676321029663086, 2.2574081420898438, 2.8384954929351807, 3.4195828437805176, 4.000670433044434, 4.581757545471191, 5.162844657897949, 5.743932247161865, 6.325019836425781, 6.906106948852539, 7.487194061279297, 8.068281173706055, 8.649369239807129, 9.230456352233887, 9.811543464660645, 10.392631530761719, 10.973718643188477, 11.554805755615234, 12.135892868041992, 12.71697998046875, 13.298068046569824, 13.879155158996582, 14.46024227142334, 15.041330337524414, 15.622417449951172, 16.20350456237793, 16.784591674804688, 17.365678787231445, 17.946765899658203, 18.527854919433594, 19.10894203186035, 19.69002914428711, 20.271116256713867, 20.852203369140625]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 1.0, 3.0, 3.0, 5.0, 3.0, 8.0, 3.0, 10.0, 11.0, 11.0, 5.0, 26.0, 9.0, 21.0, 27.0, 34.0, 27.0, 32.0, 27.0, 34.0, 35.0, 47.0, 39.0, 38.0, 35.0, 30.0, 37.0, 41.0, 41.0, 46.0, 36.0, 31.0, 29.0, 29.0, 25.0, 30.0, 29.0, 19.0, 13.0, 12.0, 17.0, 12.0, 8.0, 3.0, 4.0, 8.0, 7.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-19.28630256652832, -18.7386474609375, -18.19099235534668, -17.64333724975586, -17.09568214416504, -16.54802703857422, -16.0003719329834, -15.452717781066895, -14.905062675476074, -14.357407569885254, -13.809752464294434, -13.262097358703613, -12.71444320678711, -12.166788101196289, -11.619132995605469, -11.071477890014648, -10.523822784423828, -9.976167678833008, -9.428512573242188, -8.880857467651367, -8.333202362060547, -7.785547733306885, -7.237893104553223, -6.690237998962402, -6.142582893371582, -5.594927787780762, -5.047272682189941, -4.499618053436279, -3.951962947845459, -3.4043078422546387, -2.8566529750823975, -2.3089981079101562, -1.7613439559936523, -1.2136889696121216, -0.6660339832305908, -0.11837899684906006, 0.4292759895324707, 0.976931095123291, 1.5245859622955322, 2.0722408294677734, 2.6198959350585938, 3.167551040649414, 3.7152059078216553, 4.2628607749938965, 4.810515880584717, 5.358170986175537, 5.905825614929199, 6.4534807205200195, 7.00113582611084, 7.54879093170166, 8.09644603729248, 8.6441011428833, 9.191755294799805, 9.739410400390625, 10.287065505981445, 10.834720611572266, 11.382375717163086, 11.930030822753906, 12.477685928344727, 13.025341033935547, 13.572996139526367, 14.120651245117188, 14.668305397033691, 15.215960502624512, 15.763615608215332]}, "gradients/decoder.bert.encoder.layer.0.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 7.0, 6.0, 14.0, 17.0, 16.0, 27.0, 51.0, 83.0, 127.0, 198.0, 306.0, 504.0, 794.0, 1329.0, 2218.0, 3601.0, 5899.0, 10121.0, 17558.0, 30998.0, 54264.0, 97833.0, 176428.0, 316677.0, 539700.0, 787285.0, 802846.0, 572775.0, 340993.0, 191536.0, 106261.0, 58482.0, 32942.0, 18074.0, 10239.0, 5847.0, 3368.0, 1966.0, 1175.0, 701.0, 394.0, 247.0, 145.0, 95.0, 48.0, 42.0, 21.0, 20.0, 5.0, 7.0, 6.0, 2.0, 0.0, 0.0, 1.0], "bins": [-27.15625, -26.381591796875, -25.60693359375, -24.832275390625, -24.0576171875, -23.282958984375, -22.50830078125, -21.733642578125, -20.958984375, -20.184326171875, -19.40966796875, -18.635009765625, -17.8603515625, -17.085693359375, -16.31103515625, -15.536376953125, -14.76171875, -13.987060546875, -13.21240234375, -12.437744140625, -11.6630859375, -10.888427734375, -10.11376953125, -9.339111328125, -8.564453125, -7.789794921875, -7.01513671875, -6.240478515625, -5.4658203125, -4.691162109375, -3.91650390625, -3.141845703125, -2.3671875, -1.592529296875, -0.81787109375, -0.043212890625, 0.7314453125, 1.506103515625, 2.28076171875, 3.055419921875, 3.830078125, 4.604736328125, 5.37939453125, 6.154052734375, 6.9287109375, 7.703369140625, 8.47802734375, 9.252685546875, 10.02734375, 10.802001953125, 11.57666015625, 12.351318359375, 13.1259765625, 13.900634765625, 14.67529296875, 15.449951171875, 16.224609375, 16.999267578125, 17.77392578125, 18.548583984375, 19.3232421875, 20.097900390625, 20.87255859375, 21.647216796875, 22.421875]}, "gradients/decoder.bert.encoder.layer.0.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 2.0, 3.0, 4.0, 2.0, 8.0, 10.0, 10.0, 14.0, 14.0, 8.0, 26.0, 31.0, 24.0, 26.0, 22.0, 34.0, 50.0, 32.0, 42.0, 35.0, 48.0, 41.0, 45.0, 37.0, 45.0, 47.0, 37.0, 36.0, 31.0, 29.0, 28.0, 30.0, 22.0, 24.0, 22.0, 16.0, 12.0, 9.0, 10.0, 10.0, 10.0, 1.0, 5.0, 2.0, 2.0, 4.0, 3.0, 1.0, 2.0, 1.0], "bins": [-20.4375, -19.8717041015625, -19.305908203125, -18.7401123046875, -18.17431640625, -17.6085205078125, -17.042724609375, -16.4769287109375, -15.9111328125, -15.3453369140625, -14.779541015625, -14.2137451171875, -13.64794921875, -13.0821533203125, -12.516357421875, -11.9505615234375, -11.384765625, -10.8189697265625, -10.253173828125, -9.6873779296875, -9.12158203125, -8.5557861328125, -7.989990234375, -7.4241943359375, -6.8583984375, -6.2926025390625, -5.726806640625, -5.1610107421875, -4.59521484375, -4.0294189453125, -3.463623046875, -2.8978271484375, -2.33203125, -1.7662353515625, -1.200439453125, -0.6346435546875, -0.06884765625, 0.4969482421875, 1.062744140625, 1.6285400390625, 2.1943359375, 2.7601318359375, 3.325927734375, 3.8917236328125, 4.45751953125, 5.0233154296875, 5.589111328125, 6.1549072265625, 6.720703125, 7.2864990234375, 7.852294921875, 8.4180908203125, 8.98388671875, 9.5496826171875, 10.115478515625, 10.6812744140625, 11.2470703125, 11.8128662109375, 12.378662109375, 12.9444580078125, 13.51025390625, 14.0760498046875, 14.641845703125, 15.2076416015625, 15.7734375]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 4.0, 8.0, 12.0, 28.0, 40.0, 58.0, 117.0, 183.0, 282.0, 496.0, 808.0, 1320.0, 2297.0, 3962.0, 6737.0, 11175.0, 19033.0, 33323.0, 57301.0, 98180.0, 166406.0, 275214.0, 427345.0, 597457.0, 694662.0, 620329.0, 450899.0, 292956.0, 179407.0, 105929.0, 61851.0, 35940.0, 21100.0, 12030.0, 7061.0, 4256.0, 2529.0, 1431.0, 855.0, 503.0, 305.0, 176.0, 115.0, 67.0, 47.0, 29.0, 11.0, 7.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-28.546875, -27.67041015625, -26.7939453125, -25.91748046875, -25.041015625, -24.16455078125, -23.2880859375, -22.41162109375, -21.53515625, -20.65869140625, -19.7822265625, -18.90576171875, -18.029296875, -17.15283203125, -16.2763671875, -15.39990234375, -14.5234375, -13.64697265625, -12.7705078125, -11.89404296875, -11.017578125, -10.14111328125, -9.2646484375, -8.38818359375, -7.51171875, -6.63525390625, -5.7587890625, -4.88232421875, -4.005859375, -3.12939453125, -2.2529296875, -1.37646484375, -0.5, 0.37646484375, 1.2529296875, 2.12939453125, 3.005859375, 3.88232421875, 4.7587890625, 5.63525390625, 6.51171875, 7.38818359375, 8.2646484375, 9.14111328125, 10.017578125, 10.89404296875, 11.7705078125, 12.64697265625, 13.5234375, 14.39990234375, 15.2763671875, 16.15283203125, 17.029296875, 17.90576171875, 18.7822265625, 19.65869140625, 20.53515625, 21.41162109375, 22.2880859375, 23.16455078125, 24.041015625, 24.91748046875, 25.7939453125, 26.67041015625, 27.546875]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 2.0, 10.0, 10.0, 10.0, 16.0, 14.0, 29.0, 37.0, 35.0, 58.0, 73.0, 96.0, 107.0, 148.0, 156.0, 186.0, 212.0, 215.0, 261.0, 269.0, 295.0, 260.0, 257.0, 214.0, 200.0, 182.0, 126.0, 122.0, 103.0, 82.0, 61.0, 53.0, 41.0, 24.0, 33.0, 18.0, 19.0, 12.0, 10.0, 7.0, 5.0, 2.0, 1.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.0078125, -9.6409912109375, -9.274169921875, -8.9073486328125, -8.54052734375, -8.1737060546875, -7.806884765625, -7.4400634765625, -7.0732421875, -6.7064208984375, -6.339599609375, -5.9727783203125, -5.60595703125, -5.2391357421875, -4.872314453125, -4.5054931640625, -4.138671875, -3.7718505859375, -3.405029296875, -3.0382080078125, -2.67138671875, -2.3045654296875, -1.937744140625, -1.5709228515625, -1.2041015625, -0.8372802734375, -0.470458984375, -0.1036376953125, 0.26318359375, 0.6300048828125, 0.996826171875, 1.3636474609375, 1.73046875, 2.0972900390625, 2.464111328125, 2.8309326171875, 3.19775390625, 3.5645751953125, 3.931396484375, 4.2982177734375, 4.6650390625, 5.0318603515625, 5.398681640625, 5.7655029296875, 6.13232421875, 6.4991455078125, 6.865966796875, 7.2327880859375, 7.599609375, 7.9664306640625, 8.333251953125, 8.7000732421875, 9.06689453125, 9.4337158203125, 9.800537109375, 10.1673583984375, 10.5341796875, 10.9010009765625, 11.267822265625, 11.6346435546875, 12.00146484375, 12.3682861328125, 12.735107421875, 13.1019287109375, 13.46875]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 1.0, 2.0, 4.0, 4.0, 5.0, 8.0, 10.0, 12.0, 21.0, 17.0, 32.0, 29.0, 30.0, 30.0, 48.0, 41.0, 60.0, 67.0, 45.0, 56.0, 52.0, 59.0, 53.0, 39.0, 37.0, 46.0, 29.0, 28.0, 24.0, 19.0, 11.0, 12.0, 14.0, 15.0, 11.0, 7.0, 10.0, 2.0, 3.0, 2.0, 2.0, 1.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-35.99288558959961, -34.824806213378906, -33.65673065185547, -32.488651275634766, -31.320575714111328, -30.152496337890625, -28.984418869018555, -27.816341400146484, -26.648263931274414, -25.480186462402344, -24.312108993530273, -23.144031524658203, -21.9759521484375, -20.807876586914062, -19.63979721069336, -18.47171974182129, -17.30364227294922, -16.13556480407715, -14.967487335205078, -13.799408912658691, -12.631331443786621, -11.46325397491455, -10.295175552368164, -9.127098083496094, -7.959020614624023, -6.790943145751953, -5.622865200042725, -4.454787254333496, -3.286709785461426, -2.1186323165893555, -0.950554370880127, 0.21752357482910156, 1.3855972290039062, 2.5536749362945557, 3.721752643585205, 4.889830589294434, 6.057908058166504, 7.225985527038574, 8.394063949584961, 9.562141418457031, 10.730218887329102, 11.898296356201172, 13.066373825073242, 14.234452247619629, 15.4025297164917, 16.570606231689453, 17.738685607910156, 18.906763076782227, 20.074840545654297, 21.242918014526367, 22.410995483398438, 23.579072952270508, 24.747150421142578, 25.91522979736328, 27.08330726623535, 28.251384735107422, 29.419462203979492, 30.587539672851562, 31.755617141723633, 32.9236946105957, 34.091773986816406, 35.259849548339844, 36.42792892456055, 37.59600830078125, 38.76408386230469]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 6.0, 9.0, 6.0, 8.0, 7.0, 4.0, 15.0, 7.0, 9.0, 21.0, 22.0, 21.0, 17.0, 24.0, 28.0, 35.0, 40.0, 33.0, 24.0, 43.0, 34.0, 37.0, 31.0, 41.0, 46.0, 53.0, 32.0, 48.0, 28.0, 31.0, 31.0, 29.0, 25.0, 21.0, 21.0, 18.0, 15.0, 13.0, 17.0, 10.0, 8.0, 6.0, 6.0, 8.0, 4.0, 2.0, 5.0, 2.0, 4.0, 2.0, 1.0], "bins": [-29.682016372680664, -28.85281753540039, -28.023616790771484, -27.19441795349121, -26.365219116210938, -25.536020278930664, -24.70682144165039, -23.877620697021484, -23.04842185974121, -22.219223022460938, -21.39002227783203, -20.560823440551758, -19.731624603271484, -18.90242576599121, -18.073226928710938, -17.24402618408203, -16.414827346801758, -15.585628509521484, -14.756428718566895, -13.927228927612305, -13.098030090332031, -12.268831253051758, -11.439631462097168, -10.610431671142578, -9.781232833862305, -8.952033996582031, -8.122834205627441, -7.29363489151001, -6.464435577392578, -5.6352362632751465, -4.806036949157715, -3.976837635040283, -3.1476364135742188, -2.318437099456787, -1.4892377853393555, -0.6600384712219238, 0.1691608428955078, 0.9983601570129395, 1.827559471130371, 2.6567587852478027, 3.4859580993652344, 4.315157413482666, 5.144356727600098, 5.973556041717529, 6.802755355834961, 7.631954669952393, 8.461153984069824, 9.290353775024414, 10.119552612304688, 10.948751449584961, 11.77795124053955, 12.60715103149414, 13.436349868774414, 14.265548706054688, 15.094748497009277, 15.923948287963867, 16.75314712524414, 17.582345962524414, 18.411544799804688, 19.240745544433594, 20.069944381713867, 20.89914321899414, 21.728343963623047, 22.55754280090332, 23.386741638183594]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 8.0, 8.0, 12.0, 7.0, 26.0, 34.0, 55.0, 73.0, 102.0, 141.0, 202.0, 301.0, 402.0, 611.0, 980.0, 1427.0, 2123.0, 3283.0, 5122.0, 8062.0, 13237.0, 21178.0, 35819.0, 60171.0, 103331.0, 168774.0, 217170.0, 161682.0, 97995.0, 57549.0, 33793.0, 20313.0, 12445.0, 7705.0, 4905.0, 3179.0, 2189.0, 1375.0, 909.0, 583.0, 404.0, 265.0, 180.0, 126.0, 80.0, 67.0, 52.0, 33.0, 24.0, 19.0, 7.0, 11.0, 11.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.91015625, -4.7489013671875, -4.587646484375, -4.4263916015625, -4.26513671875, -4.1038818359375, -3.942626953125, -3.7813720703125, -3.6201171875, -3.4588623046875, -3.297607421875, -3.1363525390625, -2.97509765625, -2.8138427734375, -2.652587890625, -2.4913330078125, -2.330078125, -2.1688232421875, -2.007568359375, -1.8463134765625, -1.68505859375, -1.5238037109375, -1.362548828125, -1.2012939453125, -1.0400390625, -0.8787841796875, -0.717529296875, -0.5562744140625, -0.39501953125, -0.2337646484375, -0.072509765625, 0.0887451171875, 0.25, 0.4112548828125, 0.572509765625, 0.7337646484375, 0.89501953125, 1.0562744140625, 1.217529296875, 1.3787841796875, 1.5400390625, 1.7012939453125, 1.862548828125, 2.0238037109375, 2.18505859375, 2.3463134765625, 2.507568359375, 2.6688232421875, 2.830078125, 2.9913330078125, 3.152587890625, 3.3138427734375, 3.47509765625, 3.6363525390625, 3.797607421875, 3.9588623046875, 4.1201171875, 4.2813720703125, 4.442626953125, 4.6038818359375, 4.76513671875, 4.9263916015625, 5.087646484375, 5.2489013671875, 5.41015625]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 3.0, 5.0, 5.0, 5.0, 2.0, 7.0, 7.0, 7.0, 9.0, 9.0, 20.0, 15.0, 24.0, 16.0, 33.0, 21.0, 30.0, 50.0, 38.0, 36.0, 48.0, 35.0, 42.0, 47.0, 52.0, 43.0, 39.0, 33.0, 37.0, 33.0, 33.0, 33.0, 29.0, 26.0, 21.0, 18.0, 18.0, 14.0, 12.0, 14.0, 6.0, 8.0, 5.0, 7.0, 5.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-32.375, -31.413330078125, -30.45166015625, -29.489990234375, -28.5283203125, -27.566650390625, -26.60498046875, -25.643310546875, -24.681640625, -23.719970703125, -22.75830078125, -21.796630859375, -20.8349609375, -19.873291015625, -18.91162109375, -17.949951171875, -16.98828125, -16.026611328125, -15.06494140625, -14.103271484375, -13.1416015625, -12.179931640625, -11.21826171875, -10.256591796875, -9.294921875, -8.333251953125, -7.37158203125, -6.409912109375, -5.4482421875, -4.486572265625, -3.52490234375, -2.563232421875, -1.6015625, -0.639892578125, 0.32177734375, 1.283447265625, 2.2451171875, 3.206787109375, 4.16845703125, 5.130126953125, 6.091796875, 7.053466796875, 8.01513671875, 8.976806640625, 9.9384765625, 10.900146484375, 11.86181640625, 12.823486328125, 13.78515625, 14.746826171875, 15.70849609375, 16.670166015625, 17.6318359375, 18.593505859375, 19.55517578125, 20.516845703125, 21.478515625, 22.440185546875, 23.40185546875, 24.363525390625, 25.3251953125, 26.286865234375, 27.24853515625, 28.210205078125, 29.171875]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 7.0, 4.0, 5.0, 6.0, 10.0, 13.0, 23.0, 35.0, 71.0, 81.0, 120.0, 186.0, 262.0, 402.0, 591.0, 1009.0, 1544.0, 2281.0, 3665.0, 5551.0, 8745.0, 13979.0, 22415.0, 35882.0, 57134.0, 92275.0, 141227.0, 187051.0, 167165.0, 114017.0, 72216.0, 44932.0, 27610.0, 17541.0, 10959.0, 6898.0, 4574.0, 2850.0, 1871.0, 1202.0, 733.0, 496.0, 292.0, 229.0, 132.0, 93.0, 59.0, 44.0, 24.0, 24.0, 11.0, 9.0, 6.0, 2.0, 4.0, 0.0, 2.0, 1.0, 2.0], "bins": [-4.5703125, -4.43072509765625, -4.2911376953125, -4.15155029296875, -4.011962890625, -3.87237548828125, -3.7327880859375, -3.59320068359375, -3.45361328125, -3.31402587890625, -3.1744384765625, -3.03485107421875, -2.895263671875, -2.75567626953125, -2.6160888671875, -2.47650146484375, -2.3369140625, -2.19732666015625, -2.0577392578125, -1.91815185546875, -1.778564453125, -1.63897705078125, -1.4993896484375, -1.35980224609375, -1.22021484375, -1.08062744140625, -0.9410400390625, -0.80145263671875, -0.661865234375, -0.52227783203125, -0.3826904296875, -0.24310302734375, -0.103515625, 0.03607177734375, 0.1756591796875, 0.31524658203125, 0.454833984375, 0.59442138671875, 0.7340087890625, 0.87359619140625, 1.01318359375, 1.15277099609375, 1.2923583984375, 1.43194580078125, 1.571533203125, 1.71112060546875, 1.8507080078125, 1.99029541015625, 2.1298828125, 2.26947021484375, 2.4090576171875, 2.54864501953125, 2.688232421875, 2.82781982421875, 2.9674072265625, 3.10699462890625, 3.24658203125, 3.38616943359375, 3.5257568359375, 3.66534423828125, 3.804931640625, 3.94451904296875, 4.0841064453125, 4.22369384765625, 4.36328125]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 8.0, 10.0, 11.0, 19.0, 15.0, 15.0, 24.0, 22.0, 33.0, 35.0, 39.0, 33.0, 48.0, 48.0, 62.0, 51.0, 55.0, 52.0, 57.0, 54.0, 50.0, 29.0, 44.0, 32.0, 30.0, 23.0, 24.0, 15.0, 17.0, 15.0, 11.0, 4.0, 7.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.09375, -20.400146484375, -19.70654296875, -19.012939453125, -18.3193359375, -17.625732421875, -16.93212890625, -16.238525390625, -15.544921875, -14.851318359375, -14.15771484375, -13.464111328125, -12.7705078125, -12.076904296875, -11.38330078125, -10.689697265625, -9.99609375, -9.302490234375, -8.60888671875, -7.915283203125, -7.2216796875, -6.528076171875, -5.83447265625, -5.140869140625, -4.447265625, -3.753662109375, -3.06005859375, -2.366455078125, -1.6728515625, -0.979248046875, -0.28564453125, 0.407958984375, 1.1015625, 1.795166015625, 2.48876953125, 3.182373046875, 3.8759765625, 4.569580078125, 5.26318359375, 5.956787109375, 6.650390625, 7.343994140625, 8.03759765625, 8.731201171875, 9.4248046875, 10.118408203125, 10.81201171875, 11.505615234375, 12.19921875, 12.892822265625, 13.58642578125, 14.280029296875, 14.9736328125, 15.667236328125, 16.36083984375, 17.054443359375, 17.748046875, 18.441650390625, 19.13525390625, 19.828857421875, 20.5224609375, 21.216064453125, 21.90966796875, 22.603271484375, 23.296875]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 1.0, 6.0, 7.0, 6.0, 16.0, 13.0, 20.0, 39.0, 65.0, 86.0, 145.0, 200.0, 349.0, 492.0, 850.0, 1322.0, 2113.0, 3520.0, 6179.0, 10326.0, 17830.0, 31071.0, 57150.0, 106877.0, 202132.0, 263583.0, 156919.0, 82614.0, 45014.0, 24791.0, 14099.0, 8194.0, 4865.0, 2916.0, 1800.0, 1120.0, 675.0, 367.0, 268.0, 190.0, 131.0, 67.0, 47.0, 23.0, 23.0, 14.0, 8.0, 6.0, 5.0, 4.0, 6.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34130859375, -0.32965850830078125, -0.3180084228515625, -0.30635833740234375, -0.294708251953125, -0.28305816650390625, -0.2714080810546875, -0.25975799560546875, -0.24810791015625, -0.23645782470703125, -0.2248077392578125, -0.21315765380859375, -0.201507568359375, -0.18985748291015625, -0.1782073974609375, -0.16655731201171875, -0.1549072265625, -0.14325714111328125, -0.1316070556640625, -0.11995697021484375, -0.108306884765625, -0.09665679931640625, -0.0850067138671875, -0.07335662841796875, -0.06170654296875, -0.05005645751953125, -0.0384063720703125, -0.02675628662109375, -0.015106201171875, -0.00345611572265625, 0.0081939697265625, 0.01984405517578125, 0.031494140625, 0.04314422607421875, 0.0547943115234375, 0.06644439697265625, 0.078094482421875, 0.08974456787109375, 0.1013946533203125, 0.11304473876953125, 0.12469482421875, 0.13634490966796875, 0.1479949951171875, 0.15964508056640625, 0.171295166015625, 0.18294525146484375, 0.1945953369140625, 0.20624542236328125, 0.2178955078125, 0.22954559326171875, 0.2411956787109375, 0.25284576416015625, 0.264495849609375, 0.27614593505859375, 0.2877960205078125, 0.29944610595703125, 0.31109619140625, 0.32274627685546875, 0.3343963623046875, 0.34604644775390625, 0.357696533203125, 0.36934661865234375, 0.3809967041015625, 0.39264678955078125, 0.404296875]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 3.0, 7.0, 7.0, 10.0, 8.0, 14.0, 12.0, 9.0, 10.0, 17.0, 13.0, 28.0, 24.0, 36.0, 38.0, 42.0, 50.0, 34.0, 46.0, 63.0, 32.0, 41.0, 50.0, 41.0, 46.0, 40.0, 34.0, 29.0, 31.0, 30.0, 20.0, 23.0, 19.0, 17.0, 16.0, 11.0, 13.0, 8.0, 6.0, 10.0, 5.0, 5.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.0590763092041016e-05, -3.943499177694321e-05, -3.82792204618454e-05, -3.712344914674759e-05, -3.596767783164978e-05, -3.481190651655197e-05, -3.365613520145416e-05, -3.2500363886356354e-05, -3.1344592571258545e-05, -3.0188821256160736e-05, -2.9033049941062927e-05, -2.787727862596512e-05, -2.672150731086731e-05, -2.55657359957695e-05, -2.4409964680671692e-05, -2.3254193365573883e-05, -2.2098422050476074e-05, -2.0942650735378265e-05, -1.9786879420280457e-05, -1.8631108105182648e-05, -1.747533679008484e-05, -1.631956547498703e-05, -1.5163794159889221e-05, -1.4008022844791412e-05, -1.2852251529693604e-05, -1.1696480214595795e-05, -1.0540708899497986e-05, -9.384937584400177e-06, -8.229166269302368e-06, -7.073394954204559e-06, -5.9176236391067505e-06, -4.761852324008942e-06, -3.606081008911133e-06, -2.450309693813324e-06, -1.2945383787155151e-06, -1.387670636177063e-07, 1.0170042514801025e-06, 2.1727755665779114e-06, 3.3285468816757202e-06, 4.484318196773529e-06, 5.640089511871338e-06, 6.795860826969147e-06, 7.951632142066956e-06, 9.107403457164764e-06, 1.0263174772262573e-05, 1.1418946087360382e-05, 1.2574717402458191e-05, 1.3730488717556e-05, 1.4886260032653809e-05, 1.6042031347751617e-05, 1.7197802662849426e-05, 1.8353573977947235e-05, 1.9509345293045044e-05, 2.0665116608142853e-05, 2.182088792324066e-05, 2.297665923833847e-05, 2.413243055343628e-05, 2.5288201868534088e-05, 2.6443973183631897e-05, 2.7599744498729706e-05, 2.8755515813827515e-05, 2.9911287128925323e-05, 3.106705844402313e-05, 3.222282975912094e-05, 3.337860107421875e-05]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 3.0, 6.0, 5.0, 8.0, 12.0, 26.0, 36.0, 54.0, 92.0, 130.0, 174.0, 312.0, 410.0, 644.0, 857.0, 1342.0, 1904.0, 2843.0, 4070.0, 6543.0, 10339.0, 16497.0, 27233.0, 46343.0, 80076.0, 139595.0, 228690.0, 198168.0, 115711.0, 65926.0, 37752.0, 22678.0, 13977.0, 8892.0, 5626.0, 3846.0, 2431.0, 1640.0, 1193.0, 772.0, 533.0, 375.0, 261.0, 187.0, 130.0, 70.0, 69.0, 26.0, 24.0, 7.0, 13.0, 6.0, 1.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.564453125, -0.546142578125, -0.52783203125, -0.509521484375, -0.4912109375, -0.472900390625, -0.45458984375, -0.436279296875, -0.41796875, -0.399658203125, -0.38134765625, -0.363037109375, -0.3447265625, -0.326416015625, -0.30810546875, -0.289794921875, -0.271484375, -0.253173828125, -0.23486328125, -0.216552734375, -0.1982421875, -0.179931640625, -0.16162109375, -0.143310546875, -0.125, -0.106689453125, -0.08837890625, -0.070068359375, -0.0517578125, -0.033447265625, -0.01513671875, 0.003173828125, 0.021484375, 0.039794921875, 0.05810546875, 0.076416015625, 0.0947265625, 0.113037109375, 0.13134765625, 0.149658203125, 0.16796875, 0.186279296875, 0.20458984375, 0.222900390625, 0.2412109375, 0.259521484375, 0.27783203125, 0.296142578125, 0.314453125, 0.332763671875, 0.35107421875, 0.369384765625, 0.3876953125, 0.406005859375, 0.42431640625, 0.442626953125, 0.4609375, 0.479248046875, 0.49755859375, 0.515869140625, 0.5341796875, 0.552490234375, 0.57080078125, 0.589111328125, 0.607421875]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 5.0, 3.0, 5.0, 6.0, 6.0, 11.0, 12.0, 10.0, 19.0, 17.0, 23.0, 17.0, 23.0, 40.0, 38.0, 32.0, 47.0, 58.0, 63.0, 73.0, 68.0, 52.0, 52.0, 46.0, 46.0, 30.0, 20.0, 29.0, 19.0, 28.0, 14.0, 6.0, 19.0, 11.0, 13.0, 9.0, 8.0, 3.0, 6.0, 5.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1378173828125, -0.1335926055908203, -0.12936782836914062, -0.12514305114746094, -0.12091827392578125, -0.11669349670410156, -0.11246871948242188, -0.10824394226074219, -0.1040191650390625, -0.09979438781738281, -0.09556961059570312, -0.09134483337402344, -0.08712005615234375, -0.08289527893066406, -0.07867050170898438, -0.07444572448730469, -0.070220947265625, -0.06599617004394531, -0.061771392822265625, -0.05754661560058594, -0.05332183837890625, -0.04909706115722656, -0.044872283935546875, -0.04064750671386719, -0.0364227294921875, -0.03219795227050781, -0.027973175048828125, -0.023748397827148438, -0.01952362060546875, -0.015298843383789062, -0.011074066162109375, -0.0068492889404296875, -0.00262451171875, 0.0016002655029296875, 0.005825042724609375, 0.010049819946289062, 0.01427459716796875, 0.018499374389648438, 0.022724151611328125, 0.026948928833007812, 0.0311737060546875, 0.03539848327636719, 0.039623260498046875, 0.04384803771972656, 0.04807281494140625, 0.05229759216308594, 0.056522369384765625, 0.06074714660644531, 0.064971923828125, 0.06919670104980469, 0.07342147827148438, 0.07764625549316406, 0.08187103271484375, 0.08609580993652344, 0.09032058715820312, 0.09454536437988281, 0.0987701416015625, 0.10299491882324219, 0.10721969604492188, 0.11144447326660156, 0.11566925048828125, 0.11989402770996094, 0.12411880493164062, 0.1283435821533203, 0.132568359375]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 2.0, 2.0, 4.0, 5.0, 7.0, 10.0, 14.0, 22.0, 15.0, 32.0, 25.0, 28.0, 37.0, 39.0, 50.0, 47.0, 61.0, 53.0, 46.0, 56.0, 64.0, 46.0, 48.0, 39.0, 41.0, 37.0, 30.0, 19.0, 19.0, 17.0, 11.0, 11.0, 14.0, 12.0, 9.0, 9.0, 5.0, 4.0, 3.0, 1.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-35.997074127197266, -34.83775329589844, -33.678436279296875, -32.51911544799805, -31.35979652404785, -30.200477600097656, -29.041156768798828, -27.881837844848633, -26.722518920898438, -25.563199996948242, -24.403881072998047, -23.24456024169922, -22.085241317749023, -20.925922393798828, -19.7666015625, -18.607282638549805, -17.44796371459961, -16.288644790649414, -15.129324913024902, -13.97000503540039, -12.810686111450195, -11.6513671875, -10.492047309875488, -9.332727432250977, -8.173408508300781, -7.014089107513428, -5.854769706726074, -4.695450305938721, -3.536130905151367, -2.3768115043640137, -1.2174921035766602, -0.05817222595214844, 1.1011466979980469, 2.2604660987854004, 3.419785499572754, 4.579104900360107, 5.738424301147461, 6.8977437019348145, 8.057063102722168, 9.21638298034668, 10.375701904296875, 11.53502082824707, 12.694340705871582, 13.853660583496094, 15.012979507446289, 16.172298431396484, 17.331619262695312, 18.490938186645508, 19.650257110595703, 20.8095760345459, 21.968894958496094, 23.128215789794922, 24.287534713745117, 25.446853637695312, 26.60617446899414, 27.765493392944336, 28.92481231689453, 30.084131240844727, 31.243450164794922, 32.40277099609375, 33.56208801269531, 34.72140884399414, 35.88072967529297, 37.04004669189453, 38.19936752319336]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 5.0, 10.0, 5.0, 9.0, 7.0, 3.0, 16.0, 7.0, 9.0, 19.0, 24.0, 20.0, 17.0, 26.0, 26.0, 35.0, 39.0, 36.0, 20.0, 46.0, 36.0, 35.0, 32.0, 39.0, 49.0, 51.0, 33.0, 48.0, 27.0, 32.0, 31.0, 28.0, 26.0, 21.0, 20.0, 19.0, 14.0, 13.0, 18.0, 10.0, 8.0, 5.0, 7.0, 7.0, 4.0, 3.0, 4.0, 2.0, 4.0, 2.0, 1.0], "bins": [-30.045015335083008, -29.20672607421875, -28.36843490600586, -27.5301456451416, -26.691856384277344, -25.853567123413086, -25.015277862548828, -24.176986694335938, -23.33869743347168, -22.500408172607422, -21.66211700439453, -20.823827743530273, -19.985538482666016, -19.147249221801758, -18.3089599609375, -17.47066879272461, -16.63237953186035, -15.794090270996094, -14.95580005645752, -14.117509841918945, -13.279220581054688, -12.44093132019043, -11.602641105651855, -10.764350891113281, -9.926061630249023, -9.087772369384766, -8.249482154846191, -7.411192417144775, -6.572902679443359, -5.734612941741943, -4.896323204040527, -4.058033466339111, -3.2197418212890625, -2.3814520835876465, -1.5431623458862305, -0.7048726081848145, 0.13341712951660156, 0.9717068672180176, 1.8099966049194336, 2.6482863426208496, 3.4865760803222656, 4.324865818023682, 5.163155555725098, 6.001445293426514, 6.83973503112793, 7.678024768829346, 8.516314506530762, 9.354604721069336, 10.192893981933594, 11.031183242797852, 11.869473457336426, 12.707763671875, 13.546052932739258, 14.384342193603516, 15.22263240814209, 16.060922622680664, 16.899211883544922, 17.73750114440918, 18.575790405273438, 19.414081573486328, 20.252370834350586, 21.090660095214844, 21.928951263427734, 22.767240524291992, 23.60552978515625]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 2.0, 9.0, 16.0, 15.0, 20.0, 26.0, 50.0, 67.0, 77.0, 138.0, 197.0, 285.0, 406.0, 582.0, 790.0, 1238.0, 1886.0, 2963.0, 4703.0, 7722.0, 13153.0, 23758.0, 44946.0, 88708.0, 166823.0, 237378.0, 203263.0, 116872.0, 59407.0, 30669.0, 16686.0, 9587.0, 5628.0, 3591.0, 2274.0, 1503.0, 1002.0, 658.0, 462.0, 325.0, 214.0, 152.0, 94.0, 65.0, 36.0, 33.0, 25.0, 23.0, 13.0, 8.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-36.1875, -35.0810546875, -33.974609375, -32.8681640625, -31.76171875, -30.6552734375, -29.548828125, -28.4423828125, -27.3359375, -26.2294921875, -25.123046875, -24.0166015625, -22.91015625, -21.8037109375, -20.697265625, -19.5908203125, -18.484375, -17.3779296875, -16.271484375, -15.1650390625, -14.05859375, -12.9521484375, -11.845703125, -10.7392578125, -9.6328125, -8.5263671875, -7.419921875, -6.3134765625, -5.20703125, -4.1005859375, -2.994140625, -1.8876953125, -0.78125, 0.3251953125, 1.431640625, 2.5380859375, 3.64453125, 4.7509765625, 5.857421875, 6.9638671875, 8.0703125, 9.1767578125, 10.283203125, 11.3896484375, 12.49609375, 13.6025390625, 14.708984375, 15.8154296875, 16.921875, 18.0283203125, 19.134765625, 20.2412109375, 21.34765625, 22.4541015625, 23.560546875, 24.6669921875, 25.7734375, 26.8798828125, 27.986328125, 29.0927734375, 30.19921875, 31.3056640625, 32.412109375, 33.5185546875, 34.625]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 6.0, 4.0, 6.0, 3.0, 0.0, 4.0, 3.0, 9.0, 16.0, 14.0, 22.0, 13.0, 21.0, 21.0, 24.0, 22.0, 30.0, 38.0, 40.0, 44.0, 35.0, 39.0, 45.0, 54.0, 49.0, 51.0, 32.0, 46.0, 43.0, 46.0, 33.0, 27.0, 29.0, 19.0, 28.0, 21.0, 14.0, 9.0, 10.0, 10.0, 4.0, 7.0, 4.0, 9.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-32.9375, -31.923828125, -30.91015625, -29.896484375, -28.8828125, -27.869140625, -26.85546875, -25.841796875, -24.828125, -23.814453125, -22.80078125, -21.787109375, -20.7734375, -19.759765625, -18.74609375, -17.732421875, -16.71875, -15.705078125, -14.69140625, -13.677734375, -12.6640625, -11.650390625, -10.63671875, -9.623046875, -8.609375, -7.595703125, -6.58203125, -5.568359375, -4.5546875, -3.541015625, -2.52734375, -1.513671875, -0.5, 0.513671875, 1.52734375, 2.541015625, 3.5546875, 4.568359375, 5.58203125, 6.595703125, 7.609375, 8.623046875, 9.63671875, 10.650390625, 11.6640625, 12.677734375, 13.69140625, 14.705078125, 15.71875, 16.732421875, 17.74609375, 18.759765625, 19.7734375, 20.787109375, 21.80078125, 22.814453125, 23.828125, 24.841796875, 25.85546875, 26.869140625, 27.8828125, 28.896484375, 29.91015625, 30.923828125, 31.9375]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 7.0, 9.0, 16.0, 13.0, 19.0, 28.0, 43.0, 94.0, 138.0, 192.0, 295.0, 516.0, 863.0, 1392.0, 2273.0, 4141.0, 7121.0, 12957.0, 25010.0, 50962.0, 114808.0, 250227.0, 292769.0, 151741.0, 65732.0, 30876.0, 15984.0, 8505.0, 4817.0, 2715.0, 1690.0, 947.0, 586.0, 392.0, 219.0, 164.0, 101.0, 71.0, 51.0, 18.0, 14.0, 11.0, 9.0, 7.0, 5.0, 5.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.0, -54.2587890625, -52.517578125, -50.7763671875, -49.03515625, -47.2939453125, -45.552734375, -43.8115234375, -42.0703125, -40.3291015625, -38.587890625, -36.8466796875, -35.10546875, -33.3642578125, -31.623046875, -29.8818359375, -28.140625, -26.3994140625, -24.658203125, -22.9169921875, -21.17578125, -19.4345703125, -17.693359375, -15.9521484375, -14.2109375, -12.4697265625, -10.728515625, -8.9873046875, -7.24609375, -5.5048828125, -3.763671875, -2.0224609375, -0.28125, 1.4599609375, 3.201171875, 4.9423828125, 6.68359375, 8.4248046875, 10.166015625, 11.9072265625, 13.6484375, 15.3896484375, 17.130859375, 18.8720703125, 20.61328125, 22.3544921875, 24.095703125, 25.8369140625, 27.578125, 29.3193359375, 31.060546875, 32.8017578125, 34.54296875, 36.2841796875, 38.025390625, 39.7666015625, 41.5078125, 43.2490234375, 44.990234375, 46.7314453125, 48.47265625, 50.2138671875, 51.955078125, 53.6962890625, 55.4375]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 8.0, 7.0, 13.0, 15.0, 12.0, 16.0, 24.0, 42.0, 26.0, 30.0, 50.0, 36.0, 56.0, 54.0, 38.0, 64.0, 81.0, 69.0, 56.0, 42.0, 39.0, 42.0, 34.0, 34.0, 22.0, 23.0, 14.0, 11.0, 13.0, 10.0, 5.0, 9.0, 4.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.546875, -23.755126953125, -22.96337890625, -22.171630859375, -21.3798828125, -20.588134765625, -19.79638671875, -19.004638671875, -18.212890625, -17.421142578125, -16.62939453125, -15.837646484375, -15.0458984375, -14.254150390625, -13.46240234375, -12.670654296875, -11.87890625, -11.087158203125, -10.29541015625, -9.503662109375, -8.7119140625, -7.920166015625, -7.12841796875, -6.336669921875, -5.544921875, -4.753173828125, -3.96142578125, -3.169677734375, -2.3779296875, -1.586181640625, -0.79443359375, -0.002685546875, 0.7890625, 1.580810546875, 2.37255859375, 3.164306640625, 3.9560546875, 4.747802734375, 5.53955078125, 6.331298828125, 7.123046875, 7.914794921875, 8.70654296875, 9.498291015625, 10.2900390625, 11.081787109375, 11.87353515625, 12.665283203125, 13.45703125, 14.248779296875, 15.04052734375, 15.832275390625, 16.6240234375, 17.415771484375, 18.20751953125, 18.999267578125, 19.791015625, 20.582763671875, 21.37451171875, 22.166259765625, 22.9580078125, 23.749755859375, 24.54150390625, 25.333251953125, 26.125]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 3.0, 1.0, 3.0, 4.0, 10.0, 13.0, 11.0, 22.0, 40.0, 64.0, 99.0, 169.0, 271.0, 453.0, 907.0, 1686.0, 3300.0, 6274.0, 12896.0, 25395.0, 48894.0, 87708.0, 136504.0, 176763.0, 181813.0, 148598.0, 98744.0, 56847.0, 29999.0, 15152.0, 7581.0, 3737.0, 1997.0, 1132.0, 613.0, 331.0, 193.0, 129.0, 66.0, 42.0, 27.0, 25.0, 16.0, 11.0, 5.0, 6.0, 4.0, 3.0, 1.0, 4.0, 0.0, 3.0, 1.0], "bins": [-9.2265625, -8.9638671875, -8.701171875, -8.4384765625, -8.17578125, -7.9130859375, -7.650390625, -7.3876953125, -7.125, -6.8623046875, -6.599609375, -6.3369140625, -6.07421875, -5.8115234375, -5.548828125, -5.2861328125, -5.0234375, -4.7607421875, -4.498046875, -4.2353515625, -3.97265625, -3.7099609375, -3.447265625, -3.1845703125, -2.921875, -2.6591796875, -2.396484375, -2.1337890625, -1.87109375, -1.6083984375, -1.345703125, -1.0830078125, -0.8203125, -0.5576171875, -0.294921875, -0.0322265625, 0.23046875, 0.4931640625, 0.755859375, 1.0185546875, 1.28125, 1.5439453125, 1.806640625, 2.0693359375, 2.33203125, 2.5947265625, 2.857421875, 3.1201171875, 3.3828125, 3.6455078125, 3.908203125, 4.1708984375, 4.43359375, 4.6962890625, 4.958984375, 5.2216796875, 5.484375, 5.7470703125, 6.009765625, 6.2724609375, 6.53515625, 6.7978515625, 7.060546875, 7.3232421875, 7.5859375]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 4.0, 10.0, 2.0, 7.0, 7.0, 10.0, 12.0, 12.0, 18.0, 13.0, 18.0, 21.0, 19.0, 22.0, 37.0, 35.0, 45.0, 44.0, 50.0, 40.0, 50.0, 49.0, 48.0, 47.0, 35.0, 52.0, 44.0, 29.0, 36.0, 33.0, 27.0, 24.0, 20.0, 14.0, 11.0, 19.0, 9.0, 8.0, 2.0, 7.0, 3.0, 3.0, 3.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.000766754150390625, -0.0007449090480804443, -0.0007230639457702637, -0.000701218843460083, -0.0006793737411499023, -0.0006575286388397217, -0.000635683536529541, -0.0006138384342193604, -0.0005919933319091797, -0.000570148229598999, -0.0005483031272888184, -0.0005264580249786377, -0.000504612922668457, -0.00048276782035827637, -0.0004609227180480957, -0.00043907761573791504, -0.0004172325134277344, -0.0003953874111175537, -0.00037354230880737305, -0.0003516972064971924, -0.0003298521041870117, -0.00030800700187683105, -0.0002861618995666504, -0.0002643167972564697, -0.00024247169494628906, -0.0002206265926361084, -0.00019878149032592773, -0.00017693638801574707, -0.0001550912857055664, -0.00013324618339538574, -0.00011140108108520508, -8.955597877502441e-05, -6.771087646484375e-05, -4.5865774154663086e-05, -2.4020671844482422e-05, -2.175569534301758e-06, 1.9669532775878906e-05, 4.151463508605957e-05, 6.335973739624023e-05, 8.52048397064209e-05, 0.00010704994201660156, 0.00012889504432678223, 0.0001507401466369629, 0.00017258524894714355, 0.00019443035125732422, 0.00021627545356750488, 0.00023812055587768555, 0.0002599656581878662, 0.0002818107604980469, 0.00030365586280822754, 0.0003255009651184082, 0.00034734606742858887, 0.00036919116973876953, 0.0003910362720489502, 0.00041288137435913086, 0.0004347264766693115, 0.0004565715789794922, 0.00047841668128967285, 0.0005002617835998535, 0.0005221068859100342, 0.0005439519882202148, 0.0005657970905303955, 0.0005876421928405762, 0.0006094872951507568, 0.0006313323974609375]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 4.0, 5.0, 2.0, 4.0, 9.0, 11.0, 15.0, 24.0, 33.0, 54.0, 83.0, 115.0, 184.0, 315.0, 509.0, 897.0, 1733.0, 3151.0, 6099.0, 12100.0, 23310.0, 45394.0, 80678.0, 128073.0, 168229.0, 179941.0, 154281.0, 107595.0, 64274.0, 34657.0, 17658.0, 8938.0, 4537.0, 2383.0, 1360.0, 759.0, 434.0, 255.0, 163.0, 96.0, 51.0, 48.0, 22.0, 19.0, 11.0, 15.0, 10.0, 8.0, 6.0, 2.0, 4.0, 0.0, 1.0, 2.0, 2.0], "bins": [-8.890625, -8.63134765625, -8.3720703125, -8.11279296875, -7.853515625, -7.59423828125, -7.3349609375, -7.07568359375, -6.81640625, -6.55712890625, -6.2978515625, -6.03857421875, -5.779296875, -5.52001953125, -5.2607421875, -5.00146484375, -4.7421875, -4.48291015625, -4.2236328125, -3.96435546875, -3.705078125, -3.44580078125, -3.1865234375, -2.92724609375, -2.66796875, -2.40869140625, -2.1494140625, -1.89013671875, -1.630859375, -1.37158203125, -1.1123046875, -0.85302734375, -0.59375, -0.33447265625, -0.0751953125, 0.18408203125, 0.443359375, 0.70263671875, 0.9619140625, 1.22119140625, 1.48046875, 1.73974609375, 1.9990234375, 2.25830078125, 2.517578125, 2.77685546875, 3.0361328125, 3.29541015625, 3.5546875, 3.81396484375, 4.0732421875, 4.33251953125, 4.591796875, 4.85107421875, 5.1103515625, 5.36962890625, 5.62890625, 5.88818359375, 6.1474609375, 6.40673828125, 6.666015625, 6.92529296875, 7.1845703125, 7.44384765625, 7.703125]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 9.0, 7.0, 8.0, 14.0, 14.0, 22.0, 21.0, 36.0, 38.0, 39.0, 47.0, 50.0, 47.0, 51.0, 65.0, 48.0, 58.0, 45.0, 58.0, 61.0, 36.0, 41.0, 30.0, 33.0, 25.0, 27.0, 16.0, 14.0, 13.0, 9.0, 9.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.61328125, -2.535858154296875, -2.45843505859375, -2.381011962890625, -2.3035888671875, -2.226165771484375, -2.14874267578125, -2.071319580078125, -1.993896484375, -1.916473388671875, -1.83905029296875, -1.761627197265625, -1.6842041015625, -1.606781005859375, -1.52935791015625, -1.451934814453125, -1.37451171875, -1.297088623046875, -1.21966552734375, -1.142242431640625, -1.0648193359375, -0.987396240234375, -0.90997314453125, -0.832550048828125, -0.755126953125, -0.677703857421875, -0.60028076171875, -0.522857666015625, -0.4454345703125, -0.368011474609375, -0.29058837890625, -0.213165283203125, -0.1357421875, -0.058319091796875, 0.01910400390625, 0.096527099609375, 0.1739501953125, 0.251373291015625, 0.32879638671875, 0.406219482421875, 0.483642578125, 0.561065673828125, 0.63848876953125, 0.715911865234375, 0.7933349609375, 0.870758056640625, 0.94818115234375, 1.025604248046875, 1.10302734375, 1.180450439453125, 1.25787353515625, 1.335296630859375, 1.4127197265625, 1.490142822265625, 1.56756591796875, 1.644989013671875, 1.722412109375, 1.799835205078125, 1.87725830078125, 1.954681396484375, 2.0321044921875, 2.109527587890625, 2.18695068359375, 2.264373779296875, 2.341796875]}, "gradients/decoder.bert.embeddings.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 8.0, 5.0, 6.0, 2.0, 3.0, 12.0, 14.0, 11.0, 16.0, 23.0, 32.0, 32.0, 42.0, 39.0, 40.0, 42.0, 48.0, 57.0, 57.0, 56.0, 51.0, 56.0, 49.0, 40.0, 44.0, 28.0, 35.0, 30.0, 15.0, 18.0, 17.0, 16.0, 14.0, 9.0, 9.0, 4.0, 4.0, 6.0, 4.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.399864196777344, -37.13087463378906, -35.861881256103516, -34.592891693115234, -33.32389831542969, -32.054908752441406, -30.785917282104492, -29.516925811767578, -28.247934341430664, -26.97894287109375, -25.709951400756836, -24.440959930419922, -23.17197036743164, -21.902976989746094, -20.633987426757812, -19.3649959564209, -18.096004486083984, -16.82701301574707, -15.558021545410156, -14.289031028747559, -13.020039558410645, -11.75104808807373, -10.482057571411133, -9.213066101074219, -7.944074630737305, -6.675083160400391, -5.406092166900635, -4.137101173400879, -2.868109703063965, -1.5991182327270508, -0.3301272392272949, 0.9388637542724609, 2.2078590393066406, 3.4768502712249756, 4.7458415031433105, 6.014832496643066, 7.2838239669799805, 8.552815437316895, 9.821805953979492, 11.090797424316406, 12.35978889465332, 13.628780364990234, 14.897771835327148, 16.166763305664062, 17.435752868652344, 18.70474624633789, 19.973735809326172, 21.242727279663086, 22.51171875, 23.780710220336914, 25.049701690673828, 26.318693161010742, 27.587684631347656, 28.856674194335938, 30.12566566467285, 31.394657135009766, 32.66365051269531, 33.932640075683594, 35.20163345336914, 36.47062301635742, 37.73961639404297, 39.00860595703125, 40.2775993347168, 41.54658889770508, 42.81557846069336]}, "gradients/decoder.bert.embeddings.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 5.0, 5.0, 4.0, 4.0, 12.0, 9.0, 9.0, 14.0, 19.0, 23.0, 18.0, 30.0, 38.0, 34.0, 38.0, 49.0, 43.0, 48.0, 43.0, 30.0, 36.0, 54.0, 37.0, 53.0, 50.0, 38.0, 43.0, 30.0, 38.0, 23.0, 24.0, 21.0, 10.0, 17.0, 14.0, 9.0, 4.0, 5.0, 5.0, 6.0, 3.0, 6.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.117008209228516, -41.859920501708984, -40.60282897949219, -39.345741271972656, -38.08864974975586, -36.83156204223633, -35.57447052001953, -34.3173828125, -33.06029510498047, -31.803205490112305, -30.54611587524414, -29.28902816772461, -28.031938552856445, -26.77484893798828, -25.517759323120117, -24.260669708251953, -23.00358009338379, -21.746490478515625, -20.48940086364746, -19.232311248779297, -17.975223541259766, -16.7181339263916, -15.461044311523438, -14.20395565032959, -12.946866035461426, -11.689776420593262, -10.432687759399414, -9.17559814453125, -7.918509006500244, -6.661419868469238, -5.404330253601074, -4.147241592407227, -2.8901519775390625, -1.633062720298767, -0.3759734630584717, 0.8811159133911133, 2.138205051422119, 3.395294189453125, 4.652383804321289, 5.909472465515137, 7.166562080383301, 8.423651695251465, 9.680740356445312, 10.937829971313477, 12.19491958618164, 13.452008247375488, 14.709097862243652, 15.9661865234375, 17.223276138305664, 18.480365753173828, 19.737455368041992, 20.994544982910156, 22.251632690429688, 23.50872230529785, 24.765811920166016, 26.022899627685547, 27.279991149902344, 28.537080764770508, 29.794170379638672, 31.051258087158203, 32.308349609375, 33.56543731689453, 34.82252502441406, 36.07961654663086, 37.33670425415039]}, "gradients/decoder.bert.embeddings.position_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 5.0, 4.0, 11.0, 9.0, 19.0, 18.0, 41.0, 55.0, 66.0, 97.0, 148.0, 208.0, 291.0, 400.0, 601.0, 843.0, 1149.0, 1632.0, 2258.0, 3622.0, 5264.0, 7638.0, 479895.0, 6404.0, 4259.0, 2785.0, 1989.0, 1332.0, 928.0, 627.0, 474.0, 345.0, 250.0, 182.0, 104.0, 118.0, 50.0, 58.0, 28.0, 21.0, 16.0, 9.0, 9.0, 1.0, 7.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-374.9385986328125, -363.30535888671875, -351.6721496582031, -340.0389099121094, -328.4056701660156, -316.7724609375, -305.13922119140625, -293.5059814453125, -281.8727722167969, -270.2395324707031, -258.6063232421875, -246.97308349609375, -235.33985900878906, -223.70663452148438, -212.07339477539062, -200.44017028808594, -188.8069305419922, -177.1737060546875, -165.54046630859375, -153.90724182128906, -142.27401733398438, -130.64077758789062, -119.00755310058594, -107.37432861328125, -95.74109649658203, -84.10786437988281, -72.47463989257812, -60.841407775878906, -49.20817947387695, -37.574951171875, -25.94171905517578, -14.308494567871094, -2.675262451171875, 8.957966804504395, 20.591196060180664, 32.22442626953125, 43.8576545715332, 55.490882873535156, 67.12411499023438, 78.75733947753906, 90.39057159423828, 102.0238037109375, 113.65702819824219, 125.2902603149414, 136.92349243164062, 148.5567169189453, 160.18994140625, 171.82318115234375, 183.45640563964844, 195.08963012695312, 206.72286987304688, 218.35609436035156, 229.98931884765625, 241.62255859375, 253.2557830810547, 264.8890075683594, 276.5222473144531, 288.1554870605469, 299.7886962890625, 311.42193603515625, 323.05517578125, 334.6883850097656, 346.3216247558594, 357.954833984375, 369.58807373046875]}, "gradients/decoder.bert.embeddings.token_type_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 6.0, 4.0, 4.0, 2.0, 9.0, 9.0, 11.0, 8.0, 13.0, 20.0, 22.0, 18.0, 25.0, 41.0, 38.0, 37.0, 44.0, 47.0, 50.0, 37.0, 34.0, 1060.0, 51.0, 41.0, 51.0, 41.0, 42.0, 48.0, 28.0, 36.0, 26.0, 26.0, 20.0, 9.0, 18.0, 14.0, 10.0, 4.0, 4.0, 6.0, 5.0, 3.0, 7.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1279.6907958984375, -1242.409423828125, -1205.128173828125, -1167.8468017578125, -1130.5654296875, -1093.2841796875, -1056.0028076171875, -1018.721435546875, -981.4401245117188, -944.1588134765625, -906.87744140625, -869.5961303710938, -832.3148193359375, -795.033447265625, -757.7521362304688, -720.4708251953125, -683.189453125, -645.9081420898438, -608.6267700195312, -571.345458984375, -534.0640869140625, -496.78277587890625, -459.50146484375, -422.2201232910156, -384.93878173828125, -347.6574401855469, -310.3760986328125, -273.09478759765625, -235.81344604492188, -198.5321044921875, -161.2507781982422, -123.96945190429688, -86.688232421875, -49.406898498535156, -12.125564575195312, 25.15576934814453, 62.437103271484375, 99.71844482421875, 136.99977111816406, 174.28109741210938, 211.56243896484375, 248.84378051757812, 286.1251220703125, 323.40643310546875, 360.6877746582031, 397.9691162109375, 435.25042724609375, 472.5317687988281, 509.8131103515625, 547.0944213867188, 584.3757934570312, 621.6571044921875, 658.9384765625, 696.2197875976562, 733.5010986328125, 770.782470703125, 808.0637817382812, 845.3450927734375, 882.62646484375, 919.9077758789062, 957.1890869140625, 994.470458984375, 1031.7518310546875, 1069.0330810546875, 1106.314453125]}, "gradients/decoder.bert.embeddings.word_embeddings.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 12.0, 8.0, 22.0, 16.0, 27.0, 33.0, 50.0, 64.0, 98.0, 134.0, 286.0, 452.0, 546.0, 708.0, 956.0, 1523.0, 2658.0, 4016.0, 6614.0, 9754.0, 13867.0, 17633.0, 50705.0, 31009094.0, 67287.0, 38846.0, 14000.0, 6658.0, 3469.0, 1789.0, 1065.0, 720.0, 442.0, 277.0, 151.0, 117.0, 77.0, 72.0, 53.0, 42.0, 38.0, 22.0, 15.0, 13.0, 14.0, 13.0, 11.0, 14.0, 6.0, 7.0, 7.0, 1.0, 4.0, 6.0, 2.0, 0.0, 3.0], "bins": [-635.6773681640625, -614.7839965820312, -593.8905639648438, -572.9971923828125, -552.103759765625, -531.2103881835938, -510.3169860839844, -489.423583984375, -468.53021240234375, -447.6368103027344, -426.743408203125, -405.85003662109375, -384.9566345214844, -364.063232421875, -343.1698303222656, -322.27642822265625, -301.3830261230469, -280.4896240234375, -259.5962219238281, -238.7028350830078, -217.8094482421875, -196.91604614257812, -176.02264404296875, -155.12925720214844, -134.23585510253906, -113.34246063232422, -92.44906616210938, -71.5556640625, -50.662269592285156, -29.768875122070312, -8.875473022460938, 12.017913818359375, 32.91131591796875, 53.804710388183594, 74.69810485839844, 95.59150695800781, 116.48490142822266, 137.3782958984375, 158.27169799804688, 179.1650848388672, 200.05848693847656, 220.95188903808594, 241.84527587890625, 262.7386779785156, 283.632080078125, 304.52545166015625, 325.41888427734375, 346.312255859375, 367.2056579589844, 388.09906005859375, 408.9924621582031, 429.8858642578125, 450.77923583984375, 471.6726379394531, 492.5660400390625, 513.4594116210938, 534.3528442382812, 555.2462158203125, 576.1396484375, 597.0330200195312, 617.9264526367188, 638.81982421875, 659.7132568359375, 680.6066284179688, 701.5]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [3.0, 1.0, 9.0, 21.0, 23.0, 20.0, 43.0, 56.0, 70.0, 86.0, 124.0, 159.0, 266.0, 366.0, 553.0, 756.0, 1131.0, 1610.0, 2370.0, 3364.0, 5063.0, 7716.0, 11757.0, 18457.0, 28929.0, 46384.0, 74308.0, 119885.0, 200504.0, 351133.0, 800417.0, 2963419.0, 787650.0, 345894.0, 198745.0, 119010.0, 73174.0, 45433.0, 28771.0, 18328.0, 11935.0, 7802.0, 4930.0, 3338.0, 2302.0, 1555.0, 1081.0, 750.0, 490.0, 396.0, 251.0, 198.0, 109.0, 82.0, 70.0, 38.0, 35.0, 28.0, 22.0, 16.0, 11.0, 6.0, 1.0, 2.0], "bins": [-4.2734375, -4.13775634765625, -4.0020751953125, -3.86639404296875, -3.730712890625, -3.59503173828125, -3.4593505859375, -3.32366943359375, -3.18798828125, -3.05230712890625, -2.9166259765625, -2.78094482421875, -2.645263671875, -2.50958251953125, -2.3739013671875, -2.23822021484375, -2.1025390625, -1.96685791015625, -1.8311767578125, -1.69549560546875, -1.559814453125, -1.42413330078125, -1.2884521484375, -1.15277099609375, -1.01708984375, -0.88140869140625, -0.7457275390625, -0.61004638671875, -0.474365234375, -0.33868408203125, -0.2030029296875, -0.06732177734375, 0.068359375, 0.20404052734375, 0.3397216796875, 0.47540283203125, 0.611083984375, 0.74676513671875, 0.8824462890625, 1.01812744140625, 1.15380859375, 1.28948974609375, 1.4251708984375, 1.56085205078125, 1.696533203125, 1.83221435546875, 1.9678955078125, 2.10357666015625, 2.2392578125, 2.37493896484375, 2.5106201171875, 2.64630126953125, 2.781982421875, 2.91766357421875, 3.0533447265625, 3.18902587890625, 3.32470703125, 3.46038818359375, 3.5960693359375, 3.73175048828125, 3.867431640625, 4.00311279296875, 4.1387939453125, 4.27447509765625, 4.41015625]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 3.0, 4.0, 6.0, 7.0, 6.0, 17.0, 19.0, 8.0, 19.0, 20.0, 20.0, 28.0, 25.0, 26.0, 36.0, 33.0, 43.0, 42.0, 45.0, 142.0, 570.0, 339.0, 125.0, 67.0, 53.0, 48.0, 32.0, 21.0, 29.0, 33.0, 24.0, 27.0, 23.0, 21.0, 11.0, 8.0, 11.0, 9.0, 5.0, 5.0, 6.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-17.53125, -17.0091552734375, -16.487060546875, -15.9649658203125, -15.44287109375, -14.9207763671875, -14.398681640625, -13.8765869140625, -13.3544921875, -12.8323974609375, -12.310302734375, -11.7882080078125, -11.26611328125, -10.7440185546875, -10.221923828125, -9.6998291015625, -9.177734375, -8.6556396484375, -8.133544921875, -7.6114501953125, -7.08935546875, -6.5672607421875, -6.045166015625, -5.5230712890625, -5.0009765625, -4.4788818359375, -3.956787109375, -3.4346923828125, -2.91259765625, -2.3905029296875, -1.868408203125, -1.3463134765625, -0.82421875, -0.3021240234375, 0.219970703125, 0.7420654296875, 1.26416015625, 1.7862548828125, 2.308349609375, 2.8304443359375, 3.3525390625, 3.8746337890625, 4.396728515625, 4.9188232421875, 5.44091796875, 5.9630126953125, 6.485107421875, 7.0072021484375, 7.529296875, 8.0513916015625, 8.573486328125, 9.0955810546875, 9.61767578125, 10.1397705078125, 10.661865234375, 11.1839599609375, 11.7060546875, 12.2281494140625, 12.750244140625, 13.2723388671875, 13.79443359375, 14.3165283203125, 14.838623046875, 15.3607177734375, 15.8828125]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 8.0, 9.0, 7.0, 20.0, 18.0, 24.0, 38.0, 63.0, 83.0, 124.0, 168.0, 279.0, 436.0, 651.0, 953.0, 1565.0, 2386.0, 3847.0, 6255.0, 10574.0, 18021.0, 32536.0, 62148.0, 126534.0, 296389.0, 972086.0, 3858355.0, 508447.0, 195515.0, 89218.0, 45844.0, 24660.0, 13712.0, 7937.0, 4697.0, 2887.0, 1731.0, 1164.0, 761.0, 438.0, 274.0, 213.0, 112.0, 77.0, 49.0, 36.0, 31.0, 20.0, 20.0, 6.0, 4.0, 5.0, 7.0, 4.0], "bins": [-9.5, -9.238037109375, -8.97607421875, -8.714111328125, -8.4521484375, -8.190185546875, -7.92822265625, -7.666259765625, -7.404296875, -7.142333984375, -6.88037109375, -6.618408203125, -6.3564453125, -6.094482421875, -5.83251953125, -5.570556640625, -5.30859375, -5.046630859375, -4.78466796875, -4.522705078125, -4.2607421875, -3.998779296875, -3.73681640625, -3.474853515625, -3.212890625, -2.950927734375, -2.68896484375, -2.427001953125, -2.1650390625, -1.903076171875, -1.64111328125, -1.379150390625, -1.1171875, -0.855224609375, -0.59326171875, -0.331298828125, -0.0693359375, 0.192626953125, 0.45458984375, 0.716552734375, 0.978515625, 1.240478515625, 1.50244140625, 1.764404296875, 2.0263671875, 2.288330078125, 2.55029296875, 2.812255859375, 3.07421875, 3.336181640625, 3.59814453125, 3.860107421875, 4.1220703125, 4.384033203125, 4.64599609375, 4.907958984375, 5.169921875, 5.431884765625, 5.69384765625, 5.955810546875, 6.2177734375, 6.479736328125, 6.74169921875, 7.003662109375, 7.265625]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 1.0, 2.0, 8.0, 7.0, 7.0, 11.0, 11.0, 11.0, 16.0, 12.0, 22.0, 15.0, 21.0, 23.0, 29.0, 17.0, 34.0, 32.0, 33.0, 36.0, 40.0, 41.0, 47.0, 221.0, 624.0, 212.0, 113.0, 46.0, 56.0, 28.0, 31.0, 29.0, 27.0, 24.0, 17.0, 21.0, 14.0, 18.0, 13.0, 10.0, 9.0, 8.0, 6.0, 5.0, 5.0, 7.0, 8.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.8515625, -14.4046630859375, -13.957763671875, -13.5108642578125, -13.06396484375, -12.6170654296875, -12.170166015625, -11.7232666015625, -11.2763671875, -10.8294677734375, -10.382568359375, -9.9356689453125, -9.48876953125, -9.0418701171875, -8.594970703125, -8.1480712890625, -7.701171875, -7.2542724609375, -6.807373046875, -6.3604736328125, -5.91357421875, -5.4666748046875, -5.019775390625, -4.5728759765625, -4.1259765625, -3.6790771484375, -3.232177734375, -2.7852783203125, -2.33837890625, -1.8914794921875, -1.444580078125, -0.9976806640625, -0.55078125, -0.1038818359375, 0.343017578125, 0.7899169921875, 1.23681640625, 1.6837158203125, 2.130615234375, 2.5775146484375, 3.0244140625, 3.4713134765625, 3.918212890625, 4.3651123046875, 4.81201171875, 5.2589111328125, 5.705810546875, 6.1527099609375, 6.599609375, 7.0465087890625, 7.493408203125, 7.9403076171875, 8.38720703125, 8.8341064453125, 9.281005859375, 9.7279052734375, 10.1748046875, 10.6217041015625, 11.068603515625, 11.5155029296875, 11.96240234375, 12.4093017578125, 12.856201171875, 13.3031005859375, 13.75]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 3.0, 11.0, 1.0, 0.0, 4.0, 4.0, 5.0, 5.0, 3.0, 11.0, 20.0, 30.0, 34.0, 29.0, 34.0, 57.0, 74.0, 102.0, 121.0, 249.0, 353.0, 474.0, 824.0, 1159.0, 2100.0, 3823.0, 7936.0, 22185.0, 100499.0, 6008200.0, 103362.0, 22248.0, 8070.0, 3747.0, 2081.0, 1209.0, 667.0, 507.0, 311.0, 222.0, 228.0, 113.0, 61.0, 70.0, 37.0, 58.0, 25.0, 27.0, 12.0, 10.0, 10.0, 4.0, 1.0, 3.0, 4.0, 6.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0], "bins": [-51.5625, -49.8720703125, -48.181640625, -46.4912109375, -44.80078125, -43.1103515625, -41.419921875, -39.7294921875, -38.0390625, -36.3486328125, -34.658203125, -32.9677734375, -31.27734375, -29.5869140625, -27.896484375, -26.2060546875, -24.515625, -22.8251953125, -21.134765625, -19.4443359375, -17.75390625, -16.0634765625, -14.373046875, -12.6826171875, -10.9921875, -9.3017578125, -7.611328125, -5.9208984375, -4.23046875, -2.5400390625, -0.849609375, 0.8408203125, 2.53125, 4.2216796875, 5.912109375, 7.6025390625, 9.29296875, 10.9833984375, 12.673828125, 14.3642578125, 16.0546875, 17.7451171875, 19.435546875, 21.1259765625, 22.81640625, 24.5068359375, 26.197265625, 27.8876953125, 29.578125, 31.2685546875, 32.958984375, 34.6494140625, 36.33984375, 38.0302734375, 39.720703125, 41.4111328125, 43.1015625, 44.7919921875, 46.482421875, 48.1728515625, 49.86328125, 51.5537109375, 53.244140625, 54.9345703125, 56.625]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 3.0, 2.0, 7.0, 7.0, 12.0, 11.0, 15.0, 13.0, 19.0, 21.0, 41.0, 25.0, 37.0, 50.0, 48.0, 69.0, 67.0, 195.0, 688.0, 246.0, 102.0, 65.0, 50.0, 43.0, 39.0, 34.0, 36.0, 23.0, 10.0, 18.0, 10.0, 5.0, 4.0, 5.0, 2.0, 5.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-25.015625, -24.32763671875, -23.6396484375, -22.95166015625, -22.263671875, -21.57568359375, -20.8876953125, -20.19970703125, -19.51171875, -18.82373046875, -18.1357421875, -17.44775390625, -16.759765625, -16.07177734375, -15.3837890625, -14.69580078125, -14.0078125, -13.31982421875, -12.6318359375, -11.94384765625, -11.255859375, -10.56787109375, -9.8798828125, -9.19189453125, -8.50390625, -7.81591796875, -7.1279296875, -6.43994140625, -5.751953125, -5.06396484375, -4.3759765625, -3.68798828125, -3.0, -2.31201171875, -1.6240234375, -0.93603515625, -0.248046875, 0.43994140625, 1.1279296875, 1.81591796875, 2.50390625, 3.19189453125, 3.8798828125, 4.56787109375, 5.255859375, 5.94384765625, 6.6318359375, 7.31982421875, 8.0078125, 8.69580078125, 9.3837890625, 10.07177734375, 10.759765625, 11.44775390625, 12.1357421875, 12.82373046875, 13.51171875, 14.19970703125, 14.8876953125, 15.57568359375, 16.263671875, 16.95166015625, 17.6396484375, 18.32763671875, 19.015625]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 5.0, 7.0, 8.0, 24.0, 58.0, 309.0, 440.0, 72.0, 37.0, 22.0, 9.0, 9.0, 4.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.11697387695312, -60.79739761352539, -56.477821350097656, -52.15824508666992, -47.83866882324219, -43.51909255981445, -39.19951629638672, -34.879940032958984, -30.56036376953125, -26.240787506103516, -21.92121124267578, -17.601634979248047, -13.282058715820312, -8.962482452392578, -4.642906188964844, -0.3233299255371094, 3.996246337890625, 8.31582260131836, 12.635398864746094, 16.954975128173828, 21.274551391601562, 25.594127655029297, 29.91370391845703, 34.233280181884766, 38.5528564453125, 42.872432708740234, 47.19200897216797, 51.5115852355957, 55.83116149902344, 60.15073776245117, 64.4703140258789, 68.78988647460938, 73.10945129394531, 77.42903137207031, 81.74860382080078, 86.06817626953125, 90.38775634765625, 94.70733642578125, 99.02690887451172, 103.34648132324219, 107.66606140136719, 111.98564147949219, 116.30521392822266, 120.62478637695312, 124.94436645507812, 129.26394653320312, 133.58352661132812, 137.90309143066406, 142.22267150878906, 146.54225158691406, 150.86181640625, 155.181396484375, 159.5009765625, 163.820556640625, 168.14013671875, 172.45970153808594, 176.77928161621094, 181.09886169433594, 185.41842651367188, 189.73800659179688, 194.05758666992188, 198.37716674804688, 202.69674682617188, 207.0163116455078, 211.3358917236328]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 1.0, 5.0, 2.0, 4.0, 9.0, 12.0, 21.0, 36.0, 56.0, 154.0, 289.0, 227.0, 71.0, 30.0, 27.0, 21.0, 9.0, 12.0, 5.0, 6.0, 0.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-185.36448669433594, -180.1632843017578, -174.9620819091797, -169.76087951660156, -164.55967712402344, -159.3584747314453, -154.1572723388672, -148.95606994628906, -143.75486755371094, -138.5536651611328, -133.3524627685547, -128.15126037597656, -122.95005798339844, -117.74885559082031, -112.54765319824219, -107.34645080566406, -102.14524841308594, -96.94404602050781, -91.74284362792969, -86.54164123535156, -81.34043884277344, -76.13923645019531, -70.93803405761719, -65.73683166503906, -60.53562927246094, -55.33442687988281, -50.13322448730469, -44.93202209472656, -39.73081970214844, -34.52961730957031, -29.328414916992188, -24.127212524414062, -18.925994873046875, -13.72479248046875, -8.523590087890625, -3.3223876953125, 1.878814697265625, 7.08001708984375, 12.281219482421875, 17.482421875, 22.683624267578125, 27.88482666015625, 33.086029052734375, 38.2872314453125, 43.488433837890625, 48.68963623046875, 53.890838623046875, 59.092041015625, 64.29324340820312, 69.49444580078125, 74.69564819335938, 79.8968505859375, 85.09805297851562, 90.29925537109375, 95.50045776367188, 100.70166015625, 105.90286254882812, 111.10406494140625, 116.30526733398438, 121.5064697265625, 126.70767211914062, 131.90887451171875, 137.11007690429688, 142.311279296875, 147.51248168945312]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 9.0, 7.0, 6.0, 12.0, 11.0, 21.0, 20.0, 23.0, 35.0, 36.0, 72.0, 113.0, 143.0, 197.0, 286.0, 429.0, 686.0, 1144.0, 1774.0, 3238.0, 6326.0, 14162.0, 41750.0, 499746.0, 3515690.0, 77109.0, 17152.0, 6615.0, 3190.0, 1700.0, 920.0, 566.0, 337.0, 209.0, 141.0, 119.0, 80.0, 60.0, 32.0, 25.0, 19.0, 24.0, 14.0, 4.0, 6.0, 4.0, 4.0, 6.0, 5.0], "bins": [-2.126953125, -2.072662353515625, -2.01837158203125, -1.964080810546875, -1.9097900390625, -1.855499267578125, -1.80120849609375, -1.746917724609375, -1.692626953125, -1.638336181640625, -1.58404541015625, -1.529754638671875, -1.4754638671875, -1.421173095703125, -1.36688232421875, -1.312591552734375, -1.25830078125, -1.204010009765625, -1.14971923828125, -1.095428466796875, -1.0411376953125, -0.986846923828125, -0.93255615234375, -0.878265380859375, -0.823974609375, -0.769683837890625, -0.71539306640625, -0.661102294921875, -0.6068115234375, -0.552520751953125, -0.49822998046875, -0.443939208984375, -0.3896484375, -0.335357666015625, -0.28106689453125, -0.226776123046875, -0.1724853515625, -0.118194580078125, -0.06390380859375, -0.009613037109375, 0.044677734375, 0.098968505859375, 0.15325927734375, 0.207550048828125, 0.2618408203125, 0.316131591796875, 0.37042236328125, 0.424713134765625, 0.47900390625, 0.533294677734375, 0.58758544921875, 0.641876220703125, 0.6961669921875, 0.750457763671875, 0.80474853515625, 0.859039306640625, 0.913330078125, 0.967620849609375, 1.02191162109375, 1.076202392578125, 1.1304931640625, 1.184783935546875, 1.23907470703125, 1.293365478515625, 1.34765625]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 8.0, 7.0, 6.0, 9.0, 12.0, 10.0, 29.0, 86.0, 559.0, 208.0, 28.0, 11.0, 8.0, 7.0, 4.0, 6.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.342041015625, -0.3329353332519531, -0.32382965087890625, -0.3147239685058594, -0.3056182861328125, -0.2965126037597656, -0.28740692138671875, -0.2783012390136719, -0.269195556640625, -0.2600898742675781, -0.25098419189453125, -0.24187850952148438, -0.2327728271484375, -0.22366714477539062, -0.21456146240234375, -0.20545578002929688, -0.19635009765625, -0.18724441528320312, -0.17813873291015625, -0.16903305053710938, -0.1599273681640625, -0.15082168579101562, -0.14171600341796875, -0.13261032104492188, -0.123504638671875, -0.11439895629882812, -0.10529327392578125, -0.09618759155273438, -0.0870819091796875, -0.07797622680664062, -0.06887054443359375, -0.059764862060546875, -0.0506591796875, -0.041553497314453125, -0.03244781494140625, -0.023342132568359375, -0.0142364501953125, -0.005130767822265625, 0.00397491455078125, 0.013080596923828125, 0.022186279296875, 0.031291961669921875, 0.04039764404296875, 0.049503326416015625, 0.0586090087890625, 0.06771469116210938, 0.07682037353515625, 0.08592605590820312, 0.09503173828125, 0.10413742065429688, 0.11324310302734375, 0.12234878540039062, 0.1314544677734375, 0.14056015014648438, 0.14966583251953125, 0.15877151489257812, 0.167877197265625, 0.17698287963867188, 0.18608856201171875, 0.19519424438476562, 0.2042999267578125, 0.21340560913085938, 0.22251129150390625, 0.23161697387695312, 0.24072265625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 5.0, 3.0, 10.0, 9.0, 13.0, 22.0, 32.0, 40.0, 66.0, 93.0, 143.0, 210.0, 330.0, 574.0, 947.0, 1991.0, 4449.0, 12081.0, 42325.0, 232954.0, 3045814.0, 724255.0, 92107.0, 22280.0, 7369.0, 2953.0, 1413.0, 725.0, 414.0, 227.0, 140.0, 89.0, 52.0, 42.0, 22.0, 21.0, 22.0, 10.0, 8.0, 11.0, 7.0, 2.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 3.0], "bins": [-1.763671875, -1.714324951171875, -1.66497802734375, -1.615631103515625, -1.5662841796875, -1.516937255859375, -1.46759033203125, -1.418243408203125, -1.368896484375, -1.319549560546875, -1.27020263671875, -1.220855712890625, -1.1715087890625, -1.122161865234375, -1.07281494140625, -1.023468017578125, -0.97412109375, -0.924774169921875, -0.87542724609375, -0.826080322265625, -0.7767333984375, -0.727386474609375, -0.67803955078125, -0.628692626953125, -0.579345703125, -0.529998779296875, -0.48065185546875, -0.431304931640625, -0.3819580078125, -0.332611083984375, -0.28326416015625, -0.233917236328125, -0.1845703125, -0.135223388671875, -0.08587646484375, -0.036529541015625, 0.0128173828125, 0.062164306640625, 0.11151123046875, 0.160858154296875, 0.210205078125, 0.259552001953125, 0.30889892578125, 0.358245849609375, 0.4075927734375, 0.456939697265625, 0.50628662109375, 0.555633544921875, 0.60498046875, 0.654327392578125, 0.70367431640625, 0.753021240234375, 0.8023681640625, 0.851715087890625, 0.90106201171875, 0.950408935546875, 0.999755859375, 1.049102783203125, 1.09844970703125, 1.147796630859375, 1.1971435546875, 1.246490478515625, 1.29583740234375, 1.345184326171875, 1.39453125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 3.0, 2.0, 9.0, 8.0, 9.0, 19.0, 16.0, 16.0, 39.0, 69.0, 68.0, 91.0, 135.0, 184.0, 215.0, 382.0, 663.0, 767.0, 406.0, 249.0, 194.0, 128.0, 78.0, 60.0, 65.0, 47.0, 34.0, 21.0, 20.0, 10.0, 11.0, 8.0, 10.0, 9.0, 7.0, 4.0, 5.0, 1.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.33544921875, -0.32464599609375, -0.3138427734375, -0.30303955078125, -0.292236328125, -0.28143310546875, -0.2706298828125, -0.25982666015625, -0.2490234375, -0.23822021484375, -0.2274169921875, -0.21661376953125, -0.205810546875, -0.19500732421875, -0.1842041015625, -0.17340087890625, -0.16259765625, -0.15179443359375, -0.1409912109375, -0.13018798828125, -0.119384765625, -0.10858154296875, -0.0977783203125, -0.08697509765625, -0.076171875, -0.06536865234375, -0.0545654296875, -0.04376220703125, -0.032958984375, -0.02215576171875, -0.0113525390625, -0.00054931640625, 0.01025390625, 0.02105712890625, 0.0318603515625, 0.04266357421875, 0.053466796875, 0.06427001953125, 0.0750732421875, 0.08587646484375, 0.0966796875, 0.10748291015625, 0.1182861328125, 0.12908935546875, 0.139892578125, 0.15069580078125, 0.1614990234375, 0.17230224609375, 0.18310546875, 0.19390869140625, 0.2047119140625, 0.21551513671875, 0.226318359375, 0.23712158203125, 0.2479248046875, 0.25872802734375, 0.26953125, 0.28033447265625, 0.2911376953125, 0.30194091796875, 0.312744140625, 0.32354736328125, 0.3343505859375, 0.34515380859375, 0.35595703125]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 9.0, 7.0, 14.0, 23.0, 41.0, 35.0, 64.0, 120.0, 108.0, 156.0, 143.0, 87.0, 63.0, 47.0, 26.0, 20.0, 12.0, 10.0, 9.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.740549087524414, -2.6274378299713135, -2.514326810836792, -2.4012155532836914, -2.288104295730591, -2.1749930381774902, -2.0618820190429688, -1.9487707614898682, -1.8356596231460571, -1.722548484802246, -1.6094372272491455, -1.4963260889053345, -1.3832149505615234, -1.2701036930084229, -1.1569925546646118, -1.0438814163208008, -0.9307701587677002, -0.8176589608192444, -0.7045477628707886, -0.5914366245269775, -0.47832542657852173, -0.3652142286300659, -0.2521030902862549, -0.13899189233779907, -0.02588069438934326, 0.08723048865795135, 0.20034167170524597, 0.3134528398513794, 0.4265640377998352, 0.539675235748291, 0.652786374092102, 0.7658975720405579, 0.8790087699890137, 0.9921199679374695, 1.1052311658859253, 1.2183423042297363, 1.331453561782837, 1.444564700126648, 1.557675838470459, 1.6707870960235596, 1.7838982343673706, 1.8970093727111816, 2.0101206302642822, 2.123231887817383, 2.2363429069519043, 2.349454164505005, 2.4625654220581055, 2.575676441192627, 2.6887876987457275, 2.801898956298828, 2.9150099754333496, 3.02812123298645, 3.141232490539551, 3.2543435096740723, 3.367454767227173, 3.4805660247802734, 3.593677043914795, 3.7067883014678955, 3.819899320602417, 3.9330105781555176, 4.046121597290039, 4.159233093261719, 4.27234411239624, 4.385455131530762, 4.498566627502441]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 5.0, 6.0, 8.0, 6.0, 10.0, 11.0, 12.0, 19.0, 23.0, 14.0, 23.0, 18.0, 26.0, 35.0, 33.0, 36.0, 31.0, 47.0, 32.0, 34.0, 43.0, 42.0, 45.0, 41.0, 50.0, 34.0, 34.0, 34.0, 31.0, 30.0, 24.0, 21.0, 32.0, 15.0, 16.0, 15.0, 15.0, 12.0, 12.0, 11.0, 8.0, 4.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.75883948802948, -1.707336187362671, -1.6558327674865723, -1.6043294668197632, -1.552826166152954, -1.5013227462768555, -1.4498194456100464, -1.3983161449432373, -1.3468127250671387, -1.2953094244003296, -1.243806004524231, -1.1923027038574219, -1.1407994031906128, -1.0892961025238037, -1.037792682647705, -0.986289381980896, -0.9347860813140869, -0.8832827210426331, -0.831779420375824, -0.7802760601043701, -0.728772759437561, -0.6772693991661072, -0.6257660388946533, -0.5742627382278442, -0.5227593779563904, -0.4712560474872589, -0.41975271701812744, -0.3682493567466736, -0.3167460262775421, -0.26524269580841064, -0.2137393355369568, -0.16223600506782532, -0.1107325553894043, -0.05922921746969223, -0.007725879549980164, 0.0437774658203125, 0.09528079628944397, 0.14678412675857544, 0.1982874870300293, 0.24979081749916077, 0.30129414796829224, 0.3527974784374237, 0.4043008089065552, 0.45580416917800903, 0.5073075294494629, 0.558810830116272, 0.6103141903877258, 0.6618175506591797, 0.7133208513259888, 0.7648242115974426, 0.8163275122642517, 0.8678308725357056, 0.9193341732025146, 0.9708375334739685, 1.0223408937454224, 1.0738441944122314, 1.12534761428833, 1.1768509149551392, 1.2283543348312378, 1.2798576354980469, 1.331360936164856, 1.382864236831665, 1.4343676567077637, 1.4858709573745728, 1.5373742580413818]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 2.0, 7.0, 8.0, 13.0, 19.0, 27.0, 33.0, 42.0, 76.0, 95.0, 167.0, 254.0, 432.0, 717.0, 1273.0, 2730.0, 6547.0, 21195.0, 216081.0, 734762.0, 45964.0, 10272.0, 3893.0, 1689.0, 829.0, 509.0, 299.0, 192.0, 147.0, 89.0, 66.0, 37.0, 28.0, 26.0, 21.0, 6.0, 6.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.802734375, -1.7467803955078125, -1.690826416015625, -1.6348724365234375, -1.57891845703125, -1.5229644775390625, -1.467010498046875, -1.4110565185546875, -1.3551025390625, -1.2991485595703125, -1.243194580078125, -1.1872406005859375, -1.13128662109375, -1.0753326416015625, -1.019378662109375, -0.9634246826171875, -0.907470703125, -0.8515167236328125, -0.795562744140625, -0.7396087646484375, -0.68365478515625, -0.6277008056640625, -0.571746826171875, -0.5157928466796875, -0.4598388671875, -0.4038848876953125, -0.347930908203125, -0.2919769287109375, -0.23602294921875, -0.1800689697265625, -0.124114990234375, -0.0681610107421875, -0.01220703125, 0.0437469482421875, 0.099700927734375, 0.1556549072265625, 0.21160888671875, 0.2675628662109375, 0.323516845703125, 0.3794708251953125, 0.4354248046875, 0.4913787841796875, 0.547332763671875, 0.6032867431640625, 0.65924072265625, 0.7151947021484375, 0.771148681640625, 0.8271026611328125, 0.883056640625, 0.9390106201171875, 0.994964599609375, 1.0509185791015625, 1.10687255859375, 1.1628265380859375, 1.218780517578125, 1.2747344970703125, 1.3306884765625, 1.3866424560546875, 1.442596435546875, 1.4985504150390625, 1.55450439453125, 1.6104583740234375, 1.666412353515625, 1.7223663330078125, 1.7783203125]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 5.0, 7.0, 8.0, 5.0, 13.0, 21.0, 23.0, 97.0, 178.0, 274.0, 185.0, 101.0, 32.0, 19.0, 11.0, 4.0, 5.0, 8.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2568359375, -0.2486724853515625, -0.240509033203125, -0.2323455810546875, -0.22418212890625, -0.2160186767578125, -0.207855224609375, -0.1996917724609375, -0.1915283203125, -0.1833648681640625, -0.175201416015625, -0.1670379638671875, -0.15887451171875, -0.1507110595703125, -0.142547607421875, -0.1343841552734375, -0.126220703125, -0.1180572509765625, -0.109893798828125, -0.1017303466796875, -0.09356689453125, -0.0854034423828125, -0.077239990234375, -0.0690765380859375, -0.0609130859375, -0.0527496337890625, -0.044586181640625, -0.0364227294921875, -0.02825927734375, -0.0200958251953125, -0.011932373046875, -0.0037689208984375, 0.00439453125, 0.0125579833984375, 0.020721435546875, 0.0288848876953125, 0.03704833984375, 0.0452117919921875, 0.053375244140625, 0.0615386962890625, 0.0697021484375, 0.0778656005859375, 0.086029052734375, 0.0941925048828125, 0.10235595703125, 0.1105194091796875, 0.118682861328125, 0.1268463134765625, 0.135009765625, 0.1431732177734375, 0.151336669921875, 0.1595001220703125, 0.16766357421875, 0.1758270263671875, 0.183990478515625, 0.1921539306640625, 0.2003173828125, 0.2084808349609375, 0.216644287109375, 0.2248077392578125, 0.23297119140625, 0.2411346435546875, 0.249298095703125, 0.2574615478515625, 0.265625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 4.0, 2.0, 11.0, 5.0, 5.0, 10.0, 12.0, 20.0, 21.0, 34.0, 43.0, 101.0, 153.0, 361.0, 686.0, 1676.0, 4615.0, 15703.0, 80455.0, 607377.0, 284229.0, 38428.0, 9227.0, 3026.0, 1233.0, 530.0, 233.0, 110.0, 76.0, 47.0, 37.0, 22.0, 24.0, 12.0, 7.0, 6.0, 2.0, 4.0, 5.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.138671875, -2.0753936767578125, -2.012115478515625, -1.9488372802734375, -1.88555908203125, -1.8222808837890625, -1.759002685546875, -1.6957244873046875, -1.6324462890625, -1.5691680908203125, -1.505889892578125, -1.4426116943359375, -1.37933349609375, -1.3160552978515625, -1.252777099609375, -1.1894989013671875, -1.126220703125, -1.0629425048828125, -0.999664306640625, -0.9363861083984375, -0.87310791015625, -0.8098297119140625, -0.746551513671875, -0.6832733154296875, -0.6199951171875, -0.5567169189453125, -0.493438720703125, -0.4301605224609375, -0.36688232421875, -0.3036041259765625, -0.240325927734375, -0.1770477294921875, -0.11376953125, -0.0504913330078125, 0.012786865234375, 0.0760650634765625, 0.13934326171875, 0.2026214599609375, 0.265899658203125, 0.3291778564453125, 0.3924560546875, 0.4557342529296875, 0.519012451171875, 0.5822906494140625, 0.64556884765625, 0.7088470458984375, 0.772125244140625, 0.8354034423828125, 0.898681640625, 0.9619598388671875, 1.025238037109375, 1.0885162353515625, 1.15179443359375, 1.2150726318359375, 1.278350830078125, 1.3416290283203125, 1.4049072265625, 1.4681854248046875, 1.531463623046875, 1.5947418212890625, 1.65802001953125, 1.7212982177734375, 1.784576416015625, 1.8478546142578125, 1.9111328125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 9.0, 2.0, 5.0, 5.0, 5.0, 11.0, 13.0, 13.0, 10.0, 18.0, 18.0, 24.0, 26.0, 21.0, 26.0, 27.0, 25.0, 26.0, 26.0, 33.0, 34.0, 35.0, 35.0, 32.0, 36.0, 42.0, 40.0, 39.0, 23.0, 43.0, 23.0, 27.0, 38.0, 26.0, 20.0, 20.0, 27.0, 23.0, 22.0, 11.0, 14.0, 8.0, 5.0, 5.0, 4.0, 11.0, 4.0, 2.0, 5.0, 5.0, 4.0, 2.0, 3.0, 0.0, 1.0], "bins": [-0.7841796875, -0.7606277465820312, -0.7370758056640625, -0.7135238647460938, -0.689971923828125, -0.6664199829101562, -0.6428680419921875, -0.6193161010742188, -0.59576416015625, -0.5722122192382812, -0.5486602783203125, -0.5251083374023438, -0.501556396484375, -0.47800445556640625, -0.4544525146484375, -0.43090057373046875, -0.4073486328125, -0.38379669189453125, -0.3602447509765625, -0.33669281005859375, -0.313140869140625, -0.28958892822265625, -0.2660369873046875, -0.24248504638671875, -0.21893310546875, -0.19538116455078125, -0.1718292236328125, -0.14827728271484375, -0.124725341796875, -0.10117340087890625, -0.0776214599609375, -0.05406951904296875, -0.030517578125, -0.00696563720703125, 0.0165863037109375, 0.04013824462890625, 0.063690185546875, 0.08724212646484375, 0.1107940673828125, 0.13434600830078125, 0.15789794921875, 0.18144989013671875, 0.2050018310546875, 0.22855377197265625, 0.252105712890625, 0.27565765380859375, 0.2992095947265625, 0.32276153564453125, 0.3463134765625, 0.36986541748046875, 0.3934173583984375, 0.41696929931640625, 0.440521240234375, 0.46407318115234375, 0.4876251220703125, 0.5111770629882812, 0.53472900390625, 0.5582809448242188, 0.5818328857421875, 0.6053848266601562, 0.628936767578125, 0.6524887084960938, 0.6760406494140625, 0.6995925903320312, 0.72314453125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 6.0, 7.0, 15.0, 15.0, 22.0, 36.0, 58.0, 132.0, 413.0, 1307.0, 15999.0, 1019437.0, 9439.0, 1071.0, 308.0, 124.0, 68.0, 44.0, 16.0, 12.0, 8.0, 5.0, 6.0, 2.0, 0.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.625, -10.29736328125, -9.9697265625, -9.64208984375, -9.314453125, -8.98681640625, -8.6591796875, -8.33154296875, -8.00390625, -7.67626953125, -7.3486328125, -7.02099609375, -6.693359375, -6.36572265625, -6.0380859375, -5.71044921875, -5.3828125, -5.05517578125, -4.7275390625, -4.39990234375, -4.072265625, -3.74462890625, -3.4169921875, -3.08935546875, -2.76171875, -2.43408203125, -2.1064453125, -1.77880859375, -1.451171875, -1.12353515625, -0.7958984375, -0.46826171875, -0.140625, 0.18701171875, 0.5146484375, 0.84228515625, 1.169921875, 1.49755859375, 1.8251953125, 2.15283203125, 2.48046875, 2.80810546875, 3.1357421875, 3.46337890625, 3.791015625, 4.11865234375, 4.4462890625, 4.77392578125, 5.1015625, 5.42919921875, 5.7568359375, 6.08447265625, 6.412109375, 6.73974609375, 7.0673828125, 7.39501953125, 7.72265625, 8.05029296875, 8.3779296875, 8.70556640625, 9.033203125, 9.36083984375, 9.6884765625, 10.01611328125, 10.34375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 3.0, 2.0, 7.0, 4.0, 8.0, 10.0, 6.0, 17.0, 23.0, 29.0, 48.0, 85.0, 124.0, 239.0, 138.0, 83.0, 49.0, 32.0, 24.0, 16.0, 10.0, 9.0, 3.0, 4.0, 2.0, 4.0, 6.0, 3.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00121307373046875, -0.001161724328994751, -0.001110374927520752, -0.001059025526046753, -0.001007676124572754, -0.0009563267230987549, -0.0009049773216247559, -0.0008536279201507568, -0.0008022785186767578, -0.0007509291172027588, -0.0006995797157287598, -0.0006482303142547607, -0.0005968809127807617, -0.0005455315113067627, -0.0004941821098327637, -0.00044283270835876465, -0.0003914833068847656, -0.0003401339054107666, -0.0002887845039367676, -0.00023743510246276855, -0.00018608570098876953, -0.0001347362995147705, -8.338689804077148e-05, -3.203749656677246e-05, 1.9311904907226562e-05, 7.066130638122559e-05, 0.00012201070785522461, 0.00017336010932922363, 0.00022470951080322266, 0.0002760589122772217, 0.0003274083137512207, 0.0003787577152252197, 0.00043010711669921875, 0.0004814565181732178, 0.0005328059196472168, 0.0005841553211212158, 0.0006355047225952148, 0.0006868541240692139, 0.0007382035255432129, 0.0007895529270172119, 0.0008409023284912109, 0.00089225172996521, 0.000943601131439209, 0.000994950532913208, 0.001046299934387207, 0.001097649335861206, 0.001148998737335205, 0.001200348138809204, 0.0012516975402832031, 0.0013030469417572021, 0.0013543963432312012, 0.0014057457447052002, 0.0014570951461791992, 0.0015084445476531982, 0.0015597939491271973, 0.0016111433506011963, 0.0016624927520751953, 0.0017138421535491943, 0.0017651915550231934, 0.0018165409564971924, 0.0018678903579711914, 0.0019192397594451904, 0.0019705891609191895, 0.0020219385623931885, 0.0020732879638671875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 3.0, 3.0, 7.0, 11.0, 8.0, 8.0, 24.0, 34.0, 34.0, 43.0, 74.0, 122.0, 150.0, 250.0, 433.0, 693.0, 1234.0, 2290.0, 4964.0, 12772.0, 43894.0, 306322.0, 573071.0, 71587.0, 17714.0, 6380.0, 2899.0, 1459.0, 753.0, 454.0, 261.0, 168.0, 134.0, 93.0, 61.0, 48.0, 34.0, 21.0, 14.0, 10.0, 3.0, 7.0, 6.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0], "bins": [-1.8955078125, -1.844482421875, -1.79345703125, -1.742431640625, -1.69140625, -1.640380859375, -1.58935546875, -1.538330078125, -1.4873046875, -1.436279296875, -1.38525390625, -1.334228515625, -1.283203125, -1.232177734375, -1.18115234375, -1.130126953125, -1.0791015625, -1.028076171875, -0.97705078125, -0.926025390625, -0.875, -0.823974609375, -0.77294921875, -0.721923828125, -0.6708984375, -0.619873046875, -0.56884765625, -0.517822265625, -0.466796875, -0.415771484375, -0.36474609375, -0.313720703125, -0.2626953125, -0.211669921875, -0.16064453125, -0.109619140625, -0.05859375, -0.007568359375, 0.04345703125, 0.094482421875, 0.1455078125, 0.196533203125, 0.24755859375, 0.298583984375, 0.349609375, 0.400634765625, 0.45166015625, 0.502685546875, 0.5537109375, 0.604736328125, 0.65576171875, 0.706787109375, 0.7578125, 0.808837890625, 0.85986328125, 0.910888671875, 0.9619140625, 1.012939453125, 1.06396484375, 1.114990234375, 1.166015625, 1.217041015625, 1.26806640625, 1.319091796875, 1.3701171875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 5.0, 1.0, 2.0, 4.0, 11.0, 7.0, 8.0, 17.0, 26.0, 40.0, 53.0, 84.0, 84.0, 92.0, 100.0, 100.0, 64.0, 69.0, 66.0, 53.0, 47.0, 18.0, 13.0, 10.0, 10.0, 6.0, 4.0, 3.0, 2.0, 2.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5888671875, -1.543243408203125, -1.49761962890625, -1.451995849609375, -1.4063720703125, -1.360748291015625, -1.31512451171875, -1.269500732421875, -1.223876953125, -1.178253173828125, -1.13262939453125, -1.087005615234375, -1.0413818359375, -0.995758056640625, -0.95013427734375, -0.904510498046875, -0.85888671875, -0.813262939453125, -0.76763916015625, -0.722015380859375, -0.6763916015625, -0.630767822265625, -0.58514404296875, -0.539520263671875, -0.493896484375, -0.448272705078125, -0.40264892578125, -0.357025146484375, -0.3114013671875, -0.265777587890625, -0.22015380859375, -0.174530029296875, -0.12890625, -0.083282470703125, -0.03765869140625, 0.007965087890625, 0.0535888671875, 0.099212646484375, 0.14483642578125, 0.190460205078125, 0.236083984375, 0.281707763671875, 0.32733154296875, 0.372955322265625, 0.4185791015625, 0.464202880859375, 0.50982666015625, 0.555450439453125, 0.60107421875, 0.646697998046875, 0.69232177734375, 0.737945556640625, 0.7835693359375, 0.829193115234375, 0.87481689453125, 0.920440673828125, 0.966064453125, 1.011688232421875, 1.05731201171875, 1.102935791015625, 1.1485595703125, 1.194183349609375, 1.23980712890625, 1.285430908203125, 1.3310546875]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 4.0, 6.0, 10.0, 29.0, 59.0, 167.0, 361.0, 229.0, 79.0, 25.0, 15.0, 9.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.5438232421875, -32.677268981933594, -31.810714721679688, -30.94416046142578, -30.077606201171875, -29.21105194091797, -28.34449577331543, -27.477941513061523, -26.611387252807617, -25.74483299255371, -24.878278732299805, -24.0117244720459, -23.14516830444336, -22.278614044189453, -21.412059783935547, -20.54550552368164, -19.678951263427734, -18.812397003173828, -17.945842742919922, -17.079288482666016, -16.21273422241211, -15.346179008483887, -14.479623794555664, -13.613069534301758, -12.746515274047852, -11.879961013793945, -11.013406753540039, -10.146851539611816, -9.28029727935791, -8.413743019104004, -7.5471882820129395, -6.680633544921875, -5.814077377319336, -4.94752311706543, -4.080968379974365, -3.21441388130188, -2.3478593826293945, -1.4813051223754883, -0.6147503852844238, 0.2518043518066406, 1.1183586120605469, 1.9849131107330322, 2.8514676094055176, 3.718022108078003, 4.584576606750488, 5.4511308670043945, 6.317685604095459, 7.184240341186523, 8.05079460144043, 8.917348861694336, 9.783903121948242, 10.650458335876465, 11.517012596130371, 12.383566856384277, 13.2501220703125, 14.116676330566406, 14.983230590820312, 15.849784851074219, 16.716339111328125, 17.58289337158203, 18.449447631835938, 19.316001892089844, 20.182558059692383, 21.04911231994629, 21.915666580200195]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 4.0, 3.0, 8.0, 8.0, 10.0, 26.0, 41.0, 58.0, 135.0, 154.0, 154.0, 125.0, 104.0, 77.0, 30.0, 17.0, 11.0, 5.0, 6.0, 4.0, 6.0, 3.0, 2.0, 1.0, 0.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.52658462524414, -22.83984375, -22.153104782104492, -21.46636390686035, -20.77962303161621, -20.092884063720703, -19.406143188476562, -18.719402313232422, -18.03266143798828, -17.34592056274414, -16.659181594848633, -15.972440719604492, -15.285699844360352, -14.598959922790527, -13.912220001220703, -13.225479125976562, -12.538740158081055, -11.85200023651123, -11.16525936126709, -10.478519439697266, -9.791778564453125, -9.1050386428833, -8.418298721313477, -7.731558322906494, -7.044817924499512, -6.358077526092529, -5.671337127685547, -4.984597206115723, -4.29785680770874, -3.611116409301758, -2.9243764877319336, -2.237636089324951, -1.5508975982666016, -0.8641573190689087, -0.17741703987121582, 0.5093231201171875, 1.19606351852417, 1.8828039169311523, 2.5695438385009766, 3.256284236907959, 3.9430246353149414, 4.629765033721924, 5.316505432128906, 6.0032453536987305, 6.689985752105713, 7.376726150512695, 8.06346607208252, 8.750205993652344, 9.436946868896484, 10.123686790466309, 10.81042766571045, 11.497167587280273, 12.183908462524414, 12.870648384094238, 13.557388305664062, 14.244129180908203, 14.930869102478027, 15.617609024047852, 16.304349899291992, 16.9910888671875, 17.67782974243164, 18.36457061767578, 19.051311492919922, 19.73805046081543, 20.42479133605957]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 5.0, 4.0, 3.0, 13.0, 10.0, 23.0, 38.0, 111.0, 383.0, 2324.0, 66612.0, 4115479.0, 8105.0, 853.0, 170.0, 46.0, 21.0, 24.0, 11.0, 10.0, 7.0, 4.0, 5.0, 4.0, 3.0, 1.0, 3.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.15625, -17.6260986328125, -17.095947265625, -16.5657958984375, -16.03564453125, -15.5054931640625, -14.975341796875, -14.4451904296875, -13.9150390625, -13.3848876953125, -12.854736328125, -12.3245849609375, -11.79443359375, -11.2642822265625, -10.734130859375, -10.2039794921875, -9.673828125, -9.1436767578125, -8.613525390625, -8.0833740234375, -7.55322265625, -7.0230712890625, -6.492919921875, -5.9627685546875, -5.4326171875, -4.9024658203125, -4.372314453125, -3.8421630859375, -3.31201171875, -2.7818603515625, -2.251708984375, -1.7215576171875, -1.19140625, -0.6612548828125, -0.131103515625, 0.3990478515625, 0.92919921875, 1.4593505859375, 1.989501953125, 2.5196533203125, 3.0498046875, 3.5799560546875, 4.110107421875, 4.6402587890625, 5.17041015625, 5.7005615234375, 6.230712890625, 6.7608642578125, 7.291015625, 7.8211669921875, 8.351318359375, 8.8814697265625, 9.41162109375, 9.9417724609375, 10.471923828125, 11.0020751953125, 11.5322265625, 12.0623779296875, 12.592529296875, 13.1226806640625, 13.65283203125, 14.1829833984375, 14.713134765625, 15.2432861328125, 15.7734375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 5.0, 9.0, 5.0, 9.0, 8.0, 23.0, 23.0, 42.0, 64.0, 97.0, 144.0, 181.0, 140.0, 83.0, 56.0, 35.0, 18.0, 15.0, 17.0, 6.0, 3.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.23095703125, -0.22421836853027344, -0.21747970581054688, -0.2107410430908203, -0.20400238037109375, -0.1972637176513672, -0.19052505493164062, -0.18378639221191406, -0.1770477294921875, -0.17030906677246094, -0.16357040405273438, -0.1568317413330078, -0.15009307861328125, -0.1433544158935547, -0.13661575317382812, -0.12987709045410156, -0.123138427734375, -0.11639976501464844, -0.10966110229492188, -0.10292243957519531, -0.09618377685546875, -0.08944511413574219, -0.08270645141601562, -0.07596778869628906, -0.0692291259765625, -0.06249046325683594, -0.055751800537109375, -0.04901313781738281, -0.04227447509765625, -0.03553581237792969, -0.028797149658203125, -0.022058486938476562, -0.01531982421875, -0.008581161499023438, -0.001842498779296875, 0.0048961639404296875, 0.01163482666015625, 0.018373489379882812, 0.025112152099609375, 0.03185081481933594, 0.0385894775390625, 0.04532814025878906, 0.052066802978515625, 0.05880546569824219, 0.06554412841796875, 0.07228279113769531, 0.07902145385742188, 0.08576011657714844, 0.092498779296875, 0.09923744201660156, 0.10597610473632812, 0.11271476745605469, 0.11945343017578125, 0.1261920928955078, 0.13293075561523438, 0.13966941833496094, 0.1464080810546875, 0.15314674377441406, 0.15988540649414062, 0.1666240692138672, 0.17336273193359375, 0.1801013946533203, 0.18684005737304688, 0.19357872009277344, 0.2003173828125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 5.0, 4.0, 10.0, 15.0, 30.0, 34.0, 97.0, 152.0, 340.0, 781.0, 2073.0, 7276.0, 46282.0, 3640254.0, 465376.0, 24446.0, 4807.0, 1394.0, 513.0, 203.0, 105.0, 44.0, 22.0, 16.0, 4.0, 3.0, 2.0], "bins": [-8.90625, -8.731109619140625, -8.55596923828125, -8.380828857421875, -8.2056884765625, -8.030548095703125, -7.85540771484375, -7.680267333984375, -7.505126953125, -7.329986572265625, -7.15484619140625, -6.979705810546875, -6.8045654296875, -6.629425048828125, -6.45428466796875, -6.279144287109375, -6.10400390625, -5.928863525390625, -5.75372314453125, -5.578582763671875, -5.4034423828125, -5.228302001953125, -5.05316162109375, -4.878021240234375, -4.702880859375, -4.527740478515625, -4.35260009765625, -4.177459716796875, -4.0023193359375, -3.827178955078125, -3.65203857421875, -3.476898193359375, -3.3017578125, -3.126617431640625, -2.95147705078125, -2.776336669921875, -2.6011962890625, -2.426055908203125, -2.25091552734375, -2.075775146484375, -1.900634765625, -1.725494384765625, -1.55035400390625, -1.375213623046875, -1.2000732421875, -1.024932861328125, -0.84979248046875, -0.674652099609375, -0.49951171875, -0.324371337890625, -0.14923095703125, 0.025909423828125, 0.2010498046875, 0.376190185546875, 0.55133056640625, 0.726470947265625, 0.901611328125, 1.076751708984375, 1.25189208984375, 1.427032470703125, 1.6021728515625, 1.777313232421875, 1.95245361328125, 2.127593994140625, 2.302734375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 7.0, 8.0, 9.0, 8.0, 14.0, 27.0, 29.0, 56.0, 94.0, 154.0, 316.0, 1658.0, 1107.0, 236.0, 122.0, 64.0, 37.0, 33.0, 23.0, 13.0, 15.0, 9.0, 6.0, 7.0, 4.0, 4.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.60205078125, -0.5861930847167969, -0.5703353881835938, -0.5544776916503906, -0.5386199951171875, -0.5227622985839844, -0.5069046020507812, -0.4910469055175781, -0.475189208984375, -0.4593315124511719, -0.44347381591796875, -0.4276161193847656, -0.4117584228515625, -0.3959007263183594, -0.38004302978515625, -0.3641853332519531, -0.34832763671875, -0.3324699401855469, -0.31661224365234375, -0.3007545471191406, -0.2848968505859375, -0.2690391540527344, -0.25318145751953125, -0.23732376098632812, -0.221466064453125, -0.20560836791992188, -0.18975067138671875, -0.17389297485351562, -0.1580352783203125, -0.14217758178710938, -0.12631988525390625, -0.11046218872070312, -0.0946044921875, -0.07874679565429688, -0.06288909912109375, -0.047031402587890625, -0.0311737060546875, -0.015316009521484375, 0.00054168701171875, 0.016399383544921875, 0.032257080078125, 0.048114776611328125, 0.06397247314453125, 0.07983016967773438, 0.0956878662109375, 0.11154556274414062, 0.12740325927734375, 0.14326095581054688, 0.15911865234375, 0.17497634887695312, 0.19083404541015625, 0.20669174194335938, 0.2225494384765625, 0.23840713500976562, 0.25426483154296875, 0.2701225280761719, 0.285980224609375, 0.3018379211425781, 0.31769561767578125, 0.3335533142089844, 0.3494110107421875, 0.3652687072753906, 0.38112640380859375, 0.3969841003417969, 0.412841796875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 21.0, 53.0, 379.0, 523.0, 29.0, 7.0, 3.0], "bins": [-34.966556549072266, -34.38604736328125, -33.805538177490234, -33.22502899169922, -32.6445198059082, -32.06401062011719, -31.483501434326172, -30.902990341186523, -30.322481155395508, -29.741971969604492, -29.161462783813477, -28.58095359802246, -28.000444412231445, -27.419933319091797, -26.83942413330078, -26.258914947509766, -25.67840576171875, -25.097896575927734, -24.51738739013672, -23.936878204345703, -23.356369018554688, -22.775859832763672, -22.195350646972656, -21.614839553833008, -21.034332275390625, -20.45382308959961, -19.873313903808594, -19.292804718017578, -18.712295532226562, -18.131786346435547, -17.55127716064453, -16.970766067504883, -16.3902587890625, -15.809749603271484, -15.229240417480469, -14.648731231689453, -14.068221092224121, -13.487711906433105, -12.90720272064209, -12.326692581176758, -11.746183395385742, -11.165674209594727, -10.585165023803711, -10.004655838012695, -9.424145698547363, -8.843636512756348, -8.263127326965332, -7.682617664337158, -7.102108478546143, -6.521599292755127, -5.941089630126953, -5.3605804443359375, -4.780071258544922, -4.199561595916748, -3.6190524101257324, -3.0385427474975586, -2.458033561706543, -1.8775241374969482, -1.297014832496643, -0.7165055274963379, -0.13599610328674316, 0.44451332092285156, 1.0250225067138672, 1.605532169342041, 2.1860413551330566]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 6.0, 4.0, 4.0, 5.0, 11.0, 14.0, 20.0, 13.0, 22.0, 35.0, 28.0, 35.0, 43.0, 55.0, 60.0, 68.0, 64.0, 79.0, 65.0, 67.0, 64.0, 61.0, 38.0, 45.0, 26.0, 19.0, 18.0, 9.0, 5.0, 3.0, 8.0, 3.0, 2.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7313475608825684, -2.6398019790649414, -2.5482561588287354, -2.4567105770111084, -2.3651649951934814, -2.2736191749572754, -2.1820735931396484, -2.0905280113220215, -1.998982310295105, -1.9074366092681885, -1.8158910274505615, -1.724345326423645, -1.6327996253967285, -1.5412540435791016, -1.449708342552185, -1.3581626415252686, -1.2666170597076416, -1.175071358680725, -1.0835257768630981, -0.9919800758361816, -0.9004344344139099, -0.8088887929916382, -0.7173430919647217, -0.62579745054245, -0.5342518091201782, -0.4427061676979065, -0.3511604964733124, -0.25961482524871826, -0.16806918382644653, -0.0765235424041748, 0.0150221586227417, 0.10656780004501343, 0.19811344146728516, 0.2896590828895569, 0.381204754114151, 0.4727504253387451, 0.5642960667610168, 0.6558417081832886, 0.7473874092102051, 0.8389330506324768, 0.9304786920547485, 1.022024393081665, 1.113569974899292, 1.2051156759262085, 1.296661376953125, 1.388206958770752, 1.4797526597976685, 1.571298360824585, 1.662843942642212, 1.7543896436691284, 1.8459352254867554, 1.9374809265136719, 2.029026508331299, 2.120572090148926, 2.212117910385132, 2.303663492202759, 2.395209312438965, 2.486754894256592, 2.578300714492798, 2.669846296310425, 2.7613918781280518, 2.852937698364258, 2.9444832801818848, 3.0360288619995117, 3.1275744438171387]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 6.0, 8.0, 5.0, 5.0, 4.0, 5.0, 23.0, 23.0, 41.0, 58.0, 89.0, 146.0, 238.0, 428.0, 774.0, 1667.0, 3580.0, 8845.0, 25130.0, 92688.0, 477378.0, 338656.0, 66190.0, 19235.0, 7231.0, 2939.0, 1438.0, 725.0, 395.0, 208.0, 122.0, 81.0, 70.0, 39.0, 22.0, 22.0, 18.0, 11.0, 7.0, 6.0, 4.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.9033203125, -1.85028076171875, -1.7972412109375, -1.74420166015625, -1.691162109375, -1.63812255859375, -1.5850830078125, -1.53204345703125, -1.47900390625, -1.42596435546875, -1.3729248046875, -1.31988525390625, -1.266845703125, -1.21380615234375, -1.1607666015625, -1.10772705078125, -1.0546875, -1.00164794921875, -0.9486083984375, -0.89556884765625, -0.842529296875, -0.78948974609375, -0.7364501953125, -0.68341064453125, -0.63037109375, -0.57733154296875, -0.5242919921875, -0.47125244140625, -0.418212890625, -0.36517333984375, -0.3121337890625, -0.25909423828125, -0.2060546875, -0.15301513671875, -0.0999755859375, -0.04693603515625, 0.006103515625, 0.05914306640625, 0.1121826171875, 0.16522216796875, 0.21826171875, 0.27130126953125, 0.3243408203125, 0.37738037109375, 0.430419921875, 0.48345947265625, 0.5364990234375, 0.58953857421875, 0.642578125, 0.69561767578125, 0.7486572265625, 0.80169677734375, 0.854736328125, 0.90777587890625, 0.9608154296875, 1.01385498046875, 1.06689453125, 1.11993408203125, 1.1729736328125, 1.22601318359375, 1.279052734375, 1.33209228515625, 1.3851318359375, 1.43817138671875, 1.4912109375]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 5.0, 4.0, 6.0, 7.0, 12.0, 13.0, 18.0, 18.0, 30.0, 36.0, 41.0, 42.0, 63.0, 75.0, 93.0, 95.0, 80.0, 74.0, 57.0, 49.0, 46.0, 38.0, 26.0, 18.0, 20.0, 13.0, 8.0, 6.0, 1.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1517333984375, -0.14717864990234375, -0.1426239013671875, -0.13806915283203125, -0.133514404296875, -0.12895965576171875, -0.1244049072265625, -0.11985015869140625, -0.11529541015625, -0.11074066162109375, -0.1061859130859375, -0.10163116455078125, -0.097076416015625, -0.09252166748046875, -0.0879669189453125, -0.08341217041015625, -0.078857421875, -0.07430267333984375, -0.0697479248046875, -0.06519317626953125, -0.060638427734375, -0.05608367919921875, -0.0515289306640625, -0.04697418212890625, -0.04241943359375, -0.03786468505859375, -0.0333099365234375, -0.02875518798828125, -0.024200439453125, -0.01964569091796875, -0.0150909423828125, -0.01053619384765625, -0.0059814453125, -0.00142669677734375, 0.0031280517578125, 0.00768280029296875, 0.012237548828125, 0.01679229736328125, 0.0213470458984375, 0.02590179443359375, 0.03045654296875, 0.03501129150390625, 0.0395660400390625, 0.04412078857421875, 0.048675537109375, 0.05323028564453125, 0.0577850341796875, 0.06233978271484375, 0.06689453125, 0.07144927978515625, 0.0760040283203125, 0.08055877685546875, 0.085113525390625, 0.08966827392578125, 0.0942230224609375, 0.09877777099609375, 0.10333251953125, 0.10788726806640625, 0.1124420166015625, 0.11699676513671875, 0.121551513671875, 0.12610626220703125, 0.1306610107421875, 0.13521575927734375, 0.1397705078125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 5.0, 4.0, 4.0, 6.0, 15.0, 20.0, 49.0, 237.0, 1307.0, 15425.0, 582810.0, 434802.0, 12352.0, 1225.0, 180.0, 38.0, 18.0, 6.0, 5.0, 5.0, 8.0, 2.0, 5.0, 8.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.62109375, -4.492584228515625, -4.36407470703125, -4.235565185546875, -4.1070556640625, -3.978546142578125, -3.85003662109375, -3.721527099609375, -3.593017578125, -3.464508056640625, -3.33599853515625, -3.207489013671875, -3.0789794921875, -2.950469970703125, -2.82196044921875, -2.693450927734375, -2.56494140625, -2.436431884765625, -2.30792236328125, -2.179412841796875, -2.0509033203125, -1.922393798828125, -1.79388427734375, -1.665374755859375, -1.536865234375, -1.408355712890625, -1.27984619140625, -1.151336669921875, -1.0228271484375, -0.894317626953125, -0.76580810546875, -0.637298583984375, -0.5087890625, -0.380279541015625, -0.25177001953125, -0.123260498046875, 0.0052490234375, 0.133758544921875, 0.26226806640625, 0.390777587890625, 0.519287109375, 0.647796630859375, 0.77630615234375, 0.904815673828125, 1.0333251953125, 1.161834716796875, 1.29034423828125, 1.418853759765625, 1.54736328125, 1.675872802734375, 1.80438232421875, 1.932891845703125, 2.0614013671875, 2.189910888671875, 2.31842041015625, 2.446929931640625, 2.575439453125, 2.703948974609375, 2.83245849609375, 2.960968017578125, 3.0894775390625, 3.217987060546875, 3.34649658203125, 3.475006103515625, 3.603515625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 4.0, 11.0, 15.0, 16.0, 19.0, 28.0, 26.0, 35.0, 31.0, 48.0, 42.0, 51.0, 42.0, 42.0, 44.0, 53.0, 60.0, 54.0, 54.0, 42.0, 51.0, 42.0, 26.0, 26.0, 22.0, 24.0, 19.0, 11.0, 9.0, 8.0, 6.0, 10.0, 8.0, 7.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.73974609375, -0.7165145874023438, -0.6932830810546875, -0.6700515747070312, -0.646820068359375, -0.6235885620117188, -0.6003570556640625, -0.5771255493164062, -0.55389404296875, -0.5306625366210938, -0.5074310302734375, -0.48419952392578125, -0.460968017578125, -0.43773651123046875, -0.4145050048828125, -0.39127349853515625, -0.3680419921875, -0.34481048583984375, -0.3215789794921875, -0.29834747314453125, -0.275115966796875, -0.25188446044921875, -0.2286529541015625, -0.20542144775390625, -0.18218994140625, -0.15895843505859375, -0.1357269287109375, -0.11249542236328125, -0.089263916015625, -0.06603240966796875, -0.0428009033203125, -0.01956939697265625, 0.003662109375, 0.02689361572265625, 0.0501251220703125, 0.07335662841796875, 0.096588134765625, 0.11981964111328125, 0.1430511474609375, 0.16628265380859375, 0.18951416015625, 0.21274566650390625, 0.2359771728515625, 0.25920867919921875, 0.282440185546875, 0.30567169189453125, 0.3289031982421875, 0.35213470458984375, 0.3753662109375, 0.39859771728515625, 0.4218292236328125, 0.44506072998046875, 0.468292236328125, 0.49152374267578125, 0.5147552490234375, 0.5379867553710938, 0.56121826171875, 0.5844497680664062, 0.6076812744140625, 0.6309127807617188, 0.654144287109375, 0.6773757934570312, 0.7006072998046875, 0.7238388061523438, 0.7470703125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 0.0, 5.0, 4.0, 6.0, 4.0, 14.0, 26.0, 22.0, 43.0, 70.0, 97.0, 161.0, 356.0, 687.0, 1922.0, 7531.0, 76278.0, 932390.0, 22505.0, 4065.0, 1247.0, 489.0, 224.0, 132.0, 92.0, 41.0, 44.0, 29.0, 11.0, 13.0, 10.0, 8.0, 9.0, 4.0, 5.0, 2.0, 1.0, 6.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-10.2578125, -9.98272705078125, -9.7076416015625, -9.43255615234375, -9.157470703125, -8.88238525390625, -8.6072998046875, -8.33221435546875, -8.05712890625, -7.78204345703125, -7.5069580078125, -7.23187255859375, -6.956787109375, -6.68170166015625, -6.4066162109375, -6.13153076171875, -5.8564453125, -5.58135986328125, -5.3062744140625, -5.03118896484375, -4.756103515625, -4.48101806640625, -4.2059326171875, -3.93084716796875, -3.65576171875, -3.38067626953125, -3.1055908203125, -2.83050537109375, -2.555419921875, -2.28033447265625, -2.0052490234375, -1.73016357421875, -1.455078125, -1.17999267578125, -0.9049072265625, -0.62982177734375, -0.354736328125, -0.07965087890625, 0.1954345703125, 0.47052001953125, 0.74560546875, 1.02069091796875, 1.2957763671875, 1.57086181640625, 1.845947265625, 2.12103271484375, 2.3961181640625, 2.67120361328125, 2.9462890625, 3.22137451171875, 3.4964599609375, 3.77154541015625, 4.046630859375, 4.32171630859375, 4.5968017578125, 4.87188720703125, 5.14697265625, 5.42205810546875, 5.6971435546875, 5.97222900390625, 6.247314453125, 6.52239990234375, 6.7974853515625, 7.07257080078125, 7.34765625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 3.0, 4.0, 4.0, 13.0, 6.0, 17.0, 33.0, 27.0, 71.0, 612.0, 91.0, 33.0, 19.0, 23.0, 5.0, 5.0, 5.0, 1.0, 8.0, 4.0, 3.0, 4.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.007350921630859375, -0.007132112979888916, -0.006913304328918457, -0.006694495677947998, -0.006475687026977539, -0.00625687837600708, -0.006038069725036621, -0.005819261074066162, -0.005600452423095703, -0.005381643772125244, -0.005162835121154785, -0.004944026470184326, -0.004725217819213867, -0.004506409168243408, -0.004287600517272949, -0.00406879186630249, -0.0038499832153320312, -0.0036311745643615723, -0.0034123659133911133, -0.0031935572624206543, -0.0029747486114501953, -0.0027559399604797363, -0.0025371313095092773, -0.0023183226585388184, -0.0020995140075683594, -0.0018807053565979004, -0.0016618967056274414, -0.0014430880546569824, -0.0012242794036865234, -0.0010054707527160645, -0.0007866621017456055, -0.0005678534507751465, -0.0003490447998046875, -0.00013023614883422852, 8.857250213623047e-05, 0.00030738115310668945, 0.0005261898040771484, 0.0007449984550476074, 0.0009638071060180664, 0.0011826157569885254, 0.0014014244079589844, 0.0016202330589294434, 0.0018390417098999023, 0.0020578503608703613, 0.0022766590118408203, 0.0024954676628112793, 0.0027142763137817383, 0.0029330849647521973, 0.0031518936157226562, 0.0033707022666931152, 0.0035895109176635742, 0.003808319568634033, 0.004027128219604492, 0.004245936870574951, 0.00446474552154541, 0.004683554172515869, 0.004902362823486328, 0.005121171474456787, 0.005339980125427246, 0.005558788776397705, 0.005777597427368164, 0.005996406078338623, 0.006215214729309082, 0.006434023380279541, 0.00665283203125]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 7.0, 3.0, 7.0, 5.0, 10.0, 15.0, 15.0, 28.0, 51.0, 48.0, 90.0, 121.0, 188.0, 260.0, 409.0, 671.0, 1079.0, 2001.0, 3964.0, 8848.0, 26486.0, 218362.0, 709629.0, 50370.0, 13362.0, 5513.0, 2860.0, 1519.0, 897.0, 572.0, 386.0, 234.0, 171.0, 119.0, 82.0, 49.0, 36.0, 25.0, 21.0, 10.0, 9.0, 7.0, 6.0, 3.0, 7.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.76953125, -3.652496337890625, -3.53546142578125, -3.418426513671875, -3.3013916015625, -3.184356689453125, -3.06732177734375, -2.950286865234375, -2.833251953125, -2.716217041015625, -2.59918212890625, -2.482147216796875, -2.3651123046875, -2.248077392578125, -2.13104248046875, -2.014007568359375, -1.89697265625, -1.779937744140625, -1.66290283203125, -1.545867919921875, -1.4288330078125, -1.311798095703125, -1.19476318359375, -1.077728271484375, -0.960693359375, -0.843658447265625, -0.72662353515625, -0.609588623046875, -0.4925537109375, -0.375518798828125, -0.25848388671875, -0.141448974609375, -0.0244140625, 0.092620849609375, 0.20965576171875, 0.326690673828125, 0.4437255859375, 0.560760498046875, 0.67779541015625, 0.794830322265625, 0.911865234375, 1.028900146484375, 1.14593505859375, 1.262969970703125, 1.3800048828125, 1.497039794921875, 1.61407470703125, 1.731109619140625, 1.84814453125, 1.965179443359375, 2.08221435546875, 2.199249267578125, 2.3162841796875, 2.433319091796875, 2.55035400390625, 2.667388916015625, 2.784423828125, 2.901458740234375, 3.01849365234375, 3.135528564453125, 3.2525634765625, 3.369598388671875, 3.48663330078125, 3.603668212890625, 3.720703125]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 1.0, 5.0, 3.0, 5.0, 4.0, 8.0, 22.0, 16.0, 20.0, 42.0, 97.0, 201.0, 255.0, 155.0, 53.0, 36.0, 19.0, 16.0, 8.0, 3.0, 5.0, 2.0, 7.0, 4.0, 7.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.416015625, -3.313262939453125, -3.21051025390625, -3.107757568359375, -3.0050048828125, -2.902252197265625, -2.79949951171875, -2.696746826171875, -2.593994140625, -2.491241455078125, -2.38848876953125, -2.285736083984375, -2.1829833984375, -2.080230712890625, -1.97747802734375, -1.874725341796875, -1.77197265625, -1.669219970703125, -1.56646728515625, -1.463714599609375, -1.3609619140625, -1.258209228515625, -1.15545654296875, -1.052703857421875, -0.949951171875, -0.847198486328125, -0.74444580078125, -0.641693115234375, -0.5389404296875, -0.436187744140625, -0.33343505859375, -0.230682373046875, -0.1279296875, -0.025177001953125, 0.07757568359375, 0.180328369140625, 0.2830810546875, 0.385833740234375, 0.48858642578125, 0.591339111328125, 0.694091796875, 0.796844482421875, 0.89959716796875, 1.002349853515625, 1.1051025390625, 1.207855224609375, 1.31060791015625, 1.413360595703125, 1.51611328125, 1.618865966796875, 1.72161865234375, 1.824371337890625, 1.9271240234375, 2.029876708984375, 2.13262939453125, 2.235382080078125, 2.338134765625, 2.440887451171875, 2.54364013671875, 2.646392822265625, 2.7491455078125, 2.851898193359375, 2.95465087890625, 3.057403564453125, 3.16015625]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 7.0, 8.0, 9.0, 17.0, 21.0, 42.0, 49.0, 100.0, 131.0, 197.0, 174.0, 119.0, 52.0, 33.0, 14.0, 11.0, 6.0, 1.0, 4.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.085121154785156, -10.601280212402344, -10.117440223693848, -9.633599281311035, -9.149759292602539, -8.665918350219727, -8.182077407836914, -7.698237419128418, -7.214396953582764, -6.730556488037109, -6.246716022491455, -5.762875556945801, -5.279034614562988, -4.795194625854492, -4.31135368347168, -3.8275132179260254, -3.343672752380371, -2.859832286834717, -2.3759918212890625, -1.892151117324829, -1.4083106517791748, -0.9244701862335205, -0.4406294822692871, 0.04321098327636719, 0.5270514488220215, 1.0108919143676758, 1.4947324991226196, 1.9785730838775635, 2.4624135494232178, 2.946254014968872, 3.4300947189331055, 3.9139351844787598, 4.397775650024414, 4.881616115570068, 5.365456581115723, 5.849297523498535, 6.333137512207031, 6.816978454589844, 7.300818920135498, 7.784659385681152, 8.268499374389648, 8.752340316772461, 9.236180305480957, 9.72002124786377, 10.203861236572266, 10.687702178955078, 11.17154312133789, 11.655383110046387, 12.1392240524292, 12.623064994812012, 13.106904983520508, 13.59074592590332, 14.074585914611816, 14.558426856994629, 15.042266845703125, 15.526107788085938, 16.00994873046875, 16.493789672851562, 16.977630615234375, 17.461469650268555, 17.945310592651367, 18.42915153503418, 18.912992477416992, 19.396831512451172, 19.880672454833984]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 3.0, 3.0, 6.0, 7.0, 6.0, 14.0, 22.0, 16.0, 19.0, 33.0, 25.0, 58.0, 53.0, 66.0, 61.0, 77.0, 69.0, 59.0, 77.0, 54.0, 56.0, 45.0, 40.0, 28.0, 28.0, 12.0, 20.0, 8.0, 15.0, 10.0, 6.0, 3.0, 6.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.854835510253906, -8.550444602966309, -8.246052742004395, -7.941661834716797, -7.637270450592041, -7.332879066467285, -7.0284881591796875, -6.724096775054932, -6.419705390930176, -6.11531400680542, -5.810923099517822, -5.506531715393066, -5.2021403312683105, -4.897748947143555, -4.593358039855957, -4.288966655731201, -3.9845757484436035, -3.6801846027374268, -3.375793218612671, -3.071402072906494, -2.7670106887817383, -2.4626195430755615, -2.1582283973693848, -1.853837013244629, -1.5494458675384521, -1.2450546026229858, -0.9406633973121643, -0.6362721920013428, -0.33188092708587646, -0.027489662170410156, 0.2769014835357666, 0.5812928676605225, 0.8856840133666992, 1.1900752782821655, 1.4944665431976318, 1.7988576889038086, 2.1032490730285645, 2.407640218734741, 2.712031364440918, 3.016422748565674, 3.3208138942718506, 3.6252050399780273, 3.929596424102783, 4.233987808227539, 4.538378715515137, 4.842770099639893, 5.147161483764648, 5.451552391052246, 5.755943775177002, 6.060335159301758, 6.3647260665893555, 6.669117450714111, 6.973508834838867, 7.277899742126465, 7.582291126251221, 7.886682510375977, 8.191073417663574, 8.495464324951172, 8.799856185913086, 9.104247093200684, 9.408638000488281, 9.713029861450195, 10.017420768737793, 10.32181167602539, 10.626203536987305]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 0.0, 0.0, 2.0, 4.0, 8.0, 4.0, 11.0, 7.0, 20.0, 35.0, 45.0, 123.0, 318.0, 1124.0, 6287.0, 94036.0, 4033597.0, 52352.0, 4635.0, 843.0, 288.0, 141.0, 91.0, 64.0, 62.0, 42.0, 26.0, 23.0, 17.0, 22.0, 13.0, 13.0, 8.0, 4.0, 4.0, 7.0, 3.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.859375, -10.552734375, -10.24609375, -9.939453125, -9.6328125, -9.326171875, -9.01953125, -8.712890625, -8.40625, -8.099609375, -7.79296875, -7.486328125, -7.1796875, -6.873046875, -6.56640625, -6.259765625, -5.953125, -5.646484375, -5.33984375, -5.033203125, -4.7265625, -4.419921875, -4.11328125, -3.806640625, -3.5, -3.193359375, -2.88671875, -2.580078125, -2.2734375, -1.966796875, -1.66015625, -1.353515625, -1.046875, -0.740234375, -0.43359375, -0.126953125, 0.1796875, 0.486328125, 0.79296875, 1.099609375, 1.40625, 1.712890625, 2.01953125, 2.326171875, 2.6328125, 2.939453125, 3.24609375, 3.552734375, 3.859375, 4.166015625, 4.47265625, 4.779296875, 5.0859375, 5.392578125, 5.69921875, 6.005859375, 6.3125, 6.619140625, 6.92578125, 7.232421875, 7.5390625, 7.845703125, 8.15234375, 8.458984375, 8.765625]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 5.0, 6.0, 8.0, 14.0, 26.0, 51.0, 60.0, 65.0, 115.0, 142.0, 140.0, 109.0, 77.0, 57.0, 56.0, 31.0, 19.0, 11.0, 6.0, 5.0, 0.0, 2.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1734619140625, -0.16483497619628906, -0.15620803833007812, -0.1475811004638672, -0.13895416259765625, -0.1303272247314453, -0.12170028686523438, -0.11307334899902344, -0.1044464111328125, -0.09581947326660156, -0.08719253540039062, -0.07856559753417969, -0.06993865966796875, -0.06131172180175781, -0.052684783935546875, -0.04405784606933594, -0.035430908203125, -0.026803970336914062, -0.018177032470703125, -0.009550094604492188, -0.00092315673828125, 0.0077037811279296875, 0.016330718994140625, 0.024957656860351562, 0.0335845947265625, 0.04221153259277344, 0.050838470458984375, 0.05946540832519531, 0.06809234619140625, 0.07671928405761719, 0.08534622192382812, 0.09397315979003906, 0.10260009765625, 0.11122703552246094, 0.11985397338867188, 0.1284809112548828, 0.13710784912109375, 0.1457347869873047, 0.15436172485351562, 0.16298866271972656, 0.1716156005859375, 0.18024253845214844, 0.18886947631835938, 0.1974964141845703, 0.20612335205078125, 0.2147502899169922, 0.22337722778320312, 0.23200416564941406, 0.240631103515625, 0.24925804138183594, 0.2578849792480469, 0.2665119171142578, 0.27513885498046875, 0.2837657928466797, 0.2923927307128906, 0.30101966857910156, 0.3096466064453125, 0.31827354431152344, 0.3269004821777344, 0.3355274200439453, 0.34415435791015625, 0.3527812957763672, 0.3614082336425781, 0.37003517150878906, 0.378662109375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 9.0, 14.0, 19.0, 58.0, 199.0, 1197.0, 31803.0, 4136097.0, 23473.0, 1102.0, 207.0, 49.0, 33.0, 17.0, 8.0, 5.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.98828125, -4.51190185546875, -4.0355224609375, -3.55914306640625, -3.082763671875, -2.60638427734375, -2.1300048828125, -1.65362548828125, -1.17724609375, -0.70086669921875, -0.2244873046875, 0.25189208984375, 0.728271484375, 1.20465087890625, 1.6810302734375, 2.15740966796875, 2.6337890625, 3.11016845703125, 3.5865478515625, 4.06292724609375, 4.539306640625, 5.01568603515625, 5.4920654296875, 5.96844482421875, 6.44482421875, 6.92120361328125, 7.3975830078125, 7.87396240234375, 8.350341796875, 8.82672119140625, 9.3031005859375, 9.77947998046875, 10.255859375, 10.73223876953125, 11.2086181640625, 11.68499755859375, 12.161376953125, 12.63775634765625, 13.1141357421875, 13.59051513671875, 14.06689453125, 14.54327392578125, 15.0196533203125, 15.49603271484375, 15.972412109375, 16.44879150390625, 16.9251708984375, 17.40155029296875, 17.8779296875, 18.35430908203125, 18.8306884765625, 19.30706787109375, 19.783447265625, 20.25982666015625, 20.7362060546875, 21.21258544921875, 21.68896484375, 22.16534423828125, 22.6417236328125, 23.11810302734375, 23.594482421875, 24.07086181640625, 24.5472412109375, 25.02362060546875, 25.5]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 8.0, 5.0, 6.0, 9.0, 11.0, 21.0, 22.0, 46.0, 60.0, 77.0, 115.0, 176.0, 512.0, 1828.0, 619.0, 251.0, 117.0, 72.0, 40.0, 25.0, 23.0, 8.0, 7.0, 7.0, 2.0, 7.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.6298828125, -0.6111068725585938, -0.5923309326171875, -0.5735549926757812, -0.554779052734375, -0.5360031127929688, -0.5172271728515625, -0.49845123291015625, -0.47967529296875, -0.46089935302734375, -0.4421234130859375, -0.42334747314453125, -0.404571533203125, -0.38579559326171875, -0.3670196533203125, -0.34824371337890625, -0.3294677734375, -0.31069183349609375, -0.2919158935546875, -0.27313995361328125, -0.254364013671875, -0.23558807373046875, -0.2168121337890625, -0.19803619384765625, -0.17926025390625, -0.16048431396484375, -0.1417083740234375, -0.12293243408203125, -0.104156494140625, -0.08538055419921875, -0.0666046142578125, -0.04782867431640625, -0.029052734375, -0.01027679443359375, 0.0084991455078125, 0.02727508544921875, 0.046051025390625, 0.06482696533203125, 0.0836029052734375, 0.10237884521484375, 0.12115478515625, 0.13993072509765625, 0.1587066650390625, 0.17748260498046875, 0.196258544921875, 0.21503448486328125, 0.2338104248046875, 0.25258636474609375, 0.2713623046875, 0.29013824462890625, 0.3089141845703125, 0.32769012451171875, 0.346466064453125, 0.36524200439453125, 0.3840179443359375, 0.40279388427734375, 0.42156982421875, 0.44034576416015625, 0.4591217041015625, 0.47789764404296875, 0.496673583984375, 0.5154495239257812, 0.5342254638671875, 0.5530014038085938, 0.57177734375]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 39.0, 769.0, 203.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.06014633178711, -18.78954315185547, -17.51894187927246, -16.248340606689453, -14.977737426757812, -13.707135200500488, -12.436532974243164, -11.16593074798584, -9.895328521728516, -8.624726295471191, -7.354124069213867, -6.083521842956543, -4.812919616699219, -3.5423173904418945, -2.2717151641845703, -1.001112937927246, 0.2694892883300781, 1.5400915145874023, 2.8106937408447266, 4.081295967102051, 5.351898193359375, 6.622500419616699, 7.893102645874023, 9.163704872131348, 10.434307098388672, 11.704909324645996, 12.97551155090332, 14.246113777160645, 15.516716003417969, 16.78731918334961, 18.057920455932617, 19.328521728515625, 20.59912109375, 21.86972427368164, 23.14032554626465, 24.410926818847656, 25.681529998779297, 26.952133178710938, 28.222734451293945, 29.493335723876953, 30.763938903808594, 32.034542083740234, 33.305145263671875, 34.57574462890625, 35.84634780883789, 37.11695098876953, 38.387550354003906, 39.65815353393555, 40.92875671386719, 42.19935989379883, 43.46996307373047, 44.740562438964844, 46.011165618896484, 47.281768798828125, 48.5523681640625, 49.82297134399414, 51.09357452392578, 52.36417770385742, 53.63478088378906, 54.90538024902344, 56.17598342895508, 57.44658660888672, 58.717185974121094, 59.987789154052734, 61.258392333984375]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 13.0, 24.0, 46.0, 81.0, 130.0, 155.0, 183.0, 167.0, 99.0, 55.0, 30.0, 16.0, 9.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.331378936767578, -5.059208393096924, -4.787037372589111, -4.514866828918457, -4.242696285247803, -3.9705255031585693, -3.698354721069336, -3.4261841773986816, -3.1540133953094482, -2.881842613220215, -2.6096720695495605, -2.337501287460327, -2.0653305053710938, -1.7931599617004395, -1.520989179611206, -1.2488185167312622, -0.9766478538513184, -0.7044771909713745, -0.4323064684867859, -0.16013574600219727, 0.11203491687774658, 0.38420557975769043, 0.6563763618469238, 0.9285470247268677, 1.2007176876068115, 1.4728883504867554, 1.7450590133666992, 2.0172297954559326, 2.289400577545166, 2.5615711212158203, 2.8337419033050537, 3.105912685394287, 3.3780832290649414, 3.650254011154175, 3.922424554824829, 4.1945953369140625, 4.466765880584717, 4.738936424255371, 5.011107444763184, 5.283277988433838, 5.555448532104492, 5.8276190757751465, 6.099790096282959, 6.371960639953613, 6.644131183624268, 6.916301727294922, 7.188472747802734, 7.460643291473389, 7.732814311981201, 8.004984855651855, 8.277155876159668, 8.549325942993164, 8.821496963500977, 9.093667984008789, 9.365839004516602, 9.638009071350098, 9.91018009185791, 10.182351112365723, 10.454521179199219, 10.726692199707031, 10.998863220214844, 11.27103328704834, 11.543204307556152, 11.815375328063965, 12.087545394897461]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 9.0, 4.0, 5.0, 9.0, 9.0, 15.0, 23.0, 10.0, 28.0, 22.0, 37.0, 34.0, 35.0, 38.0, 45.0, 46.0, 72.0, 269397.0, 778250.0, 78.0, 53.0, 55.0, 41.0, 43.0, 35.0, 27.0, 27.0, 23.0, 16.0, 20.0, 16.0, 7.0, 3.0, 6.0, 6.0, 3.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.484375, -19.779296875, -19.07421875, -18.369140625, -17.6640625, -16.958984375, -16.25390625, -15.548828125, -14.84375, -14.138671875, -13.43359375, -12.728515625, -12.0234375, -11.318359375, -10.61328125, -9.908203125, -9.203125, -8.498046875, -7.79296875, -7.087890625, -6.3828125, -5.677734375, -4.97265625, -4.267578125, -3.5625, -2.857421875, -2.15234375, -1.447265625, -0.7421875, -0.037109375, 0.66796875, 1.373046875, 2.078125, 2.783203125, 3.48828125, 4.193359375, 4.8984375, 5.603515625, 6.30859375, 7.013671875, 7.71875, 8.423828125, 9.12890625, 9.833984375, 10.5390625, 11.244140625, 11.94921875, 12.654296875, 13.359375, 14.064453125, 14.76953125, 15.474609375, 16.1796875, 16.884765625, 17.58984375, 18.294921875, 19.0, 19.705078125, 20.41015625, 21.115234375, 21.8203125, 22.525390625, 23.23046875, 23.935546875, 24.640625]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 9.0, 93.0, 478.0, 380.0, 57.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1953125, -0.14593505859375, -0.0965576171875, -0.04718017578125, 0.002197265625, 0.05157470703125, 0.1009521484375, 0.15032958984375, 0.19970703125, 0.24908447265625, 0.2984619140625, 0.34783935546875, 0.397216796875, 0.44659423828125, 0.4959716796875, 0.54534912109375, 0.5947265625, 0.64410400390625, 0.6934814453125, 0.74285888671875, 0.792236328125, 0.84161376953125, 0.8909912109375, 0.94036865234375, 0.98974609375, 1.03912353515625, 1.0885009765625, 1.13787841796875, 1.187255859375, 1.23663330078125, 1.2860107421875, 1.33538818359375, 1.384765625, 1.43414306640625, 1.4835205078125, 1.53289794921875, 1.582275390625, 1.63165283203125, 1.6810302734375, 1.73040771484375, 1.77978515625, 1.82916259765625, 1.8785400390625, 1.92791748046875, 1.977294921875, 2.02667236328125, 2.0760498046875, 2.12542724609375, 2.1748046875, 2.22418212890625, 2.2735595703125, 2.32293701171875, 2.372314453125, 2.42169189453125, 2.4710693359375, 2.52044677734375, 2.56982421875, 2.61920166015625, 2.6685791015625, 2.71795654296875, 2.767333984375, 2.81671142578125, 2.8660888671875, 2.91546630859375, 2.96484375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 5.0, 7.0, 9.0, 11.0, 14.0, 20.0, 26.0, 29.0, 41.0, 59.0, 97.0, 141.0, 176.0, 296.0, 437.0, 791.0, 1397.0, 2501.0, 5063.0, 11173.0, 28137.0, 85344.0, 302247.0, 411009.0, 130131.0, 40206.0, 15049.0, 6621.0, 3196.0, 1710.0, 989.0, 556.0, 369.0, 208.0, 164.0, 99.0, 60.0, 57.0, 33.0, 27.0, 15.0, 15.0, 7.0, 5.0, 4.0, 1.0, 4.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.94140625, -2.840576171875, -2.73974609375, -2.638916015625, -2.5380859375, -2.437255859375, -2.33642578125, -2.235595703125, -2.134765625, -2.033935546875, -1.93310546875, -1.832275390625, -1.7314453125, -1.630615234375, -1.52978515625, -1.428955078125, -1.328125, -1.227294921875, -1.12646484375, -1.025634765625, -0.9248046875, -0.823974609375, -0.72314453125, -0.622314453125, -0.521484375, -0.420654296875, -0.31982421875, -0.218994140625, -0.1181640625, -0.017333984375, 0.08349609375, 0.184326171875, 0.28515625, 0.385986328125, 0.48681640625, 0.587646484375, 0.6884765625, 0.789306640625, 0.89013671875, 0.990966796875, 1.091796875, 1.192626953125, 1.29345703125, 1.394287109375, 1.4951171875, 1.595947265625, 1.69677734375, 1.797607421875, 1.8984375, 1.999267578125, 2.10009765625, 2.200927734375, 2.3017578125, 2.402587890625, 2.50341796875, 2.604248046875, 2.705078125, 2.805908203125, 2.90673828125, 3.007568359375, 3.1083984375, 3.209228515625, 3.31005859375, 3.410888671875, 3.51171875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 1.0, 9.0, 3.0, 8.0, 6.0, 10.0, 23.0, 31.0, 18.0, 23.0, 35.0, 39.0, 46.0, 41.0, 37.0, 57.0, 62.0, 52.0, 53.0, 52.0, 41.0, 49.0, 47.0, 40.0, 39.0, 26.0, 22.0, 27.0, 16.0, 12.0, 13.0, 11.0, 11.0, 9.0, 4.0, 7.0, 8.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.1171875, -2.051116943359375, -1.98504638671875, -1.918975830078125, -1.8529052734375, -1.786834716796875, -1.72076416015625, -1.654693603515625, -1.588623046875, -1.522552490234375, -1.45648193359375, -1.390411376953125, -1.3243408203125, -1.258270263671875, -1.19219970703125, -1.126129150390625, -1.06005859375, -0.993988037109375, -0.92791748046875, -0.861846923828125, -0.7957763671875, -0.729705810546875, -0.66363525390625, -0.597564697265625, -0.531494140625, -0.465423583984375, -0.39935302734375, -0.333282470703125, -0.2672119140625, -0.201141357421875, -0.13507080078125, -0.069000244140625, -0.0029296875, 0.063140869140625, 0.12921142578125, 0.195281982421875, 0.2613525390625, 0.327423095703125, 0.39349365234375, 0.459564208984375, 0.525634765625, 0.591705322265625, 0.65777587890625, 0.723846435546875, 0.7899169921875, 0.855987548828125, 0.92205810546875, 0.988128662109375, 1.05419921875, 1.120269775390625, 1.18634033203125, 1.252410888671875, 1.3184814453125, 1.384552001953125, 1.45062255859375, 1.516693115234375, 1.582763671875, 1.648834228515625, 1.71490478515625, 1.780975341796875, 1.8470458984375, 1.913116455078125, 1.97918701171875, 2.045257568359375, 2.111328125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 8.0, 11.0, 19.0, 23.0, 42.0, 88.0, 158.0, 372.0, 885.0, 2772.0, 11359.0, 73242.0, 591982.0, 322738.0, 35401.0, 6556.0, 1714.0, 635.0, 276.0, 123.0, 64.0, 29.0, 22.0, 14.0, 6.0, 6.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.16796875, -4.0125732421875, -3.857177734375, -3.7017822265625, -3.54638671875, -3.3909912109375, -3.235595703125, -3.0802001953125, -2.9248046875, -2.7694091796875, -2.614013671875, -2.4586181640625, -2.30322265625, -2.1478271484375, -1.992431640625, -1.8370361328125, -1.681640625, -1.5262451171875, -1.370849609375, -1.2154541015625, -1.06005859375, -0.9046630859375, -0.749267578125, -0.5938720703125, -0.4384765625, -0.2830810546875, -0.127685546875, 0.0277099609375, 0.18310546875, 0.3385009765625, 0.493896484375, 0.6492919921875, 0.8046875, 0.9600830078125, 1.115478515625, 1.2708740234375, 1.42626953125, 1.5816650390625, 1.737060546875, 1.8924560546875, 2.0478515625, 2.2032470703125, 2.358642578125, 2.5140380859375, 2.66943359375, 2.8248291015625, 2.980224609375, 3.1356201171875, 3.291015625, 3.4464111328125, 3.601806640625, 3.7572021484375, 3.91259765625, 4.0679931640625, 4.223388671875, 4.3787841796875, 4.5341796875, 4.6895751953125, 4.844970703125, 5.0003662109375, 5.15576171875, 5.3111572265625, 5.466552734375, 5.6219482421875, 5.77734375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 5.0, 6.0, 8.0, 7.0, 12.0, 10.0, 15.0, 23.0, 19.0, 28.0, 38.0, 42.0, 33.0, 69.0, 80.0, 64.0, 77.0, 70.0, 74.0, 63.0, 59.0, 49.0, 26.0, 29.0, 22.0, 17.0, 9.0, 16.0, 10.0, 7.0, 3.0, 5.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004260540008544922, -0.00041205063462257385, -0.0003980472683906555, -0.0003840439021587372, -0.00037004053592681885, -0.0003560371696949005, -0.0003420338034629822, -0.00032803043723106384, -0.0003140270709991455, -0.00030002370476722717, -0.00028602033853530884, -0.0002720169723033905, -0.00025801360607147217, -0.00024401023983955383, -0.0002300068736076355, -0.00021600350737571716, -0.00020200014114379883, -0.0001879967749118805, -0.00017399340867996216, -0.00015999004244804382, -0.0001459866762161255, -0.00013198330998420715, -0.00011797994375228882, -0.00010397657752037048, -8.997321128845215e-05, -7.596984505653381e-05, -6.196647882461548e-05, -4.7963112592697144e-05, -3.395974636077881e-05, -1.9956380128860474e-05, -5.953013896942139e-06, 8.050352334976196e-06, 2.205371856689453e-05, 3.6057084798812866e-05, 5.00604510307312e-05, 6.406381726264954e-05, 7.806718349456787e-05, 9.20705497264862e-05, 0.00010607391595840454, 0.00012007728219032288, 0.0001340806484222412, 0.00014808401465415955, 0.00016208738088607788, 0.00017609074711799622, 0.00019009411334991455, 0.00020409747958183289, 0.00021810084581375122, 0.00023210421204566956, 0.0002461075782775879, 0.0002601109445095062, 0.00027411431074142456, 0.0002881176769733429, 0.00030212104320526123, 0.00031612440943717957, 0.0003301277756690979, 0.00034413114190101624, 0.00035813450813293457, 0.0003721378743648529, 0.00038614124059677124, 0.0004001446068286896, 0.0004141479730606079, 0.00042815133929252625, 0.0004421547055244446, 0.0004561580717563629, 0.00047016143798828125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 2.0, 10.0, 11.0, 23.0, 27.0, 43.0, 55.0, 134.0, 252.0, 605.0, 1580.0, 5717.0, 29822.0, 296799.0, 628960.0, 70099.0, 10395.0, 2470.0, 818.0, 341.0, 151.0, 74.0, 62.0, 31.0, 19.0, 26.0, 7.0, 3.0, 6.0, 5.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.3984375, -5.23583984375, -5.0732421875, -4.91064453125, -4.748046875, -4.58544921875, -4.4228515625, -4.26025390625, -4.09765625, -3.93505859375, -3.7724609375, -3.60986328125, -3.447265625, -3.28466796875, -3.1220703125, -2.95947265625, -2.796875, -2.63427734375, -2.4716796875, -2.30908203125, -2.146484375, -1.98388671875, -1.8212890625, -1.65869140625, -1.49609375, -1.33349609375, -1.1708984375, -1.00830078125, -0.845703125, -0.68310546875, -0.5205078125, -0.35791015625, -0.1953125, -0.03271484375, 0.1298828125, 0.29248046875, 0.455078125, 0.61767578125, 0.7802734375, 0.94287109375, 1.10546875, 1.26806640625, 1.4306640625, 1.59326171875, 1.755859375, 1.91845703125, 2.0810546875, 2.24365234375, 2.40625, 2.56884765625, 2.7314453125, 2.89404296875, 3.056640625, 3.21923828125, 3.3818359375, 3.54443359375, 3.70703125, 3.86962890625, 4.0322265625, 4.19482421875, 4.357421875, 4.52001953125, 4.6826171875, 4.84521484375, 5.0078125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 7.0, 6.0, 3.0, 9.0, 5.0, 16.0, 22.0, 24.0, 41.0, 67.0, 74.0, 115.0, 123.0, 133.0, 86.0, 73.0, 58.0, 58.0, 26.0, 23.0, 14.0, 13.0, 6.0, 6.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7294921875, -1.6573028564453125, -1.585113525390625, -1.5129241943359375, -1.44073486328125, -1.3685455322265625, -1.296356201171875, -1.2241668701171875, -1.1519775390625, -1.0797882080078125, -1.007598876953125, -0.9354095458984375, -0.86322021484375, -0.7910308837890625, -0.718841552734375, -0.6466522216796875, -0.574462890625, -0.5022735595703125, -0.430084228515625, -0.3578948974609375, -0.28570556640625, -0.2135162353515625, -0.141326904296875, -0.0691375732421875, 0.0030517578125, 0.0752410888671875, 0.147430419921875, 0.2196197509765625, 0.29180908203125, 0.3639984130859375, 0.436187744140625, 0.5083770751953125, 0.58056640625, 0.6527557373046875, 0.724945068359375, 0.7971343994140625, 0.86932373046875, 0.9415130615234375, 1.013702392578125, 1.0858917236328125, 1.1580810546875, 1.2302703857421875, 1.302459716796875, 1.3746490478515625, 1.44683837890625, 1.5190277099609375, 1.591217041015625, 1.6634063720703125, 1.735595703125, 1.8077850341796875, 1.879974365234375, 1.9521636962890625, 2.02435302734375, 2.0965423583984375, 2.168731689453125, 2.2409210205078125, 2.3131103515625, 2.3852996826171875, 2.457489013671875, 2.5296783447265625, 2.60186767578125, 2.6740570068359375, 2.746246337890625, 2.8184356689453125, 2.890625]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 5.0, 4.0, 6.0, 11.0, 27.0, 46.0, 142.0, 228.0, 247.0, 159.0, 72.0, 29.0, 14.0, 5.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.5557746887207, -41.495723724365234, -40.435672760009766, -39.3756217956543, -38.31557083129883, -37.25551986694336, -36.19546890258789, -35.13542175292969, -34.07537078857422, -33.01531982421875, -31.95526885986328, -30.895217895507812, -29.835166931152344, -28.775115966796875, -27.71506690979004, -26.65501594543457, -25.59496307373047, -24.534912109375, -23.47486114501953, -22.414810180664062, -21.354759216308594, -20.294708251953125, -19.23465919494629, -18.17460823059082, -17.11455726623535, -16.054506301879883, -14.994455337524414, -13.934405326843262, -12.874354362487793, -11.814303398132324, -10.754253387451172, -9.694202423095703, -8.634153366088867, -7.574102401733398, -6.514051914215088, -5.454001426696777, -4.393950462341309, -3.33389949798584, -2.2738490104675293, -1.2137985229492188, -0.15374755859375, 0.9063031673431396, 1.9663538932800293, 3.026404619216919, 4.086455345153809, 5.146506309509277, 6.206556797027588, 7.266607284545898, 8.326658248901367, 9.386709213256836, 10.446760177612305, 11.506810188293457, 12.566861152648926, 13.626912117004395, 14.686962127685547, 15.747013092041016, 16.807064056396484, 17.867115020751953, 18.927165985107422, 19.98721694946289, 21.04726791381836, 22.107318878173828, 23.167367935180664, 24.227418899536133, 25.2874698638916]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 0.0, 4.0, 5.0, 11.0, 18.0, 14.0, 17.0, 20.0, 21.0, 27.0, 25.0, 20.0, 31.0, 52.0, 40.0, 48.0, 52.0, 53.0, 50.0, 40.0, 49.0, 41.0, 35.0, 44.0, 44.0, 36.0, 37.0, 22.0, 24.0, 20.0, 18.0, 19.0, 12.0, 13.0, 6.0, 7.0, 6.0, 5.0, 7.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.683039665222168, -12.284528732299805, -11.886016845703125, -11.487505912780762, -11.088994979858398, -10.690483093261719, -10.291972160339355, -9.893461227416992, -9.494949340820312, -9.09643840789795, -8.69792652130127, -8.299415588378906, -7.900904178619385, -7.502392768859863, -7.1038818359375, -6.7053704261779785, -6.306859016418457, -5.9083476066589355, -5.509836196899414, -5.111325263977051, -4.712813854217529, -4.314302444458008, -3.9157912731170654, -3.517280101776123, -3.1187686920166016, -2.72025728225708, -2.3217461109161377, -1.9232348203659058, -1.5247235298156738, -1.126212239265442, -0.72770094871521, -0.3291897773742676, 0.0693206787109375, 0.46783196926116943, 0.8663432598114014, 1.2648545503616333, 1.6633658409118652, 2.0618772506713867, 2.460388422012329, 2.8588995933532715, 3.257411003112793, 3.6559224128723145, 4.054433822631836, 4.452944755554199, 4.851456165313721, 5.249967575073242, 5.6484785079956055, 6.046989917755127, 6.445501327514648, 6.84401273727417, 7.242524147033691, 7.641035079956055, 8.039546966552734, 8.438057899475098, 8.836568832397461, 9.23508071899414, 9.633591651916504, 10.032102584838867, 10.430614471435547, 10.82912540435791, 11.227636337280273, 11.626148223876953, 12.024659156799316, 12.42317008972168, 12.82168197631836]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 4.0, 4.0, 19.0, 90.0, 399.0, 4024666.0, 168078.0, 475.0, 222.0, 115.0, 78.0, 52.0, 33.0, 26.0, 19.0, 10.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.0546875, -12.0294189453125, -10.004150390625, -7.9788818359375, -5.95361328125, -3.9283447265625, -1.903076171875, 0.1221923828125, 2.1474609375, 4.1727294921875, 6.197998046875, 8.2232666015625, 10.24853515625, 12.2738037109375, 14.299072265625, 16.3243408203125, 18.349609375, 20.3748779296875, 22.400146484375, 24.4254150390625, 26.45068359375, 28.4759521484375, 30.501220703125, 32.5264892578125, 34.5517578125, 36.5770263671875, 38.602294921875, 40.6275634765625, 42.65283203125, 44.6781005859375, 46.703369140625, 48.7286376953125, 50.75390625, 52.7791748046875, 54.804443359375, 56.8297119140625, 58.85498046875, 60.8802490234375, 62.905517578125, 64.9307861328125, 66.9560546875, 68.9813232421875, 71.006591796875, 73.0318603515625, 75.05712890625, 77.0823974609375, 79.107666015625, 81.1329345703125, 83.158203125, 85.1834716796875, 87.208740234375, 89.2340087890625, 91.25927734375, 93.2845458984375, 95.309814453125, 97.3350830078125, 99.3603515625, 101.3856201171875, 103.410888671875, 105.4361572265625, 107.46142578125, 109.4866943359375, 111.511962890625, 113.5372314453125, 115.5625]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 15.0, 76.0, 164.0, 295.0, 258.0, 145.0, 49.0, 9.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42431640625, -0.37062835693359375, -0.3169403076171875, -0.26325225830078125, -0.209564208984375, -0.15587615966796875, -0.1021881103515625, -0.04850006103515625, 0.00518798828125, 0.05887603759765625, 0.1125640869140625, 0.16625213623046875, 0.219940185546875, 0.27362823486328125, 0.3273162841796875, 0.38100433349609375, 0.4346923828125, 0.48838043212890625, 0.5420684814453125, 0.5957565307617188, 0.649444580078125, 0.7031326293945312, 0.7568206787109375, 0.8105087280273438, 0.86419677734375, 0.9178848266601562, 0.9715728759765625, 1.0252609252929688, 1.078948974609375, 1.1326370239257812, 1.1863250732421875, 1.2400131225585938, 1.293701171875, 1.3473892211914062, 1.4010772705078125, 1.4547653198242188, 1.508453369140625, 1.5621414184570312, 1.6158294677734375, 1.6695175170898438, 1.72320556640625, 1.7768936157226562, 1.8305816650390625, 1.8842697143554688, 1.937957763671875, 1.9916458129882812, 2.0453338623046875, 2.0990219116210938, 2.1527099609375, 2.2063980102539062, 2.2600860595703125, 2.3137741088867188, 2.367462158203125, 2.4211502075195312, 2.4748382568359375, 2.5285263061523438, 2.58221435546875, 2.6359024047851562, 2.6895904541015625, 2.7432785034179688, 2.796966552734375, 2.8506546020507812, 2.9043426513671875, 2.9580307006835938, 3.01171875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 4.0, 9.0, 18.0, 33.0, 63.0, 103.0, 241.0, 759.0, 3770.0, 142774.0, 4034569.0, 9899.0, 1283.0, 406.0, 156.0, 97.0, 55.0, 35.0, 9.0, 6.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.6328125, -10.7528076171875, -9.872802734375, -8.9927978515625, -8.11279296875, -7.2327880859375, -6.352783203125, -5.4727783203125, -4.5927734375, -3.7127685546875, -2.832763671875, -1.9527587890625, -1.07275390625, -0.1927490234375, 0.687255859375, 1.5672607421875, 2.447265625, 3.3272705078125, 4.207275390625, 5.0872802734375, 5.96728515625, 6.8472900390625, 7.727294921875, 8.6072998046875, 9.4873046875, 10.3673095703125, 11.247314453125, 12.1273193359375, 13.00732421875, 13.8873291015625, 14.767333984375, 15.6473388671875, 16.52734375, 17.4073486328125, 18.287353515625, 19.1673583984375, 20.04736328125, 20.9273681640625, 21.807373046875, 22.6873779296875, 23.5673828125, 24.4473876953125, 25.327392578125, 26.2073974609375, 27.08740234375, 27.9674072265625, 28.847412109375, 29.7274169921875, 30.607421875, 31.4874267578125, 32.367431640625, 33.2474365234375, 34.12744140625, 35.0074462890625, 35.887451171875, 36.7674560546875, 37.6474609375, 38.5274658203125, 39.407470703125, 40.2874755859375, 41.16748046875, 42.0474853515625, 42.927490234375, 43.8074951171875, 44.6875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 8.0, 8.0, 24.0, 37.0, 75.0, 193.0, 967.0, 2374.0, 261.0, 80.0, 26.0, 13.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.806640625, -2.70330810546875, -2.5999755859375, -2.49664306640625, -2.393310546875, -2.28997802734375, -2.1866455078125, -2.08331298828125, -1.97998046875, -1.87664794921875, -1.7733154296875, -1.66998291015625, -1.566650390625, -1.46331787109375, -1.3599853515625, -1.25665283203125, -1.1533203125, -1.04998779296875, -0.9466552734375, -0.84332275390625, -0.739990234375, -0.63665771484375, -0.5333251953125, -0.42999267578125, -0.32666015625, -0.22332763671875, -0.1199951171875, -0.01666259765625, 0.086669921875, 0.19000244140625, 0.2933349609375, 0.39666748046875, 0.5, 0.60333251953125, 0.7066650390625, 0.80999755859375, 0.913330078125, 1.01666259765625, 1.1199951171875, 1.22332763671875, 1.32666015625, 1.42999267578125, 1.5333251953125, 1.63665771484375, 1.739990234375, 1.84332275390625, 1.9466552734375, 2.04998779296875, 2.1533203125, 2.25665283203125, 2.3599853515625, 2.46331787109375, 2.566650390625, 2.66998291015625, 2.7733154296875, 2.87664794921875, 2.97998046875, 3.08331298828125, 3.1866455078125, 3.28997802734375, 3.393310546875, 3.49664306640625, 3.5999755859375, 3.70330810546875, 3.806640625]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 7.0, 10.0, 48.0, 233.0, 540.0, 125.0, 35.0, 6.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.085010528564453, -29.754823684692383, -28.424636840820312, -27.09444808959961, -25.76426124572754, -24.43407440185547, -23.1038875579834, -21.773700714111328, -20.443511962890625, -19.113325119018555, -17.783138275146484, -16.45294952392578, -15.122762680053711, -13.79257583618164, -12.46238899230957, -11.132201194763184, -9.80201530456543, -8.47182846069336, -7.141640663146973, -5.811453819274902, -4.481266498565674, -3.1510791778564453, -1.820892333984375, -0.4907045364379883, 0.839482307434082, 2.1696696281433105, 3.49985671043396, 4.830043792724609, 6.160231113433838, 7.490418434143066, 8.820605278015137, 10.150793075561523, 11.480979919433594, 12.811166763305664, 14.14135456085205, 15.471541404724121, 16.801729202270508, 18.131916046142578, 19.46210289001465, 20.79228973388672, 22.122478485107422, 23.452665328979492, 24.782852172851562, 26.113040924072266, 27.443227767944336, 28.773414611816406, 30.103601455688477, 31.433788299560547, 32.76397705078125, 34.09416580200195, 35.42435073852539, 36.754539489746094, 38.08472442626953, 39.414913177490234, 40.74510192871094, 42.075286865234375, 43.40547180175781, 44.735660552978516, 46.06584548950195, 47.396034240722656, 48.726219177246094, 50.0564079284668, 51.3865966796875, 52.71678161621094, 54.04697036743164]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 7.0, 10.0, 17.0, 23.0, 44.0, 54.0, 96.0, 95.0, 124.0, 119.0, 108.0, 92.0, 79.0, 54.0, 39.0, 22.0, 10.0, 9.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.95156478881836, -17.43938636779785, -16.927207946777344, -16.415029525756836, -15.902850151062012, -15.390671730041504, -14.87849235534668, -14.366313934326172, -13.854135513305664, -13.341957092285156, -12.829778671264648, -12.317599296569824, -11.805420875549316, -11.293242454528809, -10.781063079833984, -10.268884658813477, -9.756706237792969, -9.244527816772461, -8.732349395751953, -8.220170021057129, -7.707991600036621, -7.195813179016113, -6.683634281158447, -6.171455383300781, -5.659276962280273, -5.147098541259766, -4.6349196434021, -4.122740745544434, -3.610562324523926, -3.098383665084839, -2.586205005645752, -2.074026346206665, -1.561849594116211, -1.049670934677124, -0.5374922752380371, -0.025313615798950195, 0.4868650436401367, 0.9990437030792236, 1.5112223625183105, 2.0234010219573975, 2.5355796813964844, 3.0477583408355713, 3.559937000274658, 4.072115898132324, 4.584294319152832, 5.09647274017334, 5.608651638031006, 6.120830535888672, 6.63300895690918, 7.1451873779296875, 7.6573662757873535, 8.16954517364502, 8.681723594665527, 9.193902015686035, 9.70608139038086, 10.218259811401367, 10.730438232421875, 11.242616653442383, 11.75479507446289, 12.266974449157715, 12.779152870178223, 13.29133129119873, 13.803510665893555, 14.315689086914062, 14.82786750793457]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 3.0, 1.0, 3.0, 3.0, 7.0, 6.0, 10.0, 8.0, 12.0, 11.0, 10.0, 26.0, 28.0, 27.0, 31.0, 38.0, 56.0, 65.0, 187.0, 807.0, 12592.0, 895552.0, 135593.0, 2708.0, 359.0, 90.0, 71.0, 47.0, 37.0, 28.0, 31.0, 21.0, 23.0, 18.0, 18.0, 8.0, 8.0, 8.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.6953125, -13.1187744140625, -12.542236328125, -11.9656982421875, -11.38916015625, -10.8126220703125, -10.236083984375, -9.6595458984375, -9.0830078125, -8.5064697265625, -7.929931640625, -7.3533935546875, -6.77685546875, -6.2003173828125, -5.623779296875, -5.0472412109375, -4.470703125, -3.8941650390625, -3.317626953125, -2.7410888671875, -2.16455078125, -1.5880126953125, -1.011474609375, -0.4349365234375, 0.1416015625, 0.7181396484375, 1.294677734375, 1.8712158203125, 2.44775390625, 3.0242919921875, 3.600830078125, 4.1773681640625, 4.75390625, 5.3304443359375, 5.906982421875, 6.4835205078125, 7.06005859375, 7.6365966796875, 8.213134765625, 8.7896728515625, 9.3662109375, 9.9427490234375, 10.519287109375, 11.0958251953125, 11.67236328125, 12.2489013671875, 12.825439453125, 13.4019775390625, 13.978515625, 14.5550537109375, 15.131591796875, 15.7081298828125, 16.28466796875, 16.8612060546875, 17.437744140625, 18.0142822265625, 18.5908203125, 19.1673583984375, 19.743896484375, 20.3204345703125, 20.89697265625, 21.4735107421875, 22.050048828125, 22.6265869140625, 23.203125]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 8.0, 16.0, 20.0, 66.0, 163.0, 237.0, 230.0, 132.0, 90.0, 37.0, 10.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52294921875, -0.46512603759765625, -0.4073028564453125, -0.34947967529296875, -0.291656494140625, -0.23383331298828125, -0.1760101318359375, -0.11818695068359375, -0.06036376953125, -0.00254058837890625, 0.0552825927734375, 0.11310577392578125, 0.170928955078125, 0.22875213623046875, 0.2865753173828125, 0.34439849853515625, 0.4022216796875, 0.46004486083984375, 0.5178680419921875, 0.5756912231445312, 0.633514404296875, 0.6913375854492188, 0.7491607666015625, 0.8069839477539062, 0.86480712890625, 0.9226303100585938, 0.9804534912109375, 1.0382766723632812, 1.096099853515625, 1.1539230346679688, 1.2117462158203125, 1.2695693969726562, 1.327392578125, 1.3852157592773438, 1.4430389404296875, 1.5008621215820312, 1.558685302734375, 1.6165084838867188, 1.6743316650390625, 1.7321548461914062, 1.78997802734375, 1.8478012084960938, 1.9056243896484375, 1.9634475708007812, 2.021270751953125, 2.0790939331054688, 2.1369171142578125, 2.1947402954101562, 2.2525634765625, 2.3103866577148438, 2.3682098388671875, 2.4260330200195312, 2.483856201171875, 2.5416793823242188, 2.5995025634765625, 2.6573257446289062, 2.71514892578125, 2.7729721069335938, 2.8307952880859375, 2.8886184692382812, 2.946441650390625, 3.0042648315429688, 3.0620880126953125, 3.1199111938476562, 3.177734375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 5.0, 3.0, 5.0, 6.0, 9.0, 16.0, 26.0, 42.0, 51.0, 108.0, 164.0, 351.0, 668.0, 1650.0, 4408.0, 15397.0, 85998.0, 540105.0, 338294.0, 45827.0, 9777.0, 3182.0, 1219.0, 578.0, 276.0, 149.0, 80.0, 64.0, 39.0, 18.0, 18.0, 7.0, 6.0, 7.0, 4.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8046875, -4.632080078125, -4.45947265625, -4.286865234375, -4.1142578125, -3.941650390625, -3.76904296875, -3.596435546875, -3.423828125, -3.251220703125, -3.07861328125, -2.906005859375, -2.7333984375, -2.560791015625, -2.38818359375, -2.215576171875, -2.04296875, -1.870361328125, -1.69775390625, -1.525146484375, -1.3525390625, -1.179931640625, -1.00732421875, -0.834716796875, -0.662109375, -0.489501953125, -0.31689453125, -0.144287109375, 0.0283203125, 0.200927734375, 0.37353515625, 0.546142578125, 0.71875, 0.891357421875, 1.06396484375, 1.236572265625, 1.4091796875, 1.581787109375, 1.75439453125, 1.927001953125, 2.099609375, 2.272216796875, 2.44482421875, 2.617431640625, 2.7900390625, 2.962646484375, 3.13525390625, 3.307861328125, 3.48046875, 3.653076171875, 3.82568359375, 3.998291015625, 4.1708984375, 4.343505859375, 4.51611328125, 4.688720703125, 4.861328125, 5.033935546875, 5.20654296875, 5.379150390625, 5.5517578125, 5.724365234375, 5.89697265625, 6.069580078125, 6.2421875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 3.0, 7.0, 5.0, 4.0, 4.0, 16.0, 12.0, 9.0, 34.0, 30.0, 31.0, 54.0, 56.0, 65.0, 53.0, 66.0, 66.0, 74.0, 65.0, 59.0, 53.0, 42.0, 56.0, 36.0, 25.0, 27.0, 15.0, 11.0, 4.0, 7.0, 6.0, 3.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.865234375, -2.7657470703125, -2.666259765625, -2.5667724609375, -2.46728515625, -2.3677978515625, -2.268310546875, -2.1688232421875, -2.0693359375, -1.9698486328125, -1.870361328125, -1.7708740234375, -1.67138671875, -1.5718994140625, -1.472412109375, -1.3729248046875, -1.2734375, -1.1739501953125, -1.074462890625, -0.9749755859375, -0.87548828125, -0.7760009765625, -0.676513671875, -0.5770263671875, -0.4775390625, -0.3780517578125, -0.278564453125, -0.1790771484375, -0.07958984375, 0.0198974609375, 0.119384765625, 0.2188720703125, 0.318359375, 0.4178466796875, 0.517333984375, 0.6168212890625, 0.71630859375, 0.8157958984375, 0.915283203125, 1.0147705078125, 1.1142578125, 1.2137451171875, 1.313232421875, 1.4127197265625, 1.51220703125, 1.6116943359375, 1.711181640625, 1.8106689453125, 1.91015625, 2.0096435546875, 2.109130859375, 2.2086181640625, 2.30810546875, 2.4075927734375, 2.507080078125, 2.6065673828125, 2.7060546875, 2.8055419921875, 2.905029296875, 3.0045166015625, 3.10400390625, 3.2034912109375, 3.302978515625, 3.4024658203125, 3.501953125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 3.0, 4.0, 3.0, 18.0, 21.0, 32.0, 46.0, 106.0, 237.0, 532.0, 1752.0, 10327.0, 248260.0, 752368.0, 30010.0, 3274.0, 881.0, 336.0, 173.0, 67.0, 43.0, 24.0, 16.0, 8.0, 7.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.73828125, -6.529052734375, -6.31982421875, -6.110595703125, -5.9013671875, -5.692138671875, -5.48291015625, -5.273681640625, -5.064453125, -4.855224609375, -4.64599609375, -4.436767578125, -4.2275390625, -4.018310546875, -3.80908203125, -3.599853515625, -3.390625, -3.181396484375, -2.97216796875, -2.762939453125, -2.5537109375, -2.344482421875, -2.13525390625, -1.926025390625, -1.716796875, -1.507568359375, -1.29833984375, -1.089111328125, -0.8798828125, -0.670654296875, -0.46142578125, -0.252197265625, -0.04296875, 0.166259765625, 0.37548828125, 0.584716796875, 0.7939453125, 1.003173828125, 1.21240234375, 1.421630859375, 1.630859375, 1.840087890625, 2.04931640625, 2.258544921875, 2.4677734375, 2.677001953125, 2.88623046875, 3.095458984375, 3.3046875, 3.513916015625, 3.72314453125, 3.932373046875, 4.1416015625, 4.350830078125, 4.56005859375, 4.769287109375, 4.978515625, 5.187744140625, 5.39697265625, 5.606201171875, 5.8154296875, 6.024658203125, 6.23388671875, 6.443115234375, 6.65234375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 5.0, 9.0, 7.0, 4.0, 9.0, 15.0, 26.0, 45.0, 36.0, 63.0, 89.0, 99.0, 89.0, 95.0, 83.0, 87.0, 71.0, 47.0, 33.0, 29.0, 16.0, 16.0, 10.0, 3.0, 3.0, 5.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0003390312194824219, -0.0003236904740333557, -0.00030834972858428955, -0.0002930089831352234, -0.0002776682376861572, -0.00026232749223709106, -0.0002469867467880249, -0.00023164600133895874, -0.00021630525588989258, -0.00020096451044082642, -0.00018562376499176025, -0.0001702830195426941, -0.00015494227409362793, -0.00013960152864456177, -0.0001242607831954956, -0.00010892003774642944, -9.357929229736328e-05, -7.823854684829712e-05, -6.289780139923096e-05, -4.7557055950164795e-05, -3.221631050109863e-05, -1.687556505203247e-05, -1.5348196029663086e-06, 1.3805925846099854e-05, 2.9146671295166016e-05, 4.448741674423218e-05, 5.982816219329834e-05, 7.51689076423645e-05, 9.050965309143066e-05, 0.00010585039854049683, 0.00012119114398956299, 0.00013653188943862915, 0.0001518726348876953, 0.00016721338033676147, 0.00018255412578582764, 0.0001978948712348938, 0.00021323561668395996, 0.00022857636213302612, 0.00024391710758209229, 0.00025925785303115845, 0.0002745985984802246, 0.00028993934392929077, 0.00030528008937835693, 0.0003206208348274231, 0.00033596158027648926, 0.0003513023257255554, 0.0003666430711746216, 0.00038198381662368774, 0.0003973245620727539, 0.00041266530752182007, 0.00042800605297088623, 0.0004433467984199524, 0.00045868754386901855, 0.0004740282893180847, 0.0004893690347671509, 0.000504709780216217, 0.0005200505256652832, 0.0005353912711143494, 0.0005507320165634155, 0.0005660727620124817, 0.0005814135074615479, 0.000596754252910614, 0.0006120949983596802, 0.0006274357438087463, 0.0006427764892578125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 11.0, 4.0, 15.0, 22.0, 24.0, 51.0, 75.0, 151.0, 368.0, 860.0, 2705.0, 11954.0, 122001.0, 760186.0, 133028.0, 12622.0, 2856.0, 896.0, 364.0, 153.0, 88.0, 51.0, 29.0, 20.0, 8.0, 8.0, 3.0, 2.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4765625, -4.32489013671875, -4.1732177734375, -4.02154541015625, -3.869873046875, -3.71820068359375, -3.5665283203125, -3.41485595703125, -3.26318359375, -3.11151123046875, -2.9598388671875, -2.80816650390625, -2.656494140625, -2.50482177734375, -2.3531494140625, -2.20147705078125, -2.0498046875, -1.89813232421875, -1.7464599609375, -1.59478759765625, -1.443115234375, -1.29144287109375, -1.1397705078125, -0.98809814453125, -0.83642578125, -0.68475341796875, -0.5330810546875, -0.38140869140625, -0.229736328125, -0.07806396484375, 0.0736083984375, 0.22528076171875, 0.376953125, 0.52862548828125, 0.6802978515625, 0.83197021484375, 0.983642578125, 1.13531494140625, 1.2869873046875, 1.43865966796875, 1.59033203125, 1.74200439453125, 1.8936767578125, 2.04534912109375, 2.197021484375, 2.34869384765625, 2.5003662109375, 2.65203857421875, 2.8037109375, 2.95538330078125, 3.1070556640625, 3.25872802734375, 3.410400390625, 3.56207275390625, 3.7137451171875, 3.86541748046875, 4.01708984375, 4.16876220703125, 4.3204345703125, 4.47210693359375, 4.623779296875, 4.77545166015625, 4.9271240234375, 5.07879638671875, 5.23046875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 9.0, 4.0, 5.0, 4.0, 11.0, 13.0, 19.0, 28.0, 29.0, 46.0, 57.0, 58.0, 92.0, 86.0, 83.0, 88.0, 75.0, 60.0, 71.0, 39.0, 33.0, 19.0, 24.0, 22.0, 13.0, 3.0, 3.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.7705078125, -1.719329833984375, -1.66815185546875, -1.616973876953125, -1.5657958984375, -1.514617919921875, -1.46343994140625, -1.412261962890625, -1.361083984375, -1.309906005859375, -1.25872802734375, -1.207550048828125, -1.1563720703125, -1.105194091796875, -1.05401611328125, -1.002838134765625, -0.95166015625, -0.900482177734375, -0.84930419921875, -0.798126220703125, -0.7469482421875, -0.695770263671875, -0.64459228515625, -0.593414306640625, -0.542236328125, -0.491058349609375, -0.43988037109375, -0.388702392578125, -0.3375244140625, -0.286346435546875, -0.23516845703125, -0.183990478515625, -0.1328125, -0.081634521484375, -0.03045654296875, 0.020721435546875, 0.0718994140625, 0.123077392578125, 0.17425537109375, 0.225433349609375, 0.276611328125, 0.327789306640625, 0.37896728515625, 0.430145263671875, 0.4813232421875, 0.532501220703125, 0.58367919921875, 0.634857177734375, 0.68603515625, 0.737213134765625, 0.78839111328125, 0.839569091796875, 0.8907470703125, 0.941925048828125, 0.99310302734375, 1.044281005859375, 1.095458984375, 1.146636962890625, 1.19781494140625, 1.248992919921875, 1.3001708984375, 1.351348876953125, 1.40252685546875, 1.453704833984375, 1.5048828125]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 8.0, 11.0, 33.0, 188.0, 447.0, 240.0, 62.0, 17.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-110.72560119628906, -108.58108520507812, -106.43656921386719, -104.29205322265625, -102.14754486083984, -100.0030288696289, -97.85851287841797, -95.71399688720703, -93.5694808959961, -91.42496490478516, -89.28044891357422, -87.13594055175781, -84.99142456054688, -82.84690856933594, -80.702392578125, -78.55787658691406, -76.41336059570312, -74.26884460449219, -72.12432861328125, -69.97981262207031, -67.8353042602539, -65.69078826904297, -63.54627227783203, -61.401756286621094, -59.25724792480469, -57.11273193359375, -54.96821975708008, -52.82370376586914, -50.6791877746582, -48.53467559814453, -46.390159606933594, -44.245643615722656, -42.10112762451172, -39.95661163330078, -37.81209945678711, -35.66758346557617, -33.523067474365234, -31.37855339050293, -29.234039306640625, -27.089523315429688, -24.945009231567383, -22.800495147705078, -20.65597915649414, -18.511465072631836, -16.36695098876953, -14.222434997558594, -12.077920913696289, -9.933405876159668, -7.788890838623047, -5.644375801086426, -3.499861240386963, -1.3553466796875, 0.7891683578491211, 2.933683395385742, 5.078197479248047, 7.222712516784668, 9.367227554321289, 11.51174259185791, 13.656257629394531, 15.800771713256836, 17.94528579711914, 20.089801788330078, 22.234315872192383, 24.378829956054688, 26.523345947265625]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 7.0, 4.0, 9.0, 16.0, 28.0, 36.0, 41.0, 58.0, 67.0, 79.0, 87.0, 74.0, 101.0, 92.0, 86.0, 54.0, 43.0, 44.0, 29.0, 20.0, 16.0, 3.0, 6.0, 8.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.819007873535156, -31.993244171142578, -31.167478561401367, -30.34171485900879, -29.515949249267578, -28.690185546875, -27.864421844482422, -27.03865623474121, -26.212890625, -25.387126922607422, -24.56136131286621, -23.735597610473633, -22.909832000732422, -22.084068298339844, -21.258304595947266, -20.432538986206055, -19.606775283813477, -18.7810115814209, -17.955245971679688, -17.12948226928711, -16.3037166595459, -15.47795295715332, -14.652188301086426, -13.826423645019531, -13.000658988952637, -12.174894332885742, -11.349129676818848, -10.523365020751953, -9.697601318359375, -8.871835708618164, -8.046072006225586, -7.220307350158691, -6.394542694091797, -5.568778038024902, -4.743013381958008, -3.9172492027282715, -3.091484546661377, -2.2657198905944824, -1.439955711364746, -0.6141910552978516, 0.21157360076904297, 1.037338137626648, 1.863102674484253, 2.6888670921325684, 3.514631748199463, 4.340396404266357, 5.166160583496094, 5.991925239562988, 6.817689895629883, 7.643454551696777, 8.469219207763672, 9.29498291015625, 10.120748519897461, 10.946512222290039, 11.772276878356934, 12.598041534423828, 13.423806190490723, 14.249570846557617, 15.075335502624512, 15.901100158691406, 16.726863861083984, 17.552629470825195, 18.378393173217773, 19.204158782958984, 20.029922485351562]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 4.0, 8.0, 12.0, 33.0, 98.0, 233.0, 902.0, 8291.0, 748917.0, 3422868.0, 10760.0, 1147.0, 346.0, 171.0, 88.0, 65.0, 52.0, 65.0, 52.0, 30.0, 29.0, 20.0, 22.0, 17.0, 14.0, 12.0, 9.0, 7.0, 6.0, 3.0, 5.0, 2.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.57421875, -5.01983642578125, -4.4654541015625, -3.91107177734375, -3.356689453125, -2.80230712890625, -2.2479248046875, -1.69354248046875, -1.13916015625, -0.58477783203125, -0.0303955078125, 0.52398681640625, 1.078369140625, 1.63275146484375, 2.1871337890625, 2.74151611328125, 3.2958984375, 3.85028076171875, 4.4046630859375, 4.95904541015625, 5.513427734375, 6.06781005859375, 6.6221923828125, 7.17657470703125, 7.73095703125, 8.28533935546875, 8.8397216796875, 9.39410400390625, 9.948486328125, 10.50286865234375, 11.0572509765625, 11.61163330078125, 12.166015625, 12.72039794921875, 13.2747802734375, 13.82916259765625, 14.383544921875, 14.93792724609375, 15.4923095703125, 16.04669189453125, 16.60107421875, 17.15545654296875, 17.7098388671875, 18.26422119140625, 18.818603515625, 19.37298583984375, 19.9273681640625, 20.48175048828125, 21.0361328125, 21.59051513671875, 22.1448974609375, 22.69927978515625, 23.253662109375, 23.80804443359375, 24.3624267578125, 24.91680908203125, 25.47119140625, 26.02557373046875, 26.5799560546875, 27.13433837890625, 27.688720703125, 28.24310302734375, 28.7974853515625, 29.35186767578125, 29.90625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 5.0, 4.0, 16.0, 44.0, 70.0, 126.0, 184.0, 222.0, 146.0, 111.0, 50.0, 25.0, 9.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.495849609375, -0.4425697326660156, -0.38928985595703125, -0.3360099792480469, -0.2827301025390625, -0.22945022583007812, -0.17617034912109375, -0.12289047241210938, -0.069610595703125, -0.016330718994140625, 0.03694915771484375, 0.09022903442382812, 0.1435089111328125, 0.19678878784179688, 0.25006866455078125, 0.3033485412597656, 0.35662841796875, 0.4099082946777344, 0.46318817138671875, 0.5164680480957031, 0.5697479248046875, 0.6230278015136719, 0.6763076782226562, 0.7295875549316406, 0.782867431640625, 0.8361473083496094, 0.8894271850585938, 0.9427070617675781, 0.9959869384765625, 1.0492668151855469, 1.1025466918945312, 1.1558265686035156, 1.2091064453125, 1.2623863220214844, 1.3156661987304688, 1.3689460754394531, 1.4222259521484375, 1.4755058288574219, 1.5287857055664062, 1.5820655822753906, 1.635345458984375, 1.6886253356933594, 1.7419052124023438, 1.7951850891113281, 1.8484649658203125, 1.9017448425292969, 1.9550247192382812, 2.0083045959472656, 2.06158447265625, 2.1148643493652344, 2.1681442260742188, 2.221424102783203, 2.2747039794921875, 2.327983856201172, 2.3812637329101562, 2.4345436096191406, 2.487823486328125, 2.5411033630371094, 2.5943832397460938, 2.647663116455078, 2.7009429931640625, 2.754222869873047, 2.8075027465820312, 2.8607826232910156, 2.9140625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 5.0, 11.0, 29.0, 42.0, 119.0, 347.0, 1118.0, 15147.0, 4148582.0, 26215.0, 1740.0, 482.0, 241.0, 108.0, 52.0, 21.0, 13.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.6171875, -12.7945556640625, -11.971923828125, -11.1492919921875, -10.32666015625, -9.5040283203125, -8.681396484375, -7.8587646484375, -7.0361328125, -6.2135009765625, -5.390869140625, -4.5682373046875, -3.74560546875, -2.9229736328125, -2.100341796875, -1.2777099609375, -0.455078125, 0.3675537109375, 1.190185546875, 2.0128173828125, 2.83544921875, 3.6580810546875, 4.480712890625, 5.3033447265625, 6.1259765625, 6.9486083984375, 7.771240234375, 8.5938720703125, 9.41650390625, 10.2391357421875, 11.061767578125, 11.8843994140625, 12.70703125, 13.5296630859375, 14.352294921875, 15.1749267578125, 15.99755859375, 16.8201904296875, 17.642822265625, 18.4654541015625, 19.2880859375, 20.1107177734375, 20.933349609375, 21.7559814453125, 22.57861328125, 23.4012451171875, 24.223876953125, 25.0465087890625, 25.869140625, 26.6917724609375, 27.514404296875, 28.3370361328125, 29.15966796875, 29.9822998046875, 30.804931640625, 31.6275634765625, 32.4501953125, 33.2728271484375, 34.095458984375, 34.9180908203125, 35.74072265625, 36.5633544921875, 37.385986328125, 38.2086181640625, 39.03125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 5.0, 0.0, 5.0, 12.0, 21.0, 34.0, 63.0, 160.0, 354.0, 1715.0, 1124.0, 296.0, 124.0, 61.0, 45.0, 18.0, 17.0, 7.0, 4.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.97021484375, -0.9091873168945312, -0.8481597900390625, -0.7871322631835938, -0.726104736328125, -0.6650772094726562, -0.6040496826171875, -0.5430221557617188, -0.48199462890625, -0.42096710205078125, -0.3599395751953125, -0.29891204833984375, -0.237884521484375, -0.17685699462890625, -0.1158294677734375, -0.05480194091796875, 0.0062255859375, 0.06725311279296875, 0.1282806396484375, 0.18930816650390625, 0.250335693359375, 0.31136322021484375, 0.3723907470703125, 0.43341827392578125, 0.49444580078125, 0.5554733276367188, 0.6165008544921875, 0.6775283813476562, 0.738555908203125, 0.7995834350585938, 0.8606109619140625, 0.9216384887695312, 0.982666015625, 1.0436935424804688, 1.1047210693359375, 1.1657485961914062, 1.226776123046875, 1.2878036499023438, 1.3488311767578125, 1.4098587036132812, 1.47088623046875, 1.5319137573242188, 1.5929412841796875, 1.6539688110351562, 1.714996337890625, 1.7760238647460938, 1.8370513916015625, 1.8980789184570312, 1.9591064453125, 2.0201339721679688, 2.0811614990234375, 2.1421890258789062, 2.203216552734375, 2.2642440795898438, 2.3252716064453125, 2.3862991333007812, 2.44732666015625, 2.5083541870117188, 2.5693817138671875, 2.6304092407226562, 2.691436767578125, 2.7524642944335938, 2.8134918212890625, 2.8745193481445312, 2.935546875]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 18.0, 19.0, 44.0, 122.0, 149.0, 221.0, 184.0, 91.0, 62.0, 34.0, 22.0, 8.0, 7.0, 5.0, 2.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.326394081115723, -7.91871976852417, -7.511045455932617, -7.103371620178223, -6.695696830749512, -6.288022994995117, -5.8803486824035645, -5.472674369812012, -5.065000057220459, -4.657325744628906, -4.2496514320373535, -3.84197735786438, -3.434303045272827, -3.0266287326812744, -2.618954658508301, -2.211280345916748, -1.8036060333251953, -1.3959317207336426, -0.9882575273513794, -0.5805833339691162, -0.17290902137756348, 0.23476529121398926, 0.6424393653869629, 1.0501136779785156, 1.4577879905700684, 1.865462303161621, 2.273136615753174, 2.6808106899261475, 3.0884850025177, 3.496159315109253, 3.9038333892822266, 4.311507701873779, 4.719181060791016, 5.126855373382568, 5.534529685974121, 5.942203521728516, 6.349878311157227, 6.757552146911621, 7.165226459503174, 7.572900772094727, 7.980575084686279, 8.388249397277832, 8.795923233032227, 9.203598022460938, 9.611271858215332, 10.018946647644043, 10.426620483398438, 10.834295272827148, 11.241969108581543, 11.649642944335938, 12.057317733764648, 12.464991569519043, 12.872666358947754, 13.280340194702148, 13.68801498413086, 14.095688819885254, 14.503362655639648, 14.911036491394043, 15.318711280822754, 15.726385116577148, 16.13405990600586, 16.54173469543457, 16.94940757751465, 17.35708236694336, 17.76475715637207]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 6.0, 6.0, 12.0, 16.0, 29.0, 42.0, 42.0, 50.0, 69.0, 96.0, 99.0, 73.0, 94.0, 85.0, 71.0, 60.0, 50.0, 37.0, 18.0, 11.0, 11.0, 8.0, 5.0, 6.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.946641445159912, -7.660915374755859, -7.375189781188965, -7.089463710784912, -6.803737640380859, -6.518012046813965, -6.232285976409912, -5.946559906005859, -5.660834312438965, -5.375108242034912, -5.089382648468018, -4.803656578063965, -4.51793098449707, -4.232204914093018, -3.946478843688965, -3.660753011703491, -3.3750271797180176, -3.089301347732544, -2.8035755157470703, -2.5178494453430176, -2.232123613357544, -1.9463977813720703, -1.6606718301773071, -1.374945878982544, -1.0892200469970703, -0.8034941554069519, -0.5177682638168335, -0.2320423722267151, 0.05368351936340332, 0.33940935134887695, 0.6251353025436401, 0.9108612537384033, 1.1965866088867188, 1.4823124408721924, 1.7680383920669556, 2.0537643432617188, 2.3394901752471924, 2.625216007232666, 2.9109420776367188, 3.1966679096221924, 3.482393741607666, 3.7681195735931396, 4.053845405578613, 4.339571475982666, 4.625297546386719, 4.911023139953613, 5.196749210357666, 5.482475280761719, 5.768200874328613, 6.053926944732666, 6.3396525382995605, 6.625378608703613, 6.911104202270508, 7.1968302726745605, 7.482556343078613, 7.768281936645508, 8.054008483886719, 8.339734077453613, 8.625460624694824, 8.911186218261719, 9.196911811828613, 9.482637405395508, 9.768363952636719, 10.054089546203613, 10.339815139770508]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 1.0, 2.0, 7.0, 8.0, 5.0, 11.0, 14.0, 16.0, 17.0, 14.0, 30.0, 28.0, 35.0, 61.0, 63.0, 115.0, 303.0, 947.0, 6669.0, 173473.0, 824523.0, 38400.0, 2637.0, 548.0, 234.0, 108.0, 62.0, 42.0, 41.0, 31.0, 28.0, 17.0, 20.0, 5.0, 12.0, 10.0, 6.0, 4.0, 0.0, 5.0, 5.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.3203125, -10.9466552734375, -10.572998046875, -10.1993408203125, -9.82568359375, -9.4520263671875, -9.078369140625, -8.7047119140625, -8.3310546875, -7.9573974609375, -7.583740234375, -7.2100830078125, -6.83642578125, -6.4627685546875, -6.089111328125, -5.7154541015625, -5.341796875, -4.9681396484375, -4.594482421875, -4.2208251953125, -3.84716796875, -3.4735107421875, -3.099853515625, -2.7261962890625, -2.3525390625, -1.9788818359375, -1.605224609375, -1.2315673828125, -0.85791015625, -0.4842529296875, -0.110595703125, 0.2630615234375, 0.63671875, 1.0103759765625, 1.384033203125, 1.7576904296875, 2.13134765625, 2.5050048828125, 2.878662109375, 3.2523193359375, 3.6259765625, 3.9996337890625, 4.373291015625, 4.7469482421875, 5.12060546875, 5.4942626953125, 5.867919921875, 6.2415771484375, 6.615234375, 6.9888916015625, 7.362548828125, 7.7362060546875, 8.10986328125, 8.4835205078125, 8.857177734375, 9.2308349609375, 9.6044921875, 9.9781494140625, 10.351806640625, 10.7254638671875, 11.09912109375, 11.4727783203125, 11.846435546875, 12.2200927734375, 12.59375]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 1.0, 14.0, 16.0, 39.0, 80.0, 121.0, 175.0, 186.0, 144.0, 115.0, 55.0, 36.0, 14.0, 9.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6396484375, -0.5835418701171875, -0.527435302734375, -0.4713287353515625, -0.41522216796875, -0.3591156005859375, -0.303009033203125, -0.2469024658203125, -0.1907958984375, -0.1346893310546875, -0.078582763671875, -0.0224761962890625, 0.03363037109375, 0.0897369384765625, 0.145843505859375, 0.2019500732421875, 0.258056640625, 0.3141632080078125, 0.370269775390625, 0.4263763427734375, 0.48248291015625, 0.5385894775390625, 0.594696044921875, 0.6508026123046875, 0.7069091796875, 0.7630157470703125, 0.819122314453125, 0.8752288818359375, 0.93133544921875, 0.9874420166015625, 1.043548583984375, 1.0996551513671875, 1.15576171875, 1.2118682861328125, 1.267974853515625, 1.3240814208984375, 1.38018798828125, 1.4362945556640625, 1.492401123046875, 1.5485076904296875, 1.6046142578125, 1.6607208251953125, 1.716827392578125, 1.7729339599609375, 1.82904052734375, 1.8851470947265625, 1.941253662109375, 1.9973602294921875, 2.053466796875, 2.1095733642578125, 2.165679931640625, 2.2217864990234375, 2.27789306640625, 2.3339996337890625, 2.390106201171875, 2.4462127685546875, 2.5023193359375, 2.5584259033203125, 2.614532470703125, 2.6706390380859375, 2.72674560546875, 2.7828521728515625, 2.838958740234375, 2.8950653076171875, 2.951171875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 5.0, 6.0, 11.0, 16.0, 26.0, 35.0, 54.0, 87.0, 147.0, 255.0, 448.0, 768.0, 1480.0, 3338.0, 8596.0, 27501.0, 119738.0, 465592.0, 322840.0, 68724.0, 17795.0, 5997.0, 2418.0, 1159.0, 594.0, 365.0, 200.0, 128.0, 69.0, 54.0, 37.0, 27.0, 9.0, 14.0, 7.0, 6.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.83984375, -3.71527099609375, -3.5906982421875, -3.46612548828125, -3.341552734375, -3.21697998046875, -3.0924072265625, -2.96783447265625, -2.84326171875, -2.71868896484375, -2.5941162109375, -2.46954345703125, -2.344970703125, -2.22039794921875, -2.0958251953125, -1.97125244140625, -1.8466796875, -1.72210693359375, -1.5975341796875, -1.47296142578125, -1.348388671875, -1.22381591796875, -1.0992431640625, -0.97467041015625, -0.85009765625, -0.72552490234375, -0.6009521484375, -0.47637939453125, -0.351806640625, -0.22723388671875, -0.1026611328125, 0.02191162109375, 0.146484375, 0.27105712890625, 0.3956298828125, 0.52020263671875, 0.644775390625, 0.76934814453125, 0.8939208984375, 1.01849365234375, 1.14306640625, 1.26763916015625, 1.3922119140625, 1.51678466796875, 1.641357421875, 1.76593017578125, 1.8905029296875, 2.01507568359375, 2.1396484375, 2.26422119140625, 2.3887939453125, 2.51336669921875, 2.637939453125, 2.76251220703125, 2.8870849609375, 3.01165771484375, 3.13623046875, 3.26080322265625, 3.3853759765625, 3.50994873046875, 3.634521484375, 3.75909423828125, 3.8836669921875, 4.00823974609375, 4.1328125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 7.0, 4.0, 10.0, 7.0, 4.0, 6.0, 15.0, 12.0, 13.0, 23.0, 17.0, 27.0, 39.0, 45.0, 51.0, 44.0, 49.0, 37.0, 47.0, 60.0, 46.0, 44.0, 49.0, 49.0, 34.0, 38.0, 32.0, 30.0, 27.0, 26.0, 16.0, 22.0, 19.0, 14.0, 9.0, 6.0, 6.0, 4.0, 7.0, 3.0, 4.0, 3.0, 2.0, 3.0], "bins": [-3.283203125, -3.2012481689453125, -3.119293212890625, -3.0373382568359375, -2.95538330078125, -2.8734283447265625, -2.791473388671875, -2.7095184326171875, -2.6275634765625, -2.5456085205078125, -2.463653564453125, -2.3816986083984375, -2.29974365234375, -2.2177886962890625, -2.135833740234375, -2.0538787841796875, -1.971923828125, -1.8899688720703125, -1.808013916015625, -1.7260589599609375, -1.64410400390625, -1.5621490478515625, -1.480194091796875, -1.3982391357421875, -1.3162841796875, -1.2343292236328125, -1.152374267578125, -1.0704193115234375, -0.98846435546875, -0.9065093994140625, -0.824554443359375, -0.7425994873046875, -0.66064453125, -0.5786895751953125, -0.496734619140625, -0.4147796630859375, -0.33282470703125, -0.2508697509765625, -0.168914794921875, -0.0869598388671875, -0.0050048828125, 0.0769500732421875, 0.158905029296875, 0.2408599853515625, 0.32281494140625, 0.4047698974609375, 0.486724853515625, 0.5686798095703125, 0.650634765625, 0.7325897216796875, 0.814544677734375, 0.8964996337890625, 0.97845458984375, 1.0604095458984375, 1.142364501953125, 1.2243194580078125, 1.3062744140625, 1.3882293701171875, 1.470184326171875, 1.5521392822265625, 1.63409423828125, 1.7160491943359375, 1.798004150390625, 1.8799591064453125, 1.9619140625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 5.0, 7.0, 10.0, 14.0, 17.0, 33.0, 35.0, 39.0, 59.0, 93.0, 151.0, 257.0, 341.0, 653.0, 1251.0, 2759.0, 6422.0, 17595.0, 59807.0, 231519.0, 456499.0, 194508.0, 50216.0, 15333.0, 5769.0, 2422.0, 1194.0, 614.0, 303.0, 191.0, 131.0, 90.0, 63.0, 38.0, 31.0, 24.0, 24.0, 14.0, 11.0, 5.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.005859375, -1.949249267578125, -1.89263916015625, -1.836029052734375, -1.7794189453125, -1.722808837890625, -1.66619873046875, -1.609588623046875, -1.552978515625, -1.496368408203125, -1.43975830078125, -1.383148193359375, -1.3265380859375, -1.269927978515625, -1.21331787109375, -1.156707763671875, -1.10009765625, -1.043487548828125, -0.98687744140625, -0.930267333984375, -0.8736572265625, -0.817047119140625, -0.76043701171875, -0.703826904296875, -0.647216796875, -0.590606689453125, -0.53399658203125, -0.477386474609375, -0.4207763671875, -0.364166259765625, -0.30755615234375, -0.250946044921875, -0.1943359375, -0.137725830078125, -0.08111572265625, -0.024505615234375, 0.0321044921875, 0.088714599609375, 0.14532470703125, 0.201934814453125, 0.258544921875, 0.315155029296875, 0.37176513671875, 0.428375244140625, 0.4849853515625, 0.541595458984375, 0.59820556640625, 0.654815673828125, 0.71142578125, 0.768035888671875, 0.82464599609375, 0.881256103515625, 0.9378662109375, 0.994476318359375, 1.05108642578125, 1.107696533203125, 1.164306640625, 1.220916748046875, 1.27752685546875, 1.334136962890625, 1.3907470703125, 1.447357177734375, 1.50396728515625, 1.560577392578125, 1.6171875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 0.0, 2.0, 1.0, 6.0, 2.0, 6.0, 3.0, 9.0, 10.0, 14.0, 9.0, 14.0, 19.0, 20.0, 23.0, 25.0, 41.0, 45.0, 57.0, 56.0, 77.0, 93.0, 75.0, 63.0, 50.0, 67.0, 46.0, 38.0, 27.0, 29.0, 17.0, 11.0, 12.0, 6.0, 5.0, 5.0, 7.0, 3.0, 4.0, 1.0, 3.0, 1.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0003266334533691406, -0.0003174878656864166, -0.0003083422780036926, -0.00029919669032096863, -0.00029005110263824463, -0.00028090551495552063, -0.00027175992727279663, -0.00026261433959007263, -0.00025346875190734863, -0.00024432316422462463, -0.00023517757654190063, -0.00022603198885917664, -0.00021688640117645264, -0.00020774081349372864, -0.00019859522581100464, -0.00018944963812828064, -0.00018030405044555664, -0.00017115846276283264, -0.00016201287508010864, -0.00015286728739738464, -0.00014372169971466064, -0.00013457611203193665, -0.00012543052434921265, -0.00011628493666648865, -0.00010713934898376465, -9.799376130104065e-05, -8.884817361831665e-05, -7.970258593559265e-05, -7.055699825286865e-05, -6.141141057014465e-05, -5.2265822887420654e-05, -4.3120235204696655e-05, -3.3974647521972656e-05, -2.4829059839248657e-05, -1.5683472156524658e-05, -6.537884473800659e-06, 2.60770320892334e-06, 1.1753290891647339e-05, 2.0898878574371338e-05, 3.0044466257095337e-05, 3.9190053939819336e-05, 4.8335641622543335e-05, 5.7481229305267334e-05, 6.662681698799133e-05, 7.577240467071533e-05, 8.491799235343933e-05, 9.406358003616333e-05, 0.00010320916771888733, 0.00011235475540161133, 0.00012150034308433533, 0.00013064593076705933, 0.00013979151844978333, 0.00014893710613250732, 0.00015808269381523132, 0.00016722828149795532, 0.00017637386918067932, 0.00018551945686340332, 0.00019466504454612732, 0.00020381063222885132, 0.00021295621991157532, 0.00022210180759429932, 0.00023124739527702332, 0.00024039298295974731, 0.0002495385706424713, 0.0002586841583251953]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 6.0, 11.0, 5.0, 12.0, 13.0, 27.0, 34.0, 45.0, 59.0, 88.0, 162.0, 253.0, 443.0, 800.0, 1660.0, 3664.0, 9241.0, 29886.0, 142230.0, 500998.0, 279107.0, 55106.0, 14400.0, 5372.0, 2326.0, 1108.0, 591.0, 320.0, 204.0, 122.0, 95.0, 48.0, 25.0, 24.0, 16.0, 11.0, 14.0, 5.0, 8.0, 4.0, 8.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0], "bins": [-2.349609375, -2.2838134765625, -2.218017578125, -2.1522216796875, -2.08642578125, -2.0206298828125, -1.954833984375, -1.8890380859375, -1.8232421875, -1.7574462890625, -1.691650390625, -1.6258544921875, -1.56005859375, -1.4942626953125, -1.428466796875, -1.3626708984375, -1.296875, -1.2310791015625, -1.165283203125, -1.0994873046875, -1.03369140625, -0.9678955078125, -0.902099609375, -0.8363037109375, -0.7705078125, -0.7047119140625, -0.638916015625, -0.5731201171875, -0.50732421875, -0.4415283203125, -0.375732421875, -0.3099365234375, -0.244140625, -0.1783447265625, -0.112548828125, -0.0467529296875, 0.01904296875, 0.0848388671875, 0.150634765625, 0.2164306640625, 0.2822265625, 0.3480224609375, 0.413818359375, 0.4796142578125, 0.54541015625, 0.6112060546875, 0.677001953125, 0.7427978515625, 0.80859375, 0.8743896484375, 0.940185546875, 1.0059814453125, 1.07177734375, 1.1375732421875, 1.203369140625, 1.2691650390625, 1.3349609375, 1.4007568359375, 1.466552734375, 1.5323486328125, 1.59814453125, 1.6639404296875, 1.729736328125, 1.7955322265625, 1.861328125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 4.0, 3.0, 4.0, 6.0, 5.0, 16.0, 14.0, 19.0, 34.0, 38.0, 52.0, 68.0, 78.0, 68.0, 87.0, 76.0, 71.0, 71.0, 60.0, 51.0, 44.0, 35.0, 19.0, 22.0, 16.0, 8.0, 9.0, 9.0, 5.0, 2.0, 2.0, 4.0, 0.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.251953125, -1.207611083984375, -1.16326904296875, -1.118927001953125, -1.0745849609375, -1.030242919921875, -0.98590087890625, -0.941558837890625, -0.897216796875, -0.852874755859375, -0.80853271484375, -0.764190673828125, -0.7198486328125, -0.675506591796875, -0.63116455078125, -0.586822509765625, -0.54248046875, -0.498138427734375, -0.45379638671875, -0.409454345703125, -0.3651123046875, -0.320770263671875, -0.27642822265625, -0.232086181640625, -0.187744140625, -0.143402099609375, -0.09906005859375, -0.054718017578125, -0.0103759765625, 0.033966064453125, 0.07830810546875, 0.122650146484375, 0.1669921875, 0.211334228515625, 0.25567626953125, 0.300018310546875, 0.3443603515625, 0.388702392578125, 0.43304443359375, 0.477386474609375, 0.521728515625, 0.566070556640625, 0.61041259765625, 0.654754638671875, 0.6990966796875, 0.743438720703125, 0.78778076171875, 0.832122802734375, 0.87646484375, 0.920806884765625, 0.96514892578125, 1.009490966796875, 1.0538330078125, 1.098175048828125, 1.14251708984375, 1.186859130859375, 1.231201171875, 1.275543212890625, 1.31988525390625, 1.364227294921875, 1.4085693359375, 1.452911376953125, 1.49725341796875, 1.541595458984375, 1.5859375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 12.0, 45.0, 126.0, 269.0, 317.0, 154.0, 52.0, 17.0, 5.0, 5.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.29301452636719, -74.70619201660156, -73.11936950683594, -71.53254699707031, -69.94571685791016, -68.35889434814453, -66.7720718383789, -65.18524932861328, -63.59842300415039, -62.011600494384766, -60.424774169921875, -58.83795166015625, -57.251129150390625, -55.664302825927734, -54.07748031616211, -52.49065399169922, -50.903831481933594, -49.31700897216797, -47.73018264770508, -46.14336013793945, -44.55653762817383, -42.96971130371094, -41.38288879394531, -39.79606628417969, -38.20924377441406, -36.62242126464844, -35.03559494018555, -33.44877243041992, -31.861948013305664, -30.275123596191406, -28.68830108642578, -27.101476669311523, -25.514652252197266, -23.927827835083008, -22.341005325317383, -20.754180908203125, -19.167356491088867, -17.58053207397461, -15.993709564208984, -14.406885147094727, -12.820061683654785, -11.233238220214844, -9.646413803100586, -8.059590339660645, -6.472766399383545, -4.885942459106445, -3.299118995666504, -1.712294578552246, -0.1254711151123047, 1.4613527059555054, 3.0481765270233154, 4.635000228881836, 6.2218241691589355, 7.808648109436035, 9.395471572875977, 10.982295989990234, 12.569119453430176, 14.155942916870117, 15.742767333984375, 17.32958984375, 18.916414260864258, 20.503238677978516, 22.09006118774414, 23.67688751220703, 25.263710021972656]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 3.0, 4.0, 9.0, 9.0, 13.0, 12.0, 17.0, 15.0, 19.0, 34.0, 33.0, 26.0, 31.0, 42.0, 45.0, 47.0, 50.0, 52.0, 48.0, 59.0, 50.0, 50.0, 47.0, 50.0, 38.0, 34.0, 32.0, 24.0, 22.0, 12.0, 15.0, 20.0, 9.0, 11.0, 3.0, 5.0, 6.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.388898849487305, -16.89767837524414, -16.40645980834961, -15.915239334106445, -15.424019813537598, -14.93280029296875, -14.441580772399902, -13.950361251831055, -13.45914077758789, -12.967921257019043, -12.476701736450195, -11.985481262207031, -11.494261741638184, -11.003042221069336, -10.511822700500488, -10.02060317993164, -9.529382705688477, -9.038163185119629, -8.546943664550781, -8.055723190307617, -7.5645036697387695, -7.073284149169922, -6.582064628601074, -6.090844631195068, -5.599625587463379, -5.108406066894531, -4.617186069488525, -4.125966548919678, -3.634746551513672, -3.143527030944824, -2.6523072719573975, -2.1610875129699707, -1.6698675155639648, -1.178647756576538, -0.6874280571937561, -0.19620835781097412, 0.29501140117645264, 0.7862310409545898, 1.2774507999420166, 1.7686705589294434, 2.25989031791687, 2.751110076904297, 3.2423298358917236, 3.7335495948791504, 4.224769115447998, 4.715989112854004, 5.207208633422852, 5.698428153991699, 6.189648151397705, 6.680867671966553, 7.172087669372559, 7.663307189941406, 8.154526710510254, 8.645746231079102, 9.136966705322266, 9.628186225891113, 10.119405746459961, 10.610625267028809, 11.101844787597656, 11.59306526184082, 12.084284782409668, 12.575504302978516, 13.066723823547363, 13.557943344116211, 14.049163818359375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 10.0, 20.0, 27.0, 47.0, 79.0, 213.0, 584.0, 1982.0, 11637.0, 335696.0, 3813026.0, 25881.0, 3235.0, 856.0, 352.0, 172.0, 117.0, 85.0, 51.0, 43.0, 34.0, 30.0, 12.0, 13.0, 14.0, 13.0, 6.0, 8.0, 10.0, 2.0, 3.0, 4.0, 1.0, 3.0, 2.0, 1.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.44921875, -6.11285400390625, -5.7764892578125, -5.44012451171875, -5.103759765625, -4.76739501953125, -4.4310302734375, -4.09466552734375, -3.75830078125, -3.42193603515625, -3.0855712890625, -2.74920654296875, -2.412841796875, -2.07647705078125, -1.7401123046875, -1.40374755859375, -1.0673828125, -0.73101806640625, -0.3946533203125, -0.05828857421875, 0.278076171875, 0.61444091796875, 0.9508056640625, 1.28717041015625, 1.62353515625, 1.95989990234375, 2.2962646484375, 2.63262939453125, 2.968994140625, 3.30535888671875, 3.6417236328125, 3.97808837890625, 4.314453125, 4.65081787109375, 4.9871826171875, 5.32354736328125, 5.659912109375, 5.99627685546875, 6.3326416015625, 6.66900634765625, 7.00537109375, 7.34173583984375, 7.6781005859375, 8.01446533203125, 8.350830078125, 8.68719482421875, 9.0235595703125, 9.35992431640625, 9.6962890625, 10.03265380859375, 10.3690185546875, 10.70538330078125, 11.041748046875, 11.37811279296875, 11.7144775390625, 12.05084228515625, 12.38720703125, 12.72357177734375, 13.0599365234375, 13.39630126953125, 13.732666015625, 14.06903076171875, 14.4053955078125, 14.74176025390625, 15.078125]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 4.0, 7.0, 21.0, 43.0, 64.0, 93.0, 137.0, 170.0, 164.0, 130.0, 95.0, 39.0, 27.0, 14.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.66259765625, -0.6064987182617188, -0.5503997802734375, -0.49430084228515625, -0.438201904296875, -0.38210296630859375, -0.3260040283203125, -0.26990509033203125, -0.21380615234375, -0.15770721435546875, -0.1016082763671875, -0.04550933837890625, 0.010589599609375, 0.06668853759765625, 0.1227874755859375, 0.17888641357421875, 0.2349853515625, 0.29108428955078125, 0.3471832275390625, 0.40328216552734375, 0.459381103515625, 0.5154800415039062, 0.5715789794921875, 0.6276779174804688, 0.68377685546875, 0.7398757934570312, 0.7959747314453125, 0.8520736694335938, 0.908172607421875, 0.9642715454101562, 1.0203704833984375, 1.0764694213867188, 1.132568359375, 1.1886672973632812, 1.2447662353515625, 1.3008651733398438, 1.356964111328125, 1.4130630493164062, 1.4691619873046875, 1.5252609252929688, 1.58135986328125, 1.6374588012695312, 1.6935577392578125, 1.7496566772460938, 1.805755615234375, 1.8618545532226562, 1.9179534912109375, 1.9740524291992188, 2.0301513671875, 2.0862503051757812, 2.1423492431640625, 2.1984481811523438, 2.254547119140625, 2.3106460571289062, 2.3667449951171875, 2.4228439331054688, 2.47894287109375, 2.5350418090820312, 2.5911407470703125, 2.6472396850585938, 2.703338623046875, 2.7594375610351562, 2.8155364990234375, 2.8716354370117188, 2.927734375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 4.0, 8.0, 17.0, 20.0, 44.0, 64.0, 105.0, 309.0, 1338.0, 174080.0, 4014709.0, 2850.0, 464.0, 158.0, 57.0, 39.0, 14.0, 7.0, 4.0, 2.0, 1.0], "bins": [-45.6875, -44.82763671875, -43.9677734375, -43.10791015625, -42.248046875, -41.38818359375, -40.5283203125, -39.66845703125, -38.80859375, -37.94873046875, -37.0888671875, -36.22900390625, -35.369140625, -34.50927734375, -33.6494140625, -32.78955078125, -31.9296875, -31.06982421875, -30.2099609375, -29.35009765625, -28.490234375, -27.63037109375, -26.7705078125, -25.91064453125, -25.05078125, -24.19091796875, -23.3310546875, -22.47119140625, -21.611328125, -20.75146484375, -19.8916015625, -19.03173828125, -18.171875, -17.31201171875, -16.4521484375, -15.59228515625, -14.732421875, -13.87255859375, -13.0126953125, -12.15283203125, -11.29296875, -10.43310546875, -9.5732421875, -8.71337890625, -7.853515625, -6.99365234375, -6.1337890625, -5.27392578125, -4.4140625, -3.55419921875, -2.6943359375, -1.83447265625, -0.974609375, -0.11474609375, 0.7451171875, 1.60498046875, 2.46484375, 3.32470703125, 4.1845703125, 5.04443359375, 5.904296875, 6.76416015625, 7.6240234375, 8.48388671875, 9.34375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 19.0, 53.0, 178.0, 1628.0, 1954.0, 182.0, 49.0, 13.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.890625, -5.765350341796875, -5.64007568359375, -5.514801025390625, -5.3895263671875, -5.264251708984375, -5.13897705078125, -5.013702392578125, -4.888427734375, -4.763153076171875, -4.63787841796875, -4.512603759765625, -4.3873291015625, -4.262054443359375, -4.13677978515625, -4.011505126953125, -3.88623046875, -3.760955810546875, -3.63568115234375, -3.510406494140625, -3.3851318359375, -3.259857177734375, -3.13458251953125, -3.009307861328125, -2.884033203125, -2.758758544921875, -2.63348388671875, -2.508209228515625, -2.3829345703125, -2.257659912109375, -2.13238525390625, -2.007110595703125, -1.8818359375, -1.756561279296875, -1.63128662109375, -1.506011962890625, -1.3807373046875, -1.255462646484375, -1.13018798828125, -1.004913330078125, -0.879638671875, -0.754364013671875, -0.62908935546875, -0.503814697265625, -0.3785400390625, -0.253265380859375, -0.12799072265625, -0.002716064453125, 0.12255859375, 0.247833251953125, 0.37310791015625, 0.498382568359375, 0.6236572265625, 0.748931884765625, 0.87420654296875, 0.999481201171875, 1.124755859375, 1.250030517578125, 1.37530517578125, 1.500579833984375, 1.6258544921875, 1.751129150390625, 1.87640380859375, 2.001678466796875, 2.126953125]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 43.0, 281.0, 568.0, 95.0, 8.0, 8.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.83489990234375, -39.570491790771484, -38.306087493896484, -37.04167938232422, -35.77727127075195, -34.51286315917969, -33.24845886230469, -31.984050750732422, -30.71964454650879, -29.455238342285156, -28.19083023071289, -26.926424026489258, -25.662017822265625, -24.39760971069336, -23.133203506469727, -21.868797302246094, -20.604389190673828, -19.339982986450195, -18.07557487487793, -16.811168670654297, -15.546761512756348, -14.282354354858398, -13.017948150634766, -11.753540992736816, -10.489133834838867, -9.224726676940918, -7.960319995880127, -6.695913314819336, -5.431506156921387, -4.1670989990234375, -2.9026923179626465, -1.6382856369018555, -0.37387847900390625, 0.8905284404754639, 2.154935359954834, 3.419342279434204, 4.683749198913574, 5.948156356811523, 7.2125630378723145, 8.476969718933105, 9.741376876831055, 11.005784034729004, 12.270191192626953, 13.534597396850586, 14.799004554748535, 16.063411712646484, 17.327817916870117, 18.59222412109375, 19.856632232666016, 21.12103843688965, 22.385446548461914, 23.649852752685547, 24.914260864257812, 26.178667068481445, 27.443073272705078, 28.707481384277344, 29.971887588500977, 31.23629379272461, 32.500701904296875, 33.76511001586914, 35.02951431274414, 36.293922424316406, 37.55833053588867, 38.82273483276367, 40.08714294433594]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 7.0, 4.0, 17.0, 19.0, 25.0, 35.0, 49.0, 75.0, 68.0, 88.0, 76.0, 88.0, 86.0, 87.0, 72.0, 52.0, 54.0, 39.0, 24.0, 15.0, 11.0, 1.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.560365676879883, -5.338555812835693, -5.116746425628662, -4.894936561584473, -4.673127174377441, -4.451317310333252, -4.2295074462890625, -4.007698059082031, -3.785888433456421, -3.5640788078308105, -3.3422691822052, -3.12045955657959, -2.8986496925354004, -2.676840305328369, -2.4550304412841797, -2.2332208156585693, -2.011411190032959, -1.7896015644073486, -1.5677919387817383, -1.3459821939468384, -1.124172568321228, -0.9023629426956177, -0.6805531978607178, -0.4587435722351074, -0.23693394660949707, -0.015124291181564331, 0.2066853642463684, 0.42849504947662354, 0.6503046751022339, 0.8721143007278442, 1.0939240455627441, 1.3157336711883545, 1.5375432968139648, 1.7593529224395752, 1.9811625480651855, 2.202972412109375, 2.4247817993164062, 2.6465916633605957, 2.868401288986206, 3.0902109146118164, 3.3120205402374268, 3.533830165863037, 3.7556397914886475, 3.977449417114258, 4.199259281158447, 4.4210686683654785, 4.642878532409668, 4.864687919616699, 5.086497783660889, 5.308307647705078, 5.530117034912109, 5.751926898956299, 5.97373628616333, 6.1955461502075195, 6.417355537414551, 6.63916540145874, 6.86097526550293, 7.082785129547119, 7.30459451675415, 7.52640438079834, 7.748213768005371, 7.9700236320495605, 8.19183349609375, 8.413642883300781, 8.635452270507812]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 5.0, 10.0, 13.0, 11.0, 28.0, 31.0, 29.0, 34.0, 54.0, 78.0, 195.0, 599.0, 3379.0, 89944.0, 908519.0, 42500.0, 2234.0, 440.0, 164.0, 78.0, 69.0, 26.0, 36.0, 21.0, 12.0, 18.0, 8.0, 7.0, 7.0, 1.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.71875, -14.2781982421875, -13.837646484375, -13.3970947265625, -12.95654296875, -12.5159912109375, -12.075439453125, -11.6348876953125, -11.1943359375, -10.7537841796875, -10.313232421875, -9.8726806640625, -9.43212890625, -8.9915771484375, -8.551025390625, -8.1104736328125, -7.669921875, -7.2293701171875, -6.788818359375, -6.3482666015625, -5.90771484375, -5.4671630859375, -5.026611328125, -4.5860595703125, -4.1455078125, -3.7049560546875, -3.264404296875, -2.8238525390625, -2.38330078125, -1.9427490234375, -1.502197265625, -1.0616455078125, -0.62109375, -0.1805419921875, 0.260009765625, 0.7005615234375, 1.14111328125, 1.5816650390625, 2.022216796875, 2.4627685546875, 2.9033203125, 3.3438720703125, 3.784423828125, 4.2249755859375, 4.66552734375, 5.1060791015625, 5.546630859375, 5.9871826171875, 6.427734375, 6.8682861328125, 7.308837890625, 7.7493896484375, 8.18994140625, 8.6304931640625, 9.071044921875, 9.5115966796875, 9.9521484375, 10.3927001953125, 10.833251953125, 11.2738037109375, 11.71435546875, 12.1549072265625, 12.595458984375, 13.0360107421875, 13.4765625]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 6.0, 16.0, 24.0, 55.0, 67.0, 101.0, 138.0, 172.0, 153.0, 122.0, 71.0, 53.0, 18.0, 7.0, 5.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.60791015625, -0.5553207397460938, -0.5027313232421875, -0.45014190673828125, -0.397552490234375, -0.34496307373046875, -0.2923736572265625, -0.23978424072265625, -0.18719482421875, -0.13460540771484375, -0.0820159912109375, -0.02942657470703125, 0.023162841796875, 0.07575225830078125, 0.1283416748046875, 0.18093109130859375, 0.2335205078125, 0.28610992431640625, 0.3386993408203125, 0.39128875732421875, 0.443878173828125, 0.49646759033203125, 0.5490570068359375, 0.6016464233398438, 0.65423583984375, 0.7068252563476562, 0.7594146728515625, 0.8120040893554688, 0.864593505859375, 0.9171829223632812, 0.9697723388671875, 1.0223617553710938, 1.074951171875, 1.1275405883789062, 1.1801300048828125, 1.2327194213867188, 1.285308837890625, 1.3378982543945312, 1.3904876708984375, 1.4430770874023438, 1.49566650390625, 1.5482559204101562, 1.6008453369140625, 1.6534347534179688, 1.706024169921875, 1.7586135864257812, 1.8112030029296875, 1.8637924194335938, 1.9163818359375, 1.9689712524414062, 2.0215606689453125, 2.0741500854492188, 2.126739501953125, 2.1793289184570312, 2.2319183349609375, 2.2845077514648438, 2.33709716796875, 2.3896865844726562, 2.4422760009765625, 2.4948654174804688, 2.547454833984375, 2.6000442504882812, 2.6526336669921875, 2.7052230834960938, 2.7578125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 9.0, 10.0, 13.0, 18.0, 29.0, 49.0, 78.0, 119.0, 224.0, 373.0, 724.0, 1493.0, 3337.0, 9492.0, 35100.0, 185494.0, 549534.0, 206647.0, 38663.0, 10219.0, 3676.0, 1506.0, 762.0, 427.0, 216.0, 132.0, 83.0, 42.0, 29.0, 26.0, 11.0, 13.0, 5.0, 0.0, 5.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1484375, -5.0035400390625, -4.858642578125, -4.7137451171875, -4.56884765625, -4.4239501953125, -4.279052734375, -4.1341552734375, -3.9892578125, -3.8443603515625, -3.699462890625, -3.5545654296875, -3.40966796875, -3.2647705078125, -3.119873046875, -2.9749755859375, -2.830078125, -2.6851806640625, -2.540283203125, -2.3953857421875, -2.25048828125, -2.1055908203125, -1.960693359375, -1.8157958984375, -1.6708984375, -1.5260009765625, -1.381103515625, -1.2362060546875, -1.09130859375, -0.9464111328125, -0.801513671875, -0.6566162109375, -0.51171875, -0.3668212890625, -0.221923828125, -0.0770263671875, 0.06787109375, 0.2127685546875, 0.357666015625, 0.5025634765625, 0.6474609375, 0.7923583984375, 0.937255859375, 1.0821533203125, 1.22705078125, 1.3719482421875, 1.516845703125, 1.6617431640625, 1.806640625, 1.9515380859375, 2.096435546875, 2.2413330078125, 2.38623046875, 2.5311279296875, 2.676025390625, 2.8209228515625, 2.9658203125, 3.1107177734375, 3.255615234375, 3.4005126953125, 3.54541015625, 3.6903076171875, 3.835205078125, 3.9801025390625, 4.125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 8.0, 1.0, 5.0, 9.0, 4.0, 12.0, 8.0, 14.0, 17.0, 23.0, 26.0, 33.0, 39.0, 44.0, 40.0, 56.0, 47.0, 50.0, 52.0, 44.0, 52.0, 66.0, 40.0, 45.0, 48.0, 31.0, 29.0, 38.0, 25.0, 27.0, 18.0, 14.0, 8.0, 9.0, 5.0, 7.0, 8.0, 2.0, 3.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.46875, -2.3671875, -2.265625, -2.1640625, -2.0625, -1.9609375, -1.859375, -1.7578125, -1.65625, -1.5546875, -1.453125, -1.3515625, -1.25, -1.1484375, -1.046875, -0.9453125, -0.84375, -0.7421875, -0.640625, -0.5390625, -0.4375, -0.3359375, -0.234375, -0.1328125, -0.03125, 0.0703125, 0.171875, 0.2734375, 0.375, 0.4765625, 0.578125, 0.6796875, 0.78125, 0.8828125, 0.984375, 1.0859375, 1.1875, 1.2890625, 1.390625, 1.4921875, 1.59375, 1.6953125, 1.796875, 1.8984375, 2.0, 2.1015625, 2.203125, 2.3046875, 2.40625, 2.5078125, 2.609375, 2.7109375, 2.8125, 2.9140625, 3.015625, 3.1171875, 3.21875, 3.3203125, 3.421875, 3.5234375, 3.625, 3.7265625, 3.828125, 3.9296875, 4.03125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 7.0, 5.0, 8.0, 16.0, 20.0, 47.0, 50.0, 84.0, 117.0, 219.0, 381.0, 722.0, 1515.0, 3417.0, 9580.0, 33194.0, 142964.0, 437933.0, 310798.0, 77121.0, 19292.0, 6237.0, 2448.0, 1100.0, 521.0, 302.0, 161.0, 94.0, 62.0, 52.0, 29.0, 20.0, 9.0, 10.0, 7.0, 3.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.54296875, -1.4893798828125, -1.435791015625, -1.3822021484375, -1.32861328125, -1.2750244140625, -1.221435546875, -1.1678466796875, -1.1142578125, -1.0606689453125, -1.007080078125, -0.9534912109375, -0.89990234375, -0.8463134765625, -0.792724609375, -0.7391357421875, -0.685546875, -0.6319580078125, -0.578369140625, -0.5247802734375, -0.47119140625, -0.4176025390625, -0.364013671875, -0.3104248046875, -0.2568359375, -0.2032470703125, -0.149658203125, -0.0960693359375, -0.04248046875, 0.0111083984375, 0.064697265625, 0.1182861328125, 0.171875, 0.2254638671875, 0.279052734375, 0.3326416015625, 0.38623046875, 0.4398193359375, 0.493408203125, 0.5469970703125, 0.6005859375, 0.6541748046875, 0.707763671875, 0.7613525390625, 0.81494140625, 0.8685302734375, 0.922119140625, 0.9757080078125, 1.029296875, 1.0828857421875, 1.136474609375, 1.1900634765625, 1.24365234375, 1.2972412109375, 1.350830078125, 1.4044189453125, 1.4580078125, 1.5115966796875, 1.565185546875, 1.6187744140625, 1.67236328125, 1.7259521484375, 1.779541015625, 1.8331298828125, 1.88671875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 5.0, 6.0, 7.0, 5.0, 11.0, 9.0, 13.0, 15.0, 15.0, 11.0, 21.0, 30.0, 48.0, 43.0, 60.0, 51.0, 61.0, 62.0, 69.0, 81.0, 62.0, 41.0, 49.0, 42.0, 31.0, 21.0, 27.0, 19.0, 21.0, 22.0, 6.0, 4.0, 5.0, 12.0, 3.0, 2.0, 3.0, 5.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.0002663135528564453, -0.0002582930028438568, -0.0002502724528312683, -0.0002422519028186798, -0.0002342313528060913, -0.0002262108027935028, -0.0002181902527809143, -0.0002101697027683258, -0.0002021491527557373, -0.0001941286027431488, -0.0001861080527305603, -0.0001780875027179718, -0.0001700669527053833, -0.0001620464026927948, -0.0001540258526802063, -0.0001460053026676178, -0.0001379847526550293, -0.0001299642026424408, -0.0001219436526298523, -0.0001139231026172638, -0.00010590255260467529, -9.788200259208679e-05, -8.986145257949829e-05, -8.184090256690979e-05, -7.382035255432129e-05, -6.579980254173279e-05, -5.777925252914429e-05, -4.9758702516555786e-05, -4.1738152503967285e-05, -3.3717602491378784e-05, -2.5697052478790283e-05, -1.7676502466201782e-05, -9.655952453613281e-06, -1.6354024410247803e-06, 6.385147571563721e-06, 1.4405697584152222e-05, 2.2426247596740723e-05, 3.0446797609329224e-05, 3.8467347621917725e-05, 4.6487897634506226e-05, 5.4508447647094727e-05, 6.252899765968323e-05, 7.054954767227173e-05, 7.857009768486023e-05, 8.659064769744873e-05, 9.461119771003723e-05, 0.00010263174772262573, 0.00011065229773521423, 0.00011867284774780273, 0.00012669339776039124, 0.00013471394777297974, 0.00014273449778556824, 0.00015075504779815674, 0.00015877559781074524, 0.00016679614782333374, 0.00017481669783592224, 0.00018283724784851074, 0.00019085779786109924, 0.00019887834787368774, 0.00020689889788627625, 0.00021491944789886475, 0.00022293999791145325, 0.00023096054792404175, 0.00023898109793663025, 0.00024700164794921875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 0.0, 6.0, 6.0, 12.0, 9.0, 18.0, 33.0, 47.0, 66.0, 93.0, 163.0, 280.0, 605.0, 1133.0, 2531.0, 6438.0, 20781.0, 89000.0, 392733.0, 406554.0, 94382.0, 21773.0, 6713.0, 2592.0, 1219.0, 586.0, 305.0, 186.0, 100.0, 68.0, 40.0, 31.0, 26.0, 7.0, 10.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8212890625, -1.764404296875, -1.70751953125, -1.650634765625, -1.59375, -1.536865234375, -1.47998046875, -1.423095703125, -1.3662109375, -1.309326171875, -1.25244140625, -1.195556640625, -1.138671875, -1.081787109375, -1.02490234375, -0.968017578125, -0.9111328125, -0.854248046875, -0.79736328125, -0.740478515625, -0.68359375, -0.626708984375, -0.56982421875, -0.512939453125, -0.4560546875, -0.399169921875, -0.34228515625, -0.285400390625, -0.228515625, -0.171630859375, -0.11474609375, -0.057861328125, -0.0009765625, 0.055908203125, 0.11279296875, 0.169677734375, 0.2265625, 0.283447265625, 0.34033203125, 0.397216796875, 0.4541015625, 0.510986328125, 0.56787109375, 0.624755859375, 0.681640625, 0.738525390625, 0.79541015625, 0.852294921875, 0.9091796875, 0.966064453125, 1.02294921875, 1.079833984375, 1.13671875, 1.193603515625, 1.25048828125, 1.307373046875, 1.3642578125, 1.421142578125, 1.47802734375, 1.534912109375, 1.591796875, 1.648681640625, 1.70556640625, 1.762451171875, 1.8193359375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 2.0, 7.0, 11.0, 9.0, 16.0, 17.0, 16.0, 34.0, 32.0, 55.0, 65.0, 68.0, 72.0, 79.0, 72.0, 84.0, 67.0, 58.0, 38.0, 48.0, 32.0, 25.0, 19.0, 22.0, 14.0, 14.0, 4.0, 3.0, 3.0, 7.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.38671875, -1.34735107421875, -1.3079833984375, -1.26861572265625, -1.229248046875, -1.18988037109375, -1.1505126953125, -1.11114501953125, -1.07177734375, -1.03240966796875, -0.9930419921875, -0.95367431640625, -0.914306640625, -0.87493896484375, -0.8355712890625, -0.79620361328125, -0.7568359375, -0.71746826171875, -0.6781005859375, -0.63873291015625, -0.599365234375, -0.55999755859375, -0.5206298828125, -0.48126220703125, -0.44189453125, -0.40252685546875, -0.3631591796875, -0.32379150390625, -0.284423828125, -0.24505615234375, -0.2056884765625, -0.16632080078125, -0.126953125, -0.08758544921875, -0.0482177734375, -0.00885009765625, 0.030517578125, 0.06988525390625, 0.1092529296875, 0.14862060546875, 0.18798828125, 0.22735595703125, 0.2667236328125, 0.30609130859375, 0.345458984375, 0.38482666015625, 0.4241943359375, 0.46356201171875, 0.5029296875, 0.54229736328125, 0.5816650390625, 0.62103271484375, 0.660400390625, 0.69976806640625, 0.7391357421875, 0.77850341796875, 0.81787109375, 0.85723876953125, 0.8966064453125, 0.93597412109375, 0.975341796875, 1.01470947265625, 1.0540771484375, 1.09344482421875, 1.1328125]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 8.0, 7.0, 17.0, 30.0, 35.0, 93.0, 129.0, 163.0, 170.0, 145.0, 87.0, 55.0, 19.0, 13.0, 11.0, 9.0, 3.0, 1.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.135120391845703, -19.182296752929688, -18.22947120666504, -17.276647567749023, -16.323822021484375, -15.37099838256836, -14.418173789978027, -13.465349197387695, -12.51252555847168, -11.559700965881348, -10.606876373291016, -9.654052734375, -8.701228141784668, -7.748403549194336, -6.795578956604004, -5.84275484085083, -4.88992977142334, -3.937105417251587, -2.984281063079834, -2.031456470489502, -1.078632116317749, -0.1258077621459961, 0.8270168304443359, 1.7798409461975098, 2.732665538787842, 3.6854898929595947, 4.638314247131348, 5.59113883972168, 6.543963432312012, 7.4967875480651855, 8.44961166381836, 9.402436256408691, 10.355260848999023, 11.308085441589355, 12.260910034179688, 13.213733673095703, 14.166558265686035, 15.119382858276367, 16.072208404541016, 17.02503204345703, 17.977855682373047, 18.930679321289062, 19.88350486755371, 20.836328506469727, 21.789154052734375, 22.74197769165039, 23.694801330566406, 24.647626876831055, 25.600452423095703, 26.55327606201172, 27.506101608276367, 28.458925247192383, 29.41175079345703, 30.364574432373047, 31.317398071289062, 32.27022171020508, 33.223045349121094, 34.17586898803711, 35.128692626953125, 36.081520080566406, 37.03434371948242, 37.98716735839844, 38.93999099731445, 39.89281463623047, 40.84564208984375]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 10.0, 3.0, 7.0, 8.0, 9.0, 12.0, 10.0, 14.0, 21.0, 17.0, 30.0, 29.0, 39.0, 38.0, 36.0, 39.0, 36.0, 57.0, 37.0, 56.0, 55.0, 47.0, 47.0, 46.0, 50.0, 25.0, 31.0, 24.0, 29.0, 20.0, 27.0, 17.0, 13.0, 8.0, 10.0, 7.0, 13.0, 7.0, 1.0, 4.0, 6.0, 1.0, 5.0, 1.0, 0.0, 3.0], "bins": [-18.54563331604004, -18.051284790039062, -17.55693817138672, -17.062589645385742, -16.5682430267334, -16.073894500732422, -15.579546928405762, -15.085199356079102, -14.590851783752441, -14.096504211425781, -13.602156639099121, -13.107809066772461, -12.613460540771484, -12.11911392211914, -11.624765396118164, -11.130417823791504, -10.636070251464844, -10.141722679138184, -9.647375106811523, -9.153027534484863, -8.658679962158203, -8.164331436157227, -7.669983863830566, -7.175636291503906, -6.681288719177246, -6.186941146850586, -5.692593574523926, -5.198245525360107, -4.703897953033447, -4.209550380706787, -3.715202569961548, -3.2208547592163086, -2.7265071868896484, -2.2321596145629883, -1.737811803817749, -1.2434641122817993, -0.7491164207458496, -0.25476884841918945, 0.2395789623260498, 0.7339267730712891, 1.2282743453979492, 1.722622036933899, 2.2169697284698486, 2.711317539215088, 3.205665111541748, 3.700012683868408, 4.194360733032227, 4.688708305358887, 5.183055877685547, 5.677403450012207, 6.171751022338867, 6.6660990715026855, 7.160446643829346, 7.654794216156006, 8.149142265319824, 8.643489837646484, 9.137837409973145, 9.632184982299805, 10.126532554626465, 10.620880126953125, 11.115228652954102, 11.609575271606445, 12.103923797607422, 12.598271369934082, 13.092618942260742]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [4.0, 0.0, 3.0, 8.0, 11.0, 32.0, 60.0, 131.0, 323.0, 1017.0, 3419.0, 19906.0, 404608.0, 3707718.0, 48630.0, 5630.0, 1407.0, 518.0, 263.0, 150.0, 73.0, 59.0, 48.0, 47.0, 33.0, 27.0, 23.0, 24.0, 16.0, 20.0, 15.0, 11.0, 15.0, 8.0, 5.0, 3.0, 6.0, 10.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.265625, -3.942626953125, -3.61962890625, -3.296630859375, -2.9736328125, -2.650634765625, -2.32763671875, -2.004638671875, -1.681640625, -1.358642578125, -1.03564453125, -0.712646484375, -0.3896484375, -0.066650390625, 0.25634765625, 0.579345703125, 0.90234375, 1.225341796875, 1.54833984375, 1.871337890625, 2.1943359375, 2.517333984375, 2.84033203125, 3.163330078125, 3.486328125, 3.809326171875, 4.13232421875, 4.455322265625, 4.7783203125, 5.101318359375, 5.42431640625, 5.747314453125, 6.0703125, 6.393310546875, 6.71630859375, 7.039306640625, 7.3623046875, 7.685302734375, 8.00830078125, 8.331298828125, 8.654296875, 8.977294921875, 9.30029296875, 9.623291015625, 9.9462890625, 10.269287109375, 10.59228515625, 10.915283203125, 11.23828125, 11.561279296875, 11.88427734375, 12.207275390625, 12.5302734375, 12.853271484375, 13.17626953125, 13.499267578125, 13.822265625, 14.145263671875, 14.46826171875, 14.791259765625, 15.1142578125, 15.437255859375, 15.76025390625, 16.083251953125, 16.40625]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [4.0, 0.0, 3.0, 8.0, 20.0, 35.0, 42.0, 82.0, 116.0, 140.0, 153.0, 134.0, 132.0, 56.0, 50.0, 31.0, 8.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.54931640625, -0.49654388427734375, -0.4437713623046875, -0.39099884033203125, -0.338226318359375, -0.28545379638671875, -0.2326812744140625, -0.17990875244140625, -0.12713623046875, -0.07436370849609375, -0.0215911865234375, 0.03118133544921875, 0.083953857421875, 0.13672637939453125, 0.1894989013671875, 0.24227142333984375, 0.2950439453125, 0.34781646728515625, 0.4005889892578125, 0.45336151123046875, 0.506134033203125, 0.5589065551757812, 0.6116790771484375, 0.6644515991210938, 0.71722412109375, 0.7699966430664062, 0.8227691650390625, 0.8755416870117188, 0.928314208984375, 0.9810867309570312, 1.0338592529296875, 1.0866317749023438, 1.139404296875, 1.1921768188476562, 1.2449493408203125, 1.2977218627929688, 1.350494384765625, 1.4032669067382812, 1.4560394287109375, 1.5088119506835938, 1.56158447265625, 1.6143569946289062, 1.6671295166015625, 1.7199020385742188, 1.772674560546875, 1.8254470825195312, 1.8782196044921875, 1.9309921264648438, 1.9837646484375, 2.0365371704101562, 2.0893096923828125, 2.1420822143554688, 2.194854736328125, 2.2476272583007812, 2.3003997802734375, 2.3531723022460938, 2.40594482421875, 2.4587173461914062, 2.5114898681640625, 2.5642623901367188, 2.617034912109375, 2.6698074340820312, 2.7225799560546875, 2.7753524780273438, 2.828125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 14.0, 16.0, 24.0, 40.0, 48.0, 93.0, 206.0, 461.0, 1183.0, 4725.0, 101153.0, 4069954.0, 12611.0, 2331.0, 724.0, 322.0, 147.0, 83.0, 44.0, 27.0, 18.0, 18.0, 10.0, 9.0, 12.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-35.375, -34.51708984375, -33.6591796875, -32.80126953125, -31.943359375, -31.08544921875, -30.2275390625, -29.36962890625, -28.51171875, -27.65380859375, -26.7958984375, -25.93798828125, -25.080078125, -24.22216796875, -23.3642578125, -22.50634765625, -21.6484375, -20.79052734375, -19.9326171875, -19.07470703125, -18.216796875, -17.35888671875, -16.5009765625, -15.64306640625, -14.78515625, -13.92724609375, -13.0693359375, -12.21142578125, -11.353515625, -10.49560546875, -9.6376953125, -8.77978515625, -7.921875, -7.06396484375, -6.2060546875, -5.34814453125, -4.490234375, -3.63232421875, -2.7744140625, -1.91650390625, -1.05859375, -0.20068359375, 0.6572265625, 1.51513671875, 2.373046875, 3.23095703125, 4.0888671875, 4.94677734375, 5.8046875, 6.66259765625, 7.5205078125, 8.37841796875, 9.236328125, 10.09423828125, 10.9521484375, 11.81005859375, 12.66796875, 13.52587890625, 14.3837890625, 15.24169921875, 16.099609375, 16.95751953125, 17.8154296875, 18.67333984375, 19.53125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 2.0, 8.0, 15.0, 92.0, 515.0, 2913.0, 393.0, 90.0, 22.0, 5.0, 7.0, 6.0, 5.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.61328125, -5.38360595703125, -5.1539306640625, -4.92425537109375, -4.694580078125, -4.46490478515625, -4.2352294921875, -4.00555419921875, -3.77587890625, -3.54620361328125, -3.3165283203125, -3.08685302734375, -2.857177734375, -2.62750244140625, -2.3978271484375, -2.16815185546875, -1.9384765625, -1.70880126953125, -1.4791259765625, -1.24945068359375, -1.019775390625, -0.79010009765625, -0.5604248046875, -0.33074951171875, -0.10107421875, 0.12860107421875, 0.3582763671875, 0.58795166015625, 0.817626953125, 1.04730224609375, 1.2769775390625, 1.50665283203125, 1.736328125, 1.96600341796875, 2.1956787109375, 2.42535400390625, 2.655029296875, 2.88470458984375, 3.1143798828125, 3.34405517578125, 3.57373046875, 3.80340576171875, 4.0330810546875, 4.26275634765625, 4.492431640625, 4.72210693359375, 4.9517822265625, 5.18145751953125, 5.4111328125, 5.64080810546875, 5.8704833984375, 6.10015869140625, 6.329833984375, 6.55950927734375, 6.7891845703125, 7.01885986328125, 7.24853515625, 7.47821044921875, 7.7078857421875, 7.93756103515625, 8.167236328125, 8.39691162109375, 8.6265869140625, 8.85626220703125, 9.0859375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 11.0, 43.0, 96.0, 237.0, 309.0, 170.0, 66.0, 35.0, 7.0, 12.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-38.66364669799805, -37.467140197753906, -36.2706298828125, -35.07412338256836, -33.87761688232422, -32.68111038208008, -31.484601974487305, -30.28809356689453, -29.09158706665039, -27.89508056640625, -26.698572158813477, -25.502063751220703, -24.305557250976562, -23.109050750732422, -21.91254234313965, -20.716033935546875, -19.519527435302734, -18.323020935058594, -17.12651252746582, -15.930005073547363, -14.733497619628906, -13.53699016571045, -12.340482711791992, -11.143975257873535, -9.947467803955078, -8.750960350036621, -7.554452896118164, -6.357945442199707, -5.16143798828125, -3.964930534362793, -2.768423080444336, -1.571915626525879, -0.3754081726074219, 0.8210992813110352, 2.017606735229492, 3.214114189147949, 4.410621643066406, 5.607129096984863, 6.80363655090332, 8.000144004821777, 9.196651458740234, 10.393158912658691, 11.589666366577148, 12.786173820495605, 13.982681274414062, 15.17918872833252, 16.375696182250977, 17.57220458984375, 18.76871109008789, 19.96521759033203, 21.161725997924805, 22.358234405517578, 23.55474090576172, 24.75124740600586, 25.947755813598633, 27.144264221191406, 28.340770721435547, 29.537277221679688, 30.73378562927246, 31.930294036865234, 33.126800537109375, 34.323307037353516, 35.519813537597656, 36.71632385253906, 37.9128303527832]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 7.0, 4.0, 16.0, 27.0, 34.0, 55.0, 60.0, 88.0, 79.0, 102.0, 117.0, 80.0, 96.0, 73.0, 56.0, 34.0, 31.0, 18.0, 11.0, 5.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.972763061523438, -18.469802856445312, -17.966842651367188, -17.463882446289062, -16.960922241210938, -16.457962036132812, -15.955002784729004, -15.452042579650879, -14.949082374572754, -14.446122169494629, -13.943161964416504, -13.440201759338379, -12.93724250793457, -12.434282302856445, -11.93132209777832, -11.428361892700195, -10.92540168762207, -10.422441482543945, -9.91948127746582, -9.416521072387695, -8.91356086730957, -8.410600662231445, -7.907641410827637, -7.404681205749512, -6.901721000671387, -6.398760795593262, -5.895800590515137, -5.39284086227417, -4.889880657196045, -4.38692045211792, -3.883960485458374, -3.381000518798828, -2.8780384063720703, -2.3750782012939453, -1.8721182346343994, -1.369158148765564, -0.8661980628967285, -0.3632378578186035, 0.13972210884094238, 0.6426820755004883, 1.1456422805786133, 1.6486023664474487, 2.151562452316284, 2.65452241897583, 3.157482624053955, 3.66044282913208, 4.163402557373047, 4.666362762451172, 5.169322967529297, 5.672283172607422, 6.175243377685547, 6.678203105926514, 7.181163311004639, 7.684123516082764, 8.18708324432373, 8.690043449401855, 9.19300365447998, 9.695963859558105, 10.19892406463623, 10.701884269714355, 11.204843521118164, 11.707803726196289, 12.210763931274414, 12.713724136352539, 13.216684341430664]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 6.0, 8.0, 7.0, 21.0, 22.0, 30.0, 27.0, 38.0, 45.0, 72.0, 122.0, 176.0, 290.0, 527.0, 1067.0, 3188.0, 14782.0, 132103.0, 711772.0, 161088.0, 16924.0, 3512.0, 1250.0, 559.0, 312.0, 172.0, 133.0, 81.0, 56.0, 35.0, 42.0, 24.0, 22.0, 16.0, 10.0, 8.0, 3.0, 4.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.90234375, -7.63482666015625, -7.3673095703125, -7.09979248046875, -6.832275390625, -6.56475830078125, -6.2972412109375, -6.02972412109375, -5.76220703125, -5.49468994140625, -5.2271728515625, -4.95965576171875, -4.692138671875, -4.42462158203125, -4.1571044921875, -3.88958740234375, -3.6220703125, -3.35455322265625, -3.0870361328125, -2.81951904296875, -2.552001953125, -2.28448486328125, -2.0169677734375, -1.74945068359375, -1.48193359375, -1.21441650390625, -0.9468994140625, -0.67938232421875, -0.411865234375, -0.14434814453125, 0.1231689453125, 0.39068603515625, 0.658203125, 0.92572021484375, 1.1932373046875, 1.46075439453125, 1.728271484375, 1.99578857421875, 2.2633056640625, 2.53082275390625, 2.79833984375, 3.06585693359375, 3.3333740234375, 3.60089111328125, 3.868408203125, 4.13592529296875, 4.4034423828125, 4.67095947265625, 4.9384765625, 5.20599365234375, 5.4735107421875, 5.74102783203125, 6.008544921875, 6.27606201171875, 6.5435791015625, 6.81109619140625, 7.07861328125, 7.34613037109375, 7.6136474609375, 7.88116455078125, 8.148681640625, 8.41619873046875, 8.6837158203125, 8.95123291015625, 9.21875]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 10.0, 15.0, 39.0, 44.0, 64.0, 82.0, 123.0, 131.0, 122.0, 103.0, 100.0, 68.0, 47.0, 24.0, 15.0, 10.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.90478515625, -0.8571395874023438, -0.8094940185546875, -0.7618484497070312, -0.714202880859375, -0.6665573120117188, -0.6189117431640625, -0.5712661743164062, -0.52362060546875, -0.47597503662109375, -0.4283294677734375, -0.38068389892578125, -0.333038330078125, -0.28539276123046875, -0.2377471923828125, -0.19010162353515625, -0.1424560546875, -0.09481048583984375, -0.0471649169921875, 0.00048065185546875, 0.048126220703125, 0.09577178955078125, 0.1434173583984375, 0.19106292724609375, 0.23870849609375, 0.28635406494140625, 0.3339996337890625, 0.38164520263671875, 0.429290771484375, 0.47693634033203125, 0.5245819091796875, 0.5722274780273438, 0.619873046875, 0.6675186157226562, 0.7151641845703125, 0.7628097534179688, 0.810455322265625, 0.8581008911132812, 0.9057464599609375, 0.9533920288085938, 1.00103759765625, 1.0486831665039062, 1.0963287353515625, 1.1439743041992188, 1.191619873046875, 1.2392654418945312, 1.2869110107421875, 1.3345565795898438, 1.3822021484375, 1.4298477172851562, 1.4774932861328125, 1.5251388549804688, 1.572784423828125, 1.6204299926757812, 1.6680755615234375, 1.7157211303710938, 1.76336669921875, 1.8110122680664062, 1.8586578369140625, 1.9063034057617188, 1.953948974609375, 2.0015945434570312, 2.0492401123046875, 2.0968856811523438, 2.14453125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 5.0, 5.0, 6.0, 12.0, 18.0, 11.0, 24.0, 30.0, 45.0, 53.0, 86.0, 93.0, 127.0, 184.0, 284.0, 462.0, 820.0, 1399.0, 2613.0, 5186.0, 11003.0, 25117.0, 61118.0, 150282.0, 298560.0, 272638.0, 126500.0, 51102.0, 21183.0, 9493.0, 4506.0, 2268.0, 1268.0, 701.0, 417.0, 276.0, 196.0, 142.0, 81.0, 64.0, 45.0, 27.0, 35.0, 17.0, 18.0, 18.0, 8.0, 3.0, 5.0, 6.0, 1.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.294921875, -2.218170166015625, -2.14141845703125, -2.064666748046875, -1.9879150390625, -1.911163330078125, -1.83441162109375, -1.757659912109375, -1.680908203125, -1.604156494140625, -1.52740478515625, -1.450653076171875, -1.3739013671875, -1.297149658203125, -1.22039794921875, -1.143646240234375, -1.06689453125, -0.990142822265625, -0.91339111328125, -0.836639404296875, -0.7598876953125, -0.683135986328125, -0.60638427734375, -0.529632568359375, -0.452880859375, -0.376129150390625, -0.29937744140625, -0.222625732421875, -0.1458740234375, -0.069122314453125, 0.00762939453125, 0.084381103515625, 0.1611328125, 0.237884521484375, 0.31463623046875, 0.391387939453125, 0.4681396484375, 0.544891357421875, 0.62164306640625, 0.698394775390625, 0.775146484375, 0.851898193359375, 0.92864990234375, 1.005401611328125, 1.0821533203125, 1.158905029296875, 1.23565673828125, 1.312408447265625, 1.38916015625, 1.465911865234375, 1.54266357421875, 1.619415283203125, 1.6961669921875, 1.772918701171875, 1.84967041015625, 1.926422119140625, 2.003173828125, 2.079925537109375, 2.15667724609375, 2.233428955078125, 2.3101806640625, 2.386932373046875, 2.46368408203125, 2.540435791015625, 2.6171875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 8.0, 11.0, 4.0, 9.0, 9.0, 9.0, 10.0, 11.0, 13.0, 19.0, 23.0, 27.0, 36.0, 32.0, 26.0, 53.0, 43.0, 41.0, 45.0, 51.0, 47.0, 46.0, 50.0, 43.0, 37.0, 44.0, 34.0, 24.0, 32.0, 33.0, 28.0, 14.0, 19.0, 15.0, 10.0, 11.0, 8.0, 8.0, 2.0, 10.0, 6.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2109375, -2.128082275390625, -2.04522705078125, -1.962371826171875, -1.8795166015625, -1.796661376953125, -1.71380615234375, -1.630950927734375, -1.548095703125, -1.465240478515625, -1.38238525390625, -1.299530029296875, -1.2166748046875, -1.133819580078125, -1.05096435546875, -0.968109130859375, -0.88525390625, -0.802398681640625, -0.71954345703125, -0.636688232421875, -0.5538330078125, -0.470977783203125, -0.38812255859375, -0.305267333984375, -0.222412109375, -0.139556884765625, -0.05670166015625, 0.026153564453125, 0.1090087890625, 0.191864013671875, 0.27471923828125, 0.357574462890625, 0.4404296875, 0.523284912109375, 0.60614013671875, 0.688995361328125, 0.7718505859375, 0.854705810546875, 0.93756103515625, 1.020416259765625, 1.103271484375, 1.186126708984375, 1.26898193359375, 1.351837158203125, 1.4346923828125, 1.517547607421875, 1.60040283203125, 1.683258056640625, 1.76611328125, 1.848968505859375, 1.93182373046875, 2.014678955078125, 2.0975341796875, 2.180389404296875, 2.26324462890625, 2.346099853515625, 2.428955078125, 2.511810302734375, 2.59466552734375, 2.677520751953125, 2.7603759765625, 2.843231201171875, 2.92608642578125, 3.008941650390625, 3.091796875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 6.0, 8.0, 11.0, 11.0, 9.0, 23.0, 21.0, 40.0, 41.0, 66.0, 125.0, 172.0, 348.0, 646.0, 1276.0, 2746.0, 6369.0, 17335.0, 58868.0, 240193.0, 472284.0, 180125.0, 43883.0, 13897.0, 5305.0, 2317.0, 1083.0, 546.0, 289.0, 173.0, 102.0, 70.0, 43.0, 33.0, 28.0, 24.0, 11.0, 9.0, 4.0, 9.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.025390625, -1.96087646484375, -1.8963623046875, -1.83184814453125, -1.767333984375, -1.70281982421875, -1.6383056640625, -1.57379150390625, -1.50927734375, -1.44476318359375, -1.3802490234375, -1.31573486328125, -1.251220703125, -1.18670654296875, -1.1221923828125, -1.05767822265625, -0.9931640625, -0.92864990234375, -0.8641357421875, -0.79962158203125, -0.735107421875, -0.67059326171875, -0.6060791015625, -0.54156494140625, -0.47705078125, -0.41253662109375, -0.3480224609375, -0.28350830078125, -0.218994140625, -0.15447998046875, -0.0899658203125, -0.02545166015625, 0.0390625, 0.10357666015625, 0.1680908203125, 0.23260498046875, 0.297119140625, 0.36163330078125, 0.4261474609375, 0.49066162109375, 0.55517578125, 0.61968994140625, 0.6842041015625, 0.74871826171875, 0.813232421875, 0.87774658203125, 0.9422607421875, 1.00677490234375, 1.0712890625, 1.13580322265625, 1.2003173828125, 1.26483154296875, 1.329345703125, 1.39385986328125, 1.4583740234375, 1.52288818359375, 1.58740234375, 1.65191650390625, 1.7164306640625, 1.78094482421875, 1.845458984375, 1.90997314453125, 1.9744873046875, 2.03900146484375, 2.103515625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 9.0, 3.0, 19.0, 2.0, 5.0, 17.0, 13.0, 16.0, 18.0, 19.0, 28.0, 29.0, 36.0, 53.0, 68.0, 85.0, 104.0, 98.0, 79.0, 55.0, 47.0, 39.0, 33.0, 18.0, 24.0, 13.0, 12.0, 10.0, 8.0, 9.0, 10.0, 7.0, 3.0, 4.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00024771690368652344, -0.000238809734582901, -0.00022990256547927856, -0.00022099539637565613, -0.0002120882272720337, -0.00020318105816841125, -0.00019427388906478882, -0.00018536671996116638, -0.00017645955085754395, -0.0001675523817539215, -0.00015864521265029907, -0.00014973804354667664, -0.0001408308744430542, -0.00013192370533943176, -0.00012301653623580933, -0.00011410936713218689, -0.00010520219802856445, -9.629502892494202e-05, -8.738785982131958e-05, -7.848069071769714e-05, -6.957352161407471e-05, -6.066635251045227e-05, -5.1759183406829834e-05, -4.28520143032074e-05, -3.394484519958496e-05, -2.5037676095962524e-05, -1.6130506992340088e-05, -7.223337888717651e-06, 1.6838312149047852e-06, 1.0591000318527222e-05, 1.9498169422149658e-05, 2.8405338525772095e-05, 3.731250762939453e-05, 4.621967673301697e-05, 5.5126845836639404e-05, 6.403401494026184e-05, 7.294118404388428e-05, 8.184835314750671e-05, 9.075552225112915e-05, 9.966269135475159e-05, 0.00010856986045837402, 0.00011747702956199646, 0.0001263841986656189, 0.00013529136776924133, 0.00014419853687286377, 0.0001531057059764862, 0.00016201287508010864, 0.00017092004418373108, 0.00017982721328735352, 0.00018873438239097595, 0.0001976415514945984, 0.00020654872059822083, 0.00021545588970184326, 0.0002243630588054657, 0.00023327022790908813, 0.00024217739701271057, 0.000251084566116333, 0.00025999173521995544, 0.0002688989043235779, 0.0002778060734272003, 0.00028671324253082275, 0.0002956204116344452, 0.0003045275807380676, 0.00031343474984169006, 0.0003223419189453125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 9.0, 12.0, 15.0, 23.0, 22.0, 52.0, 54.0, 97.0, 113.0, 195.0, 323.0, 502.0, 904.0, 1722.0, 3721.0, 8685.0, 24809.0, 93876.0, 354894.0, 398985.0, 112580.0, 28912.0, 9642.0, 3963.0, 1946.0, 1003.0, 546.0, 318.0, 215.0, 139.0, 91.0, 46.0, 41.0, 28.0, 25.0, 11.0, 9.0, 7.0, 5.0, 3.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.111328125, -2.049346923828125, -1.98736572265625, -1.925384521484375, -1.8634033203125, -1.801422119140625, -1.73944091796875, -1.677459716796875, -1.615478515625, -1.553497314453125, -1.49151611328125, -1.429534912109375, -1.3675537109375, -1.305572509765625, -1.24359130859375, -1.181610107421875, -1.11962890625, -1.057647705078125, -0.99566650390625, -0.933685302734375, -0.8717041015625, -0.809722900390625, -0.74774169921875, -0.685760498046875, -0.623779296875, -0.561798095703125, -0.49981689453125, -0.437835693359375, -0.3758544921875, -0.313873291015625, -0.25189208984375, -0.189910888671875, -0.1279296875, -0.065948486328125, -0.00396728515625, 0.058013916015625, 0.1199951171875, 0.181976318359375, 0.24395751953125, 0.305938720703125, 0.367919921875, 0.429901123046875, 0.49188232421875, 0.553863525390625, 0.6158447265625, 0.677825927734375, 0.73980712890625, 0.801788330078125, 0.86376953125, 0.925750732421875, 0.98773193359375, 1.049713134765625, 1.1116943359375, 1.173675537109375, 1.23565673828125, 1.297637939453125, 1.359619140625, 1.421600341796875, 1.48358154296875, 1.545562744140625, 1.6075439453125, 1.669525146484375, 1.73150634765625, 1.793487548828125, 1.85546875]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 10.0, 9.0, 14.0, 11.0, 26.0, 33.0, 43.0, 56.0, 86.0, 92.0, 85.0, 117.0, 103.0, 82.0, 75.0, 44.0, 37.0, 23.0, 9.0, 9.0, 3.0, 7.0, 3.0, 5.0, 13.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.283203125, -2.2200469970703125, -2.156890869140625, -2.0937347412109375, -2.03057861328125, -1.9674224853515625, -1.904266357421875, -1.8411102294921875, -1.7779541015625, -1.7147979736328125, -1.651641845703125, -1.5884857177734375, -1.52532958984375, -1.4621734619140625, -1.399017333984375, -1.3358612060546875, -1.272705078125, -1.2095489501953125, -1.146392822265625, -1.0832366943359375, -1.02008056640625, -0.9569244384765625, -0.893768310546875, -0.8306121826171875, -0.7674560546875, -0.7042999267578125, -0.641143798828125, -0.5779876708984375, -0.51483154296875, -0.4516754150390625, -0.388519287109375, -0.3253631591796875, -0.26220703125, -0.1990509033203125, -0.135894775390625, -0.0727386474609375, -0.00958251953125, 0.0535736083984375, 0.116729736328125, 0.1798858642578125, 0.2430419921875, 0.3061981201171875, 0.369354248046875, 0.4325103759765625, 0.49566650390625, 0.5588226318359375, 0.621978759765625, 0.6851348876953125, 0.748291015625, 0.8114471435546875, 0.874603271484375, 0.9377593994140625, 1.00091552734375, 1.0640716552734375, 1.127227783203125, 1.1903839111328125, 1.2535400390625, 1.3166961669921875, 1.379852294921875, 1.4430084228515625, 1.50616455078125, 1.5693206787109375, 1.632476806640625, 1.6956329345703125, 1.7587890625]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 7.0, 14.0, 11.0, 37.0, 72.0, 110.0, 200.0, 195.0, 147.0, 94.0, 60.0, 36.0, 12.0, 2.0, 4.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.938976287841797, -18.784746170043945, -17.630516052246094, -16.476287841796875, -15.322057723999023, -14.167827606201172, -13.013598442077637, -11.859369277954102, -10.70513916015625, -9.550909042358398, -8.396679878234863, -7.24245023727417, -6.088220596313477, -4.933990955352783, -3.77976131439209, -2.6255321502685547, -1.4713020324707031, -0.31707239151000977, 0.8371572494506836, 1.991386890411377, 3.1456165313720703, 4.299846172332764, 5.454075813293457, 6.608304977416992, 7.762535095214844, 8.916765213012695, 10.07099437713623, 11.225223541259766, 12.379453659057617, 13.533683776855469, 14.687912940979004, 15.842142105102539, 16.996368408203125, 18.150598526000977, 19.304828643798828, 20.459056854248047, 21.6132869720459, 22.76751708984375, 23.92174530029297, 25.07597541809082, 26.230205535888672, 27.384435653686523, 28.538665771484375, 29.692893981933594, 30.847124099731445, 32.0013542175293, 33.155582427978516, 34.309814453125, 35.46404266357422, 36.61827087402344, 37.77250289916992, 38.92673110961914, 40.080963134765625, 41.235191345214844, 42.38941955566406, 43.54364776611328, 44.697879791259766, 45.852108001708984, 47.00634002685547, 48.16056823730469, 49.314796447753906, 50.46902847290039, 51.62325668334961, 52.777488708496094, 53.93171691894531]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 4.0, 6.0, 5.0, 8.0, 11.0, 14.0, 15.0, 27.0, 31.0, 29.0, 22.0, 49.0, 42.0, 52.0, 56.0, 51.0, 54.0, 66.0, 61.0, 52.0, 47.0, 41.0, 39.0, 54.0, 30.0, 30.0, 19.0, 20.0, 11.0, 11.0, 16.0, 9.0, 6.0, 7.0, 4.0, 3.0, 1.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.47918701171875, -14.908544540405273, -14.337902069091797, -13.76725959777832, -13.196617126464844, -12.625974655151367, -12.055331230163574, -11.484688758850098, -10.914046287536621, -10.343403816223145, -9.772761344909668, -9.202118873596191, -8.631475448608398, -8.060832977294922, -7.490190505981445, -6.919548034667969, -6.348905563354492, -5.778263092041016, -5.207620620727539, -4.636977672576904, -4.066335201263428, -3.495692729949951, -2.9250500202178955, -2.35440731048584, -1.7837648391723633, -1.2131222486495972, -0.642479658126831, -0.07183706760406494, 0.49880552291870117, 1.0694479942321777, 1.6400907039642334, 2.210733413696289, 2.7813777923583984, 3.352020263671875, 3.9226629734039307, 4.493305683135986, 5.063948154449463, 5.6345906257629395, 6.205233573913574, 6.775876045227051, 7.346518516540527, 7.917160987854004, 8.48780345916748, 9.058445930480957, 9.62908935546875, 10.199731826782227, 10.770374298095703, 11.34101676940918, 11.911659240722656, 12.482301712036133, 13.05294418334961, 13.623586654663086, 14.194229125976562, 14.764871597290039, 15.335515022277832, 15.906157493591309, 16.47679901123047, 17.047441482543945, 17.618083953857422, 18.1887264251709, 18.759368896484375, 19.33001136779785, 19.900653839111328, 20.471298217773438, 21.041940689086914]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 7.0, 8.0, 9.0, 20.0, 23.0, 36.0, 56.0, 88.0, 170.0, 265.0, 472.0, 1013.0, 2370.0, 8204.0, 51099.0, 3724305.0, 376207.0, 21992.0, 4403.0, 1530.0, 708.0, 374.0, 240.0, 158.0, 115.0, 101.0, 76.0, 45.0, 52.0, 30.0, 22.0, 17.0, 18.0, 15.0, 9.0, 6.0, 4.0, 4.0, 1.0, 0.0, 3.0, 0.0, 3.0, 4.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.3515625, -6.0955810546875, -5.839599609375, -5.5836181640625, -5.32763671875, -5.0716552734375, -4.815673828125, -4.5596923828125, -4.3037109375, -4.0477294921875, -3.791748046875, -3.5357666015625, -3.27978515625, -3.0238037109375, -2.767822265625, -2.5118408203125, -2.255859375, -1.9998779296875, -1.743896484375, -1.4879150390625, -1.23193359375, -0.9759521484375, -0.719970703125, -0.4639892578125, -0.2080078125, 0.0479736328125, 0.303955078125, 0.5599365234375, 0.81591796875, 1.0718994140625, 1.327880859375, 1.5838623046875, 1.83984375, 2.0958251953125, 2.351806640625, 2.6077880859375, 2.86376953125, 3.1197509765625, 3.375732421875, 3.6317138671875, 3.8876953125, 4.1436767578125, 4.399658203125, 4.6556396484375, 4.91162109375, 5.1676025390625, 5.423583984375, 5.6795654296875, 5.935546875, 6.1915283203125, 6.447509765625, 6.7034912109375, 6.95947265625, 7.2154541015625, 7.471435546875, 7.7274169921875, 7.9833984375, 8.2393798828125, 8.495361328125, 8.7513427734375, 9.00732421875, 9.2633056640625, 9.519287109375, 9.7752685546875, 10.03125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 4.0, 15.0, 21.0, 19.0, 29.0, 49.0, 53.0, 57.0, 76.0, 109.0, 92.0, 108.0, 99.0, 69.0, 53.0, 49.0, 37.0, 28.0, 14.0, 7.0, 8.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7294921875, -0.6903839111328125, -0.651275634765625, -0.6121673583984375, -0.57305908203125, -0.5339508056640625, -0.494842529296875, -0.4557342529296875, -0.4166259765625, -0.3775177001953125, -0.338409423828125, -0.2993011474609375, -0.26019287109375, -0.2210845947265625, -0.181976318359375, -0.1428680419921875, -0.103759765625, -0.0646514892578125, -0.025543212890625, 0.0135650634765625, 0.05267333984375, 0.0917816162109375, 0.130889892578125, 0.1699981689453125, 0.2091064453125, 0.2482147216796875, 0.287322998046875, 0.3264312744140625, 0.36553955078125, 0.4046478271484375, 0.443756103515625, 0.4828643798828125, 0.52197265625, 0.5610809326171875, 0.600189208984375, 0.6392974853515625, 0.67840576171875, 0.7175140380859375, 0.756622314453125, 0.7957305908203125, 0.8348388671875, 0.8739471435546875, 0.913055419921875, 0.9521636962890625, 0.99127197265625, 1.0303802490234375, 1.069488525390625, 1.1085968017578125, 1.147705078125, 1.1868133544921875, 1.225921630859375, 1.2650299072265625, 1.30413818359375, 1.3432464599609375, 1.382354736328125, 1.4214630126953125, 1.4605712890625, 1.4996795654296875, 1.538787841796875, 1.5778961181640625, 1.61700439453125, 1.6561126708984375, 1.695220947265625, 1.7343292236328125, 1.7734375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 7.0, 1.0, 6.0, 3.0, 3.0, 10.0, 13.0, 10.0, 18.0, 28.0, 19.0, 26.0, 30.0, 39.0, 39.0, 51.0, 90.0, 102.0, 161.0, 281.0, 640.0, 1987.0, 9393.0, 92385.0, 3879321.0, 192003.0, 13395.0, 2504.0, 742.0, 335.0, 169.0, 123.0, 80.0, 53.0, 44.0, 36.0, 35.0, 19.0, 15.0, 15.0, 17.0, 5.0, 11.0, 6.0, 8.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.5546875, -7.299560546875, -7.04443359375, -6.789306640625, -6.5341796875, -6.279052734375, -6.02392578125, -5.768798828125, -5.513671875, -5.258544921875, -5.00341796875, -4.748291015625, -4.4931640625, -4.238037109375, -3.98291015625, -3.727783203125, -3.47265625, -3.217529296875, -2.96240234375, -2.707275390625, -2.4521484375, -2.197021484375, -1.94189453125, -1.686767578125, -1.431640625, -1.176513671875, -0.92138671875, -0.666259765625, -0.4111328125, -0.156005859375, 0.09912109375, 0.354248046875, 0.609375, 0.864501953125, 1.11962890625, 1.374755859375, 1.6298828125, 1.885009765625, 2.14013671875, 2.395263671875, 2.650390625, 2.905517578125, 3.16064453125, 3.415771484375, 3.6708984375, 3.926025390625, 4.18115234375, 4.436279296875, 4.69140625, 4.946533203125, 5.20166015625, 5.456787109375, 5.7119140625, 5.967041015625, 6.22216796875, 6.477294921875, 6.732421875, 6.987548828125, 7.24267578125, 7.497802734375, 7.7529296875, 8.008056640625, 8.26318359375, 8.518310546875, 8.7734375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 4.0, 5.0, 7.0, 1.0, 17.0, 26.0, 44.0, 93.0, 129.0, 448.0, 2099.0, 802.0, 222.0, 91.0, 50.0, 20.0, 13.0, 6.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.970703125, -3.8891754150390625, -3.807647705078125, -3.7261199951171875, -3.64459228515625, -3.5630645751953125, -3.481536865234375, -3.4000091552734375, -3.3184814453125, -3.2369537353515625, -3.155426025390625, -3.0738983154296875, -2.99237060546875, -2.9108428955078125, -2.829315185546875, -2.7477874755859375, -2.666259765625, -2.5847320556640625, -2.503204345703125, -2.4216766357421875, -2.34014892578125, -2.2586212158203125, -2.177093505859375, -2.0955657958984375, -2.0140380859375, -1.9325103759765625, -1.850982666015625, -1.7694549560546875, -1.68792724609375, -1.6063995361328125, -1.524871826171875, -1.4433441162109375, -1.36181640625, -1.2802886962890625, -1.198760986328125, -1.1172332763671875, -1.03570556640625, -0.9541778564453125, -0.872650146484375, -0.7911224365234375, -0.7095947265625, -0.6280670166015625, -0.546539306640625, -0.4650115966796875, -0.38348388671875, -0.3019561767578125, -0.220428466796875, -0.1389007568359375, -0.057373046875, 0.0241546630859375, 0.105682373046875, 0.1872100830078125, 0.26873779296875, 0.3502655029296875, 0.431793212890625, 0.5133209228515625, 0.5948486328125, 0.6763763427734375, 0.757904052734375, 0.8394317626953125, 0.92095947265625, 1.0024871826171875, 1.084014892578125, 1.1655426025390625, 1.2470703125]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 3.0, 14.0, 42.0, 63.0, 132.0, 191.0, 209.0, 160.0, 94.0, 47.0, 20.0, 11.0, 6.0, 5.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.465267181396484, -21.936521530151367, -21.40777587890625, -20.879030227661133, -20.350284576416016, -19.8215389251709, -19.29279327392578, -18.764049530029297, -18.235301971435547, -17.70655632019043, -17.177810668945312, -16.649065017700195, -16.120319366455078, -15.591573715209961, -15.06282901763916, -14.534083366394043, -14.005338668823242, -13.476593017578125, -12.947847366333008, -12.41910171508789, -11.890356063842773, -11.361610412597656, -10.832865715026855, -10.304120063781738, -9.775374412536621, -9.246628761291504, -8.717883110046387, -8.18913745880127, -7.6603922843933105, -7.131646633148193, -6.602901458740234, -6.074155807495117, -5.545408248901367, -5.01666259765625, -4.487916946411133, -3.959171772003174, -3.4304261207580566, -2.9016804695129395, -2.3729350566864014, -1.8441896438598633, -1.315443992614746, -0.7866984605789185, -0.2579529285430908, 0.2707926034927368, 0.7995381355285645, 1.3282837867736816, 1.8570291996002197, 2.385774612426758, 2.914520263671875, 3.443265914916992, 3.9720113277435303, 4.500756740570068, 5.0295023918151855, 5.558248043060303, 6.086993217468262, 6.615738868713379, 7.144484519958496, 7.673230171203613, 8.20197582244873, 8.730721473693848, 9.259466171264648, 9.788211822509766, 10.316957473754883, 10.845703125, 11.374448776245117]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 0.0, 2.0, 4.0, 2.0, 7.0, 11.0, 15.0, 16.0, 23.0, 24.0, 38.0, 31.0, 38.0, 62.0, 54.0, 57.0, 69.0, 57.0, 67.0, 69.0, 60.0, 60.0, 44.0, 51.0, 37.0, 31.0, 23.0, 23.0, 9.0, 8.0, 8.0, 3.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.600630283355713, -7.36495304107666, -7.129275321960449, -6.8935980796813965, -6.6579203605651855, -6.422243118286133, -6.186565399169922, -5.950888156890869, -5.715210914611816, -5.479533672332764, -5.243855953216553, -5.0081787109375, -4.772500991821289, -4.536823749542236, -4.301146507263184, -4.065468788146973, -3.8297910690307617, -3.59411358833313, -3.358436107635498, -3.1227588653564453, -2.8870811462402344, -2.6514039039611816, -2.41572642326355, -2.180048942565918, -1.9443714618682861, -1.7086939811706543, -1.4730165004730225, -1.2373391389846802, -1.0016616582870483, -0.7659841775894165, -0.5303068161010742, -0.2946293354034424, -0.05895233154296875, 0.1767251193523407, 0.41240257024765015, 0.6480799913406372, 0.883757472038269, 1.1194349527359009, 1.3551123142242432, 1.590789794921875, 1.8264672756195068, 2.0621447563171387, 2.2978222370147705, 2.5334997177124023, 2.769176959991455, 3.004854679107666, 3.2405319213867188, 3.4762094020843506, 3.7118868827819824, 3.9475643634796143, 4.183241844177246, 4.418919086456299, 4.65459680557251, 4.8902740478515625, 5.125951766967773, 5.361629009246826, 5.597306251525879, 5.832983493804932, 6.068661212921143, 6.304338455200195, 6.540016174316406, 6.775693416595459, 7.011370658874512, 7.247048377990723, 7.482726097106934]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 2.0, 6.0, 3.0, 11.0, 6.0, 6.0, 23.0, 9.0, 25.0, 23.0, 34.0, 49.0, 57.0, 85.0, 125.0, 159.0, 277.0, 462.0, 909.0, 1940.0, 4913.0, 17141.0, 87814.0, 463194.0, 382852.0, 66746.0, 13834.0, 4092.0, 1644.0, 813.0, 413.0, 254.0, 180.0, 117.0, 85.0, 73.0, 46.0, 38.0, 25.0, 21.0, 18.0, 11.0, 5.0, 3.0, 6.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-6.6875, -6.484375, -6.28125, -6.078125, -5.875, -5.671875, -5.46875, -5.265625, -5.0625, -4.859375, -4.65625, -4.453125, -4.25, -4.046875, -3.84375, -3.640625, -3.4375, -3.234375, -3.03125, -2.828125, -2.625, -2.421875, -2.21875, -2.015625, -1.8125, -1.609375, -1.40625, -1.203125, -1.0, -0.796875, -0.59375, -0.390625, -0.1875, 0.015625, 0.21875, 0.421875, 0.625, 0.828125, 1.03125, 1.234375, 1.4375, 1.640625, 1.84375, 2.046875, 2.25, 2.453125, 2.65625, 2.859375, 3.0625, 3.265625, 3.46875, 3.671875, 3.875, 4.078125, 4.28125, 4.484375, 4.6875, 4.890625, 5.09375, 5.296875, 5.5, 5.703125, 5.90625, 6.109375, 6.3125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 8.0, 16.0, 9.0, 15.0, 27.0, 32.0, 54.0, 64.0, 72.0, 70.0, 87.0, 100.0, 91.0, 82.0, 60.0, 57.0, 55.0, 34.0, 28.0, 13.0, 16.0, 6.0, 2.0, 4.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6796875, -0.6429443359375, -0.606201171875, -0.5694580078125, -0.53271484375, -0.4959716796875, -0.459228515625, -0.4224853515625, -0.3857421875, -0.3489990234375, -0.312255859375, -0.2755126953125, -0.23876953125, -0.2020263671875, -0.165283203125, -0.1285400390625, -0.091796875, -0.0550537109375, -0.018310546875, 0.0184326171875, 0.05517578125, 0.0919189453125, 0.128662109375, 0.1654052734375, 0.2021484375, 0.2388916015625, 0.275634765625, 0.3123779296875, 0.34912109375, 0.3858642578125, 0.422607421875, 0.4593505859375, 0.49609375, 0.5328369140625, 0.569580078125, 0.6063232421875, 0.64306640625, 0.6798095703125, 0.716552734375, 0.7532958984375, 0.7900390625, 0.8267822265625, 0.863525390625, 0.9002685546875, 0.93701171875, 0.9737548828125, 1.010498046875, 1.0472412109375, 1.083984375, 1.1207275390625, 1.157470703125, 1.1942138671875, 1.23095703125, 1.2677001953125, 1.304443359375, 1.3411865234375, 1.3779296875, 1.4146728515625, 1.451416015625, 1.4881591796875, 1.52490234375, 1.5616455078125, 1.598388671875, 1.6351318359375, 1.671875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 8.0, 13.0, 20.0, 18.0, 31.0, 45.0, 64.0, 83.0, 103.0, 186.0, 263.0, 416.0, 626.0, 1144.0, 2151.0, 4379.0, 9923.0, 24415.0, 63622.0, 159934.0, 314076.0, 267897.0, 119385.0, 46482.0, 17952.0, 7483.0, 3445.0, 1756.0, 988.0, 571.0, 327.0, 252.0, 160.0, 87.0, 74.0, 50.0, 28.0, 36.0, 17.0, 19.0, 6.0, 8.0, 6.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.68359375, -2.60186767578125, -2.5201416015625, -2.43841552734375, -2.356689453125, -2.27496337890625, -2.1932373046875, -2.11151123046875, -2.02978515625, -1.94805908203125, -1.8663330078125, -1.78460693359375, -1.702880859375, -1.62115478515625, -1.5394287109375, -1.45770263671875, -1.3759765625, -1.29425048828125, -1.2125244140625, -1.13079833984375, -1.049072265625, -0.96734619140625, -0.8856201171875, -0.80389404296875, -0.72216796875, -0.64044189453125, -0.5587158203125, -0.47698974609375, -0.395263671875, -0.31353759765625, -0.2318115234375, -0.15008544921875, -0.068359375, 0.01336669921875, 0.0950927734375, 0.17681884765625, 0.258544921875, 0.34027099609375, 0.4219970703125, 0.50372314453125, 0.58544921875, 0.66717529296875, 0.7489013671875, 0.83062744140625, 0.912353515625, 0.99407958984375, 1.0758056640625, 1.15753173828125, 1.2392578125, 1.32098388671875, 1.4027099609375, 1.48443603515625, 1.566162109375, 1.64788818359375, 1.7296142578125, 1.81134033203125, 1.89306640625, 1.97479248046875, 2.0565185546875, 2.13824462890625, 2.219970703125, 2.30169677734375, 2.3834228515625, 2.46514892578125, 2.546875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 5.0, 6.0, 2.0, 8.0, 8.0, 6.0, 12.0, 9.0, 17.0, 14.0, 18.0, 31.0, 27.0, 30.0, 32.0, 31.0, 40.0, 29.0, 33.0, 40.0, 30.0, 57.0, 44.0, 41.0, 36.0, 41.0, 34.0, 35.0, 29.0, 28.0, 38.0, 29.0, 30.0, 19.0, 18.0, 20.0, 7.0, 12.0, 9.0, 12.0, 12.0, 7.0, 6.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.36328125, -2.2845458984375, -2.205810546875, -2.1270751953125, -2.04833984375, -1.9696044921875, -1.890869140625, -1.8121337890625, -1.7333984375, -1.6546630859375, -1.575927734375, -1.4971923828125, -1.41845703125, -1.3397216796875, -1.260986328125, -1.1822509765625, -1.103515625, -1.0247802734375, -0.946044921875, -0.8673095703125, -0.78857421875, -0.7098388671875, -0.631103515625, -0.5523681640625, -0.4736328125, -0.3948974609375, -0.316162109375, -0.2374267578125, -0.15869140625, -0.0799560546875, -0.001220703125, 0.0775146484375, 0.15625, 0.2349853515625, 0.313720703125, 0.3924560546875, 0.47119140625, 0.5499267578125, 0.628662109375, 0.7073974609375, 0.7861328125, 0.8648681640625, 0.943603515625, 1.0223388671875, 1.10107421875, 1.1798095703125, 1.258544921875, 1.3372802734375, 1.416015625, 1.4947509765625, 1.573486328125, 1.6522216796875, 1.73095703125, 1.8096923828125, 1.888427734375, 1.9671630859375, 2.0458984375, 2.1246337890625, 2.203369140625, 2.2821044921875, 2.36083984375, 2.4395751953125, 2.518310546875, 2.5970458984375, 2.67578125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 2.0, 3.0, 5.0, 13.0, 19.0, 17.0, 25.0, 47.0, 66.0, 118.0, 206.0, 362.0, 690.0, 1536.0, 3731.0, 11262.0, 44992.0, 298835.0, 558426.0, 98180.0, 19884.0, 5809.0, 2203.0, 977.0, 471.0, 262.0, 146.0, 89.0, 49.0, 40.0, 34.0, 20.0, 12.0, 10.0, 3.0, 6.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.46484375, -3.36358642578125, -3.2623291015625, -3.16107177734375, -3.059814453125, -2.95855712890625, -2.8572998046875, -2.75604248046875, -2.65478515625, -2.55352783203125, -2.4522705078125, -2.35101318359375, -2.249755859375, -2.14849853515625, -2.0472412109375, -1.94598388671875, -1.8447265625, -1.74346923828125, -1.6422119140625, -1.54095458984375, -1.439697265625, -1.33843994140625, -1.2371826171875, -1.13592529296875, -1.03466796875, -0.93341064453125, -0.8321533203125, -0.73089599609375, -0.629638671875, -0.52838134765625, -0.4271240234375, -0.32586669921875, -0.224609375, -0.12335205078125, -0.0220947265625, 0.07916259765625, 0.180419921875, 0.28167724609375, 0.3829345703125, 0.48419189453125, 0.58544921875, 0.68670654296875, 0.7879638671875, 0.88922119140625, 0.990478515625, 1.09173583984375, 1.1929931640625, 1.29425048828125, 1.3955078125, 1.49676513671875, 1.5980224609375, 1.69927978515625, 1.800537109375, 1.90179443359375, 2.0030517578125, 2.10430908203125, 2.20556640625, 2.30682373046875, 2.4080810546875, 2.50933837890625, 2.610595703125, 2.71185302734375, 2.8131103515625, 2.91436767578125, 3.015625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 4.0, 3.0, 2.0, 12.0, 11.0, 22.0, 38.0, 57.0, 81.0, 135.0, 187.0, 150.0, 93.0, 65.0, 43.0, 28.0, 22.0, 18.0, 10.0, 8.0, 6.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005946159362792969, -0.0005763843655586243, -0.0005581527948379517, -0.000539921224117279, -0.0005216896533966064, -0.0005034580826759338, -0.00048522651195526123, -0.0004669949412345886, -0.000448763370513916, -0.0004305317997932434, -0.0004123002290725708, -0.0003940686583518982, -0.0003758370876312256, -0.000357605516910553, -0.00033937394618988037, -0.00032114237546920776, -0.00030291080474853516, -0.00028467923402786255, -0.00026644766330718994, -0.00024821609258651733, -0.00022998452186584473, -0.00021175295114517212, -0.0001935213804244995, -0.0001752898097038269, -0.0001570582389831543, -0.0001388266682624817, -0.00012059509754180908, -0.00010236352682113647, -8.413195610046387e-05, -6.590038537979126e-05, -4.766881465911865e-05, -2.9437243938446045e-05, -1.1205673217773438e-05, 7.02589750289917e-06, 2.5257468223571777e-05, 4.3489038944244385e-05, 6.172060966491699e-05, 7.99521803855896e-05, 9.818375110626221e-05, 0.00011641532182693481, 0.00013464689254760742, 0.00015287846326828003, 0.00017111003398895264, 0.00018934160470962524, 0.00020757317543029785, 0.00022580474615097046, 0.00024403631687164307, 0.0002622678875923157, 0.0002804994583129883, 0.0002987310290336609, 0.0003169625997543335, 0.0003351941704750061, 0.0003534257411956787, 0.0003716573119163513, 0.0003898888826370239, 0.00040812045335769653, 0.00042635202407836914, 0.00044458359479904175, 0.00046281516551971436, 0.00048104673624038696, 0.0004992783069610596, 0.0005175098776817322, 0.0005357414484024048, 0.0005539730191230774, 0.00057220458984375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 4.0, 7.0, 7.0, 6.0, 17.0, 19.0, 21.0, 57.0, 66.0, 108.0, 206.0, 367.0, 636.0, 1325.0, 2757.0, 6715.0, 19954.0, 74758.0, 367717.0, 444684.0, 91726.0, 23452.0, 7655.0, 3074.0, 1446.0, 740.0, 419.0, 258.0, 121.0, 84.0, 47.0, 32.0, 20.0, 9.0, 12.0, 6.0, 5.0, 6.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.6015625, -2.515045166015625, -2.42852783203125, -2.342010498046875, -2.2554931640625, -2.168975830078125, -2.08245849609375, -1.995941162109375, -1.909423828125, -1.822906494140625, -1.73638916015625, -1.649871826171875, -1.5633544921875, -1.476837158203125, -1.39031982421875, -1.303802490234375, -1.21728515625, -1.130767822265625, -1.04425048828125, -0.957733154296875, -0.8712158203125, -0.784698486328125, -0.69818115234375, -0.611663818359375, -0.525146484375, -0.438629150390625, -0.35211181640625, -0.265594482421875, -0.1790771484375, -0.092559814453125, -0.00604248046875, 0.080474853515625, 0.1669921875, 0.253509521484375, 0.34002685546875, 0.426544189453125, 0.5130615234375, 0.599578857421875, 0.68609619140625, 0.772613525390625, 0.859130859375, 0.945648193359375, 1.03216552734375, 1.118682861328125, 1.2052001953125, 1.291717529296875, 1.37823486328125, 1.464752197265625, 1.55126953125, 1.637786865234375, 1.72430419921875, 1.810821533203125, 1.8973388671875, 1.983856201171875, 2.07037353515625, 2.156890869140625, 2.243408203125, 2.329925537109375, 2.41644287109375, 2.502960205078125, 2.5894775390625, 2.675994873046875, 2.76251220703125, 2.849029541015625, 2.935546875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 3.0, 8.0, 7.0, 5.0, 13.0, 11.0, 22.0, 22.0, 32.0, 24.0, 47.0, 58.0, 75.0, 80.0, 95.0, 90.0, 72.0, 69.0, 56.0, 46.0, 40.0, 26.0, 23.0, 20.0, 15.0, 11.0, 11.0, 4.0, 3.0, 2.0, 2.0, 6.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0], "bins": [-2.29296875, -2.2310638427734375, -2.169158935546875, -2.1072540283203125, -2.04534912109375, -1.9834442138671875, -1.921539306640625, -1.8596343994140625, -1.7977294921875, -1.7358245849609375, -1.673919677734375, -1.6120147705078125, -1.55010986328125, -1.4882049560546875, -1.426300048828125, -1.3643951416015625, -1.302490234375, -1.2405853271484375, -1.178680419921875, -1.1167755126953125, -1.05487060546875, -0.9929656982421875, -0.931060791015625, -0.8691558837890625, -0.8072509765625, -0.7453460693359375, -0.683441162109375, -0.6215362548828125, -0.55963134765625, -0.4977264404296875, -0.435821533203125, -0.3739166259765625, -0.31201171875, -0.2501068115234375, -0.188201904296875, -0.1262969970703125, -0.06439208984375, -0.0024871826171875, 0.059417724609375, 0.1213226318359375, 0.1832275390625, 0.2451324462890625, 0.307037353515625, 0.3689422607421875, 0.43084716796875, 0.4927520751953125, 0.554656982421875, 0.6165618896484375, 0.678466796875, 0.7403717041015625, 0.802276611328125, 0.8641815185546875, 0.92608642578125, 0.9879913330078125, 1.049896240234375, 1.1118011474609375, 1.1737060546875, 1.2356109619140625, 1.297515869140625, 1.3594207763671875, 1.42132568359375, 1.4832305908203125, 1.545135498046875, 1.6070404052734375, 1.6689453125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 8.0, 29.0, 100.0, 225.0, 299.0, 218.0, 85.0, 28.0, 10.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.77985763549805, -32.665496826171875, -30.55113983154297, -28.436779022216797, -26.322420120239258, -24.20806121826172, -22.093700408935547, -19.979341506958008, -17.86498260498047, -15.75062370300293, -13.636263847351074, -11.521903991699219, -9.40754508972168, -7.293186187744141, -5.178826332092285, -3.0644664764404297, -0.9501075744628906, 1.1642518043518066, 3.278611183166504, 5.392970561981201, 7.507329940795898, 9.621688842773438, 11.736048698425293, 13.850408554077148, 15.964767456054688, 18.079126358032227, 20.193485260009766, 22.307846069335938, 24.422204971313477, 26.536563873291016, 28.650924682617188, 30.765283584594727, 32.87964630126953, 34.9940071105957, 37.10836410522461, 39.22272491455078, 41.33708190917969, 43.45144271850586, 45.56580352783203, 47.68016052246094, 49.79452133178711, 51.90888214111328, 54.02323913574219, 56.13759994506836, 58.25196075439453, 60.36631774902344, 62.48067855834961, 64.59503936767578, 66.70939636230469, 68.8237533569336, 70.93811798095703, 73.05247497558594, 75.16683197021484, 77.28118896484375, 79.39555358886719, 81.5099105834961, 83.624267578125, 85.7386245727539, 87.85298919677734, 89.96734619140625, 92.08170318603516, 94.19606018066406, 96.3104248046875, 98.4247817993164, 100.53914642333984]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 4.0, 3.0, 8.0, 10.0, 10.0, 11.0, 11.0, 16.0, 14.0, 19.0, 18.0, 32.0, 34.0, 38.0, 31.0, 31.0, 43.0, 50.0, 43.0, 34.0, 43.0, 44.0, 47.0, 40.0, 39.0, 41.0, 29.0, 40.0, 32.0, 31.0, 31.0, 22.0, 18.0, 17.0, 15.0, 13.0, 13.0, 6.0, 12.0, 4.0, 3.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.534975051879883, -16.988554000854492, -16.4421329498291, -15.895711898803711, -15.34929084777832, -14.80286979675293, -14.256449699401855, -13.710028648376465, -13.163607597351074, -12.617186546325684, -12.070765495300293, -11.524344444274902, -10.977924346923828, -10.431503295898438, -9.885082244873047, -9.338661193847656, -8.792240142822266, -8.245819091796875, -7.699398040771484, -7.152977466583252, -6.606556415557861, -6.060135364532471, -5.513714790344238, -4.967293739318848, -4.420872688293457, -3.8744516372680664, -3.328030824661255, -2.7816100120544434, -2.2351889610290527, -1.688767910003662, -1.1423470973968506, -0.5959262847900391, -0.04950523376464844, 0.49691569805145264, 1.0433366298675537, 1.5897575616836548, 2.136178493499756, 2.6825995445251465, 3.229020357131958, 3.7754411697387695, 4.32186222076416, 4.868283271789551, 5.414704322814941, 5.961124897003174, 6.5075459480285645, 7.053966999053955, 7.6003875732421875, 8.146808624267578, 8.693229675292969, 9.23965072631836, 9.78607177734375, 10.33249282836914, 10.878913879394531, 11.425334930419922, 11.971755027770996, 12.518176078796387, 13.064597129821777, 13.611018180847168, 14.157439231872559, 14.70386028289795, 15.250280380249023, 15.796701431274414, 16.343122482299805, 16.889543533325195, 17.435964584350586]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 6.0, 7.0, 19.0, 26.0, 35.0, 45.0, 78.0, 142.0, 247.0, 415.0, 836.0, 1886.0, 5373.0, 22510.0, 289267.0, 3794236.0, 63878.0, 9754.0, 2796.0, 1125.0, 537.0, 326.0, 222.0, 151.0, 128.0, 75.0, 48.0, 34.0, 19.0, 21.0, 13.0, 9.0, 5.0, 3.0, 6.0, 3.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.60546875, -6.34393310546875, -6.0823974609375, -5.82086181640625, -5.559326171875, -5.29779052734375, -5.0362548828125, -4.77471923828125, -4.51318359375, -4.25164794921875, -3.9901123046875, -3.72857666015625, -3.467041015625, -3.20550537109375, -2.9439697265625, -2.68243408203125, -2.4208984375, -2.15936279296875, -1.8978271484375, -1.63629150390625, -1.374755859375, -1.11322021484375, -0.8516845703125, -0.59014892578125, -0.32861328125, -0.06707763671875, 0.1944580078125, 0.45599365234375, 0.717529296875, 0.97906494140625, 1.2406005859375, 1.50213623046875, 1.763671875, 2.02520751953125, 2.2867431640625, 2.54827880859375, 2.809814453125, 3.07135009765625, 3.3328857421875, 3.59442138671875, 3.85595703125, 4.11749267578125, 4.3790283203125, 4.64056396484375, 4.902099609375, 5.16363525390625, 5.4251708984375, 5.68670654296875, 5.9482421875, 6.20977783203125, 6.4713134765625, 6.73284912109375, 6.994384765625, 7.25592041015625, 7.5174560546875, 7.77899169921875, 8.04052734375, 8.30206298828125, 8.5635986328125, 8.82513427734375, 9.086669921875, 9.34820556640625, 9.6097412109375, 9.87127685546875, 10.1328125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 6.0, 5.0, 10.0, 14.0, 14.0, 14.0, 24.0, 27.0, 27.0, 46.0, 61.0, 58.0, 66.0, 67.0, 74.0, 58.0, 51.0, 69.0, 59.0, 52.0, 44.0, 51.0, 27.0, 18.0, 18.0, 11.0, 15.0, 9.0, 4.0, 1.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7021484375, -0.670318603515625, -0.63848876953125, -0.606658935546875, -0.5748291015625, -0.542999267578125, -0.51116943359375, -0.479339599609375, -0.447509765625, -0.415679931640625, -0.38385009765625, -0.352020263671875, -0.3201904296875, -0.288360595703125, -0.25653076171875, -0.224700927734375, -0.19287109375, -0.161041259765625, -0.12921142578125, -0.097381591796875, -0.0655517578125, -0.033721923828125, -0.00189208984375, 0.029937744140625, 0.061767578125, 0.093597412109375, 0.12542724609375, 0.157257080078125, 0.1890869140625, 0.220916748046875, 0.25274658203125, 0.284576416015625, 0.31640625, 0.348236083984375, 0.38006591796875, 0.411895751953125, 0.4437255859375, 0.475555419921875, 0.50738525390625, 0.539215087890625, 0.571044921875, 0.602874755859375, 0.63470458984375, 0.666534423828125, 0.6983642578125, 0.730194091796875, 0.76202392578125, 0.793853759765625, 0.82568359375, 0.857513427734375, 0.88934326171875, 0.921173095703125, 0.9530029296875, 0.984832763671875, 1.01666259765625, 1.048492431640625, 1.080322265625, 1.112152099609375, 1.14398193359375, 1.175811767578125, 1.2076416015625, 1.239471435546875, 1.27130126953125, 1.303131103515625, 1.3349609375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 9.0, 6.0, 14.0, 20.0, 22.0, 42.0, 60.0, 108.0, 169.0, 235.0, 438.0, 807.0, 1420.0, 3212.0, 8012.0, 27013.0, 145122.0, 3211266.0, 704216.0, 66329.0, 15687.0, 5184.0, 2246.0, 1134.0, 658.0, 344.0, 187.0, 128.0, 70.0, 42.0, 31.0, 18.0, 20.0, 7.0, 7.0, 4.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.48046875, -4.330078125, -4.1796875, -4.029296875, -3.87890625, -3.728515625, -3.578125, -3.427734375, -3.27734375, -3.126953125, -2.9765625, -2.826171875, -2.67578125, -2.525390625, -2.375, -2.224609375, -2.07421875, -1.923828125, -1.7734375, -1.623046875, -1.47265625, -1.322265625, -1.171875, -1.021484375, -0.87109375, -0.720703125, -0.5703125, -0.419921875, -0.26953125, -0.119140625, 0.03125, 0.181640625, 0.33203125, 0.482421875, 0.6328125, 0.783203125, 0.93359375, 1.083984375, 1.234375, 1.384765625, 1.53515625, 1.685546875, 1.8359375, 1.986328125, 2.13671875, 2.287109375, 2.4375, 2.587890625, 2.73828125, 2.888671875, 3.0390625, 3.189453125, 3.33984375, 3.490234375, 3.640625, 3.791015625, 3.94140625, 4.091796875, 4.2421875, 4.392578125, 4.54296875, 4.693359375, 4.84375, 4.994140625, 5.14453125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 6.0, 2.0, 10.0, 5.0, 15.0, 17.0, 27.0, 44.0, 63.0, 100.0, 234.0, 535.0, 1631.0, 750.0, 309.0, 126.0, 78.0, 54.0, 27.0, 15.0, 5.0, 7.0, 5.0, 3.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.314453125, -2.2435302734375, -2.172607421875, -2.1016845703125, -2.03076171875, -1.9598388671875, -1.888916015625, -1.8179931640625, -1.7470703125, -1.6761474609375, -1.605224609375, -1.5343017578125, -1.46337890625, -1.3924560546875, -1.321533203125, -1.2506103515625, -1.1796875, -1.1087646484375, -1.037841796875, -0.9669189453125, -0.89599609375, -0.8250732421875, -0.754150390625, -0.6832275390625, -0.6123046875, -0.5413818359375, -0.470458984375, -0.3995361328125, -0.32861328125, -0.2576904296875, -0.186767578125, -0.1158447265625, -0.044921875, 0.0260009765625, 0.096923828125, 0.1678466796875, 0.23876953125, 0.3096923828125, 0.380615234375, 0.4515380859375, 0.5224609375, 0.5933837890625, 0.664306640625, 0.7352294921875, 0.80615234375, 0.8770751953125, 0.947998046875, 1.0189208984375, 1.08984375, 1.1607666015625, 1.231689453125, 1.3026123046875, 1.37353515625, 1.4444580078125, 1.515380859375, 1.5863037109375, 1.6572265625, 1.7281494140625, 1.799072265625, 1.8699951171875, 1.94091796875, 2.0118408203125, 2.082763671875, 2.1536865234375, 2.224609375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 9.0, 8.0, 19.0, 81.0, 259.0, 383.0, 180.0, 48.0, 14.0, 8.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0], "bins": [-55.35602569580078, -54.29960632324219, -53.243186950683594, -52.186767578125, -51.130348205566406, -50.07392883300781, -49.01750946044922, -47.961090087890625, -46.90467071533203, -45.84825134277344, -44.791831970214844, -43.73541259765625, -42.678993225097656, -41.62257385253906, -40.56615447998047, -39.509735107421875, -38.453311920166016, -37.39689254760742, -36.34047317504883, -35.284053802490234, -34.22763442993164, -33.17121505737305, -32.11479568481445, -31.058374404907227, -30.001955032348633, -28.94553565979004, -27.889116287231445, -26.83269691467285, -25.776275634765625, -24.71985626220703, -23.663436889648438, -22.607017517089844, -21.55059814453125, -20.494178771972656, -19.437759399414062, -18.38134002685547, -17.324920654296875, -16.26850128173828, -15.212080001831055, -14.155660629272461, -13.099241256713867, -12.042821884155273, -10.98640251159668, -9.92998218536377, -8.873562812805176, -7.817143440246582, -6.76072359085083, -5.704303741455078, -4.647884368896484, -3.5914647579193115, -2.5350451469421387, -1.4786255359649658, -0.42220592498779297, 0.6342134475708008, 1.6906332969665527, 2.7470531463623047, 3.8034725189208984, 4.859891891479492, 5.916311740875244, 6.972731590270996, 8.02915096282959, 9.085570335388184, 10.141990661621094, 11.198410034179688, 12.254829406738281]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 4.0, 5.0, 9.0, 3.0, 7.0, 9.0, 14.0, 25.0, 17.0, 17.0, 30.0, 40.0, 45.0, 51.0, 39.0, 52.0, 53.0, 63.0, 61.0, 54.0, 56.0, 56.0, 58.0, 29.0, 25.0, 31.0, 29.0, 29.0, 14.0, 20.0, 12.0, 14.0, 14.0, 4.0, 3.0, 5.0, 2.0, 1.0, 3.0, 2.0, 3.0], "bins": [-8.668121337890625, -8.4579496383667, -8.247777938842773, -8.037606239318848, -7.827434539794922, -7.617262840270996, -7.407090663909912, -7.196918964385986, -6.9867472648620605, -6.776575565338135, -6.566403865814209, -6.356232166290283, -6.146059989929199, -5.935888290405273, -5.725716590881348, -5.515544891357422, -5.305373191833496, -5.09520149230957, -4.8850297927856445, -4.674858093261719, -4.464686393737793, -4.254514694213867, -4.044342517852783, -3.8341708183288574, -3.6239991188049316, -3.413827419281006, -3.20365571975708, -2.993483781814575, -2.7833120822906494, -2.5731403827667236, -2.3629684448242188, -2.152796745300293, -1.9426250457763672, -1.7324533462524414, -1.522281527519226, -1.3121097087860107, -1.101938009262085, -0.8917663097381592, -0.6815944910049438, -0.4714226722717285, -0.26125097274780273, -0.05107921361923218, 0.15909254550933838, 0.36926430463790894, 0.5794360637664795, 0.7896077632904053, 0.9997795820236206, 1.209951400756836, 1.4201231002807617, 1.6302947998046875, 1.8404666185379028, 2.050638437271118, 2.260810136795044, 2.4709818363189697, 2.6811537742614746, 2.8913254737854004, 3.101497173309326, 3.311668872833252, 3.5218405723571777, 3.7320125102996826, 3.9421842098236084, 4.152356147766113, 4.362527847290039, 4.572699546813965, 4.782871246337891]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 11.0, 13.0, 35.0, 53.0, 80.0, 189.0, 469.0, 1466.0, 6668.0, 82216.0, 865299.0, 83069.0, 6661.0, 1424.0, 458.0, 205.0, 90.0, 57.0, 37.0, 23.0, 9.0, 12.0, 4.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.6796875, -11.2698974609375, -10.860107421875, -10.4503173828125, -10.04052734375, -9.6307373046875, -9.220947265625, -8.8111572265625, -8.4013671875, -7.9915771484375, -7.581787109375, -7.1719970703125, -6.76220703125, -6.3524169921875, -5.942626953125, -5.5328369140625, -5.123046875, -4.7132568359375, -4.303466796875, -3.8936767578125, -3.48388671875, -3.0740966796875, -2.664306640625, -2.2545166015625, -1.8447265625, -1.4349365234375, -1.025146484375, -0.6153564453125, -0.20556640625, 0.2042236328125, 0.614013671875, 1.0238037109375, 1.43359375, 1.8433837890625, 2.253173828125, 2.6629638671875, 3.07275390625, 3.4825439453125, 3.892333984375, 4.3021240234375, 4.7119140625, 5.1217041015625, 5.531494140625, 5.9412841796875, 6.35107421875, 6.7608642578125, 7.170654296875, 7.5804443359375, 7.990234375, 8.4000244140625, 8.809814453125, 9.2196044921875, 9.62939453125, 10.0391845703125, 10.448974609375, 10.8587646484375, 11.2685546875, 11.6783447265625, 12.088134765625, 12.4979248046875, 12.90771484375, 13.3175048828125, 13.727294921875, 14.1370849609375, 14.546875]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 8.0, 9.0, 7.0, 15.0, 13.0, 15.0, 23.0, 33.0, 46.0, 54.0, 48.0, 63.0, 58.0, 78.0, 45.0, 63.0, 58.0, 56.0, 62.0, 56.0, 40.0, 35.0, 30.0, 26.0, 12.0, 15.0, 12.0, 13.0, 1.0, 7.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7109375, -0.6796722412109375, -0.648406982421875, -0.6171417236328125, -0.58587646484375, -0.5546112060546875, -0.523345947265625, -0.4920806884765625, -0.4608154296875, -0.4295501708984375, -0.398284912109375, -0.3670196533203125, -0.33575439453125, -0.3044891357421875, -0.273223876953125, -0.2419586181640625, -0.210693359375, -0.1794281005859375, -0.148162841796875, -0.1168975830078125, -0.08563232421875, -0.0543670654296875, -0.023101806640625, 0.0081634521484375, 0.0394287109375, 0.0706939697265625, 0.101959228515625, 0.1332244873046875, 0.16448974609375, 0.1957550048828125, 0.227020263671875, 0.2582855224609375, 0.28955078125, 0.3208160400390625, 0.352081298828125, 0.3833465576171875, 0.41461181640625, 0.4458770751953125, 0.477142333984375, 0.5084075927734375, 0.5396728515625, 0.5709381103515625, 0.602203369140625, 0.6334686279296875, 0.66473388671875, 0.6959991455078125, 0.727264404296875, 0.7585296630859375, 0.789794921875, 0.8210601806640625, 0.852325439453125, 0.8835906982421875, 0.91485595703125, 0.9461212158203125, 0.977386474609375, 1.0086517333984375, 1.0399169921875, 1.0711822509765625, 1.102447509765625, 1.1337127685546875, 1.16497802734375, 1.1962432861328125, 1.227508544921875, 1.2587738037109375, 1.2900390625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 3.0, 2.0, 7.0, 12.0, 16.0, 18.0, 34.0, 53.0, 77.0, 113.0, 169.0, 266.0, 456.0, 813.0, 1542.0, 3357.0, 8294.0, 25113.0, 93890.0, 374172.0, 396425.0, 100764.0, 27007.0, 8825.0, 3384.0, 1616.0, 861.0, 473.0, 275.0, 170.0, 119.0, 79.0, 35.0, 29.0, 28.0, 9.0, 16.0, 6.0, 5.0, 8.0, 3.0, 3.0, 3.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-4.359375, -4.23492431640625, -4.1104736328125, -3.98602294921875, -3.861572265625, -3.73712158203125, -3.6126708984375, -3.48822021484375, -3.36376953125, -3.23931884765625, -3.1148681640625, -2.99041748046875, -2.865966796875, -2.74151611328125, -2.6170654296875, -2.49261474609375, -2.3681640625, -2.24371337890625, -2.1192626953125, -1.99481201171875, -1.870361328125, -1.74591064453125, -1.6214599609375, -1.49700927734375, -1.37255859375, -1.24810791015625, -1.1236572265625, -0.99920654296875, -0.874755859375, -0.75030517578125, -0.6258544921875, -0.50140380859375, -0.376953125, -0.25250244140625, -0.1280517578125, -0.00360107421875, 0.120849609375, 0.24530029296875, 0.3697509765625, 0.49420166015625, 0.61865234375, 0.74310302734375, 0.8675537109375, 0.99200439453125, 1.116455078125, 1.24090576171875, 1.3653564453125, 1.48980712890625, 1.6142578125, 1.73870849609375, 1.8631591796875, 1.98760986328125, 2.112060546875, 2.23651123046875, 2.3609619140625, 2.48541259765625, 2.60986328125, 2.73431396484375, 2.8587646484375, 2.98321533203125, 3.107666015625, 3.23211669921875, 3.3565673828125, 3.48101806640625, 3.60546875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 3.0, 2.0, 4.0, 6.0, 7.0, 4.0, 17.0, 11.0, 16.0, 24.0, 20.0, 29.0, 30.0, 38.0, 52.0, 49.0, 59.0, 47.0, 51.0, 71.0, 70.0, 54.0, 62.0, 38.0, 43.0, 38.0, 23.0, 26.0, 21.0, 15.0, 16.0, 15.0, 10.0, 10.0, 8.0, 4.0, 3.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.41015625, -3.295989990234375, -3.18182373046875, -3.067657470703125, -2.9534912109375, -2.839324951171875, -2.72515869140625, -2.610992431640625, -2.496826171875, -2.382659912109375, -2.26849365234375, -2.154327392578125, -2.0401611328125, -1.925994873046875, -1.81182861328125, -1.697662353515625, -1.58349609375, -1.469329833984375, -1.35516357421875, -1.240997314453125, -1.1268310546875, -1.012664794921875, -0.89849853515625, -0.784332275390625, -0.670166015625, -0.555999755859375, -0.44183349609375, -0.327667236328125, -0.2135009765625, -0.099334716796875, 0.01483154296875, 0.128997802734375, 0.2431640625, 0.357330322265625, 0.47149658203125, 0.585662841796875, 0.6998291015625, 0.813995361328125, 0.92816162109375, 1.042327880859375, 1.156494140625, 1.270660400390625, 1.38482666015625, 1.498992919921875, 1.6131591796875, 1.727325439453125, 1.84149169921875, 1.955657958984375, 2.06982421875, 2.183990478515625, 2.29815673828125, 2.412322998046875, 2.5264892578125, 2.640655517578125, 2.75482177734375, 2.868988037109375, 2.983154296875, 3.097320556640625, 3.21148681640625, 3.325653076171875, 3.4398193359375, 3.553985595703125, 3.66815185546875, 3.782318115234375, 3.896484375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 3.0, 9.0, 21.0, 45.0, 73.0, 152.0, 379.0, 1060.0, 4129.0, 26018.0, 883412.0, 121707.0, 8637.0, 1846.0, 584.0, 232.0, 114.0, 64.0, 27.0, 14.0, 15.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.1796875, -5.97857666015625, -5.7774658203125, -5.57635498046875, -5.375244140625, -5.17413330078125, -4.9730224609375, -4.77191162109375, -4.57080078125, -4.36968994140625, -4.1685791015625, -3.96746826171875, -3.766357421875, -3.56524658203125, -3.3641357421875, -3.16302490234375, -2.9619140625, -2.76080322265625, -2.5596923828125, -2.35858154296875, -2.157470703125, -1.95635986328125, -1.7552490234375, -1.55413818359375, -1.35302734375, -1.15191650390625, -0.9508056640625, -0.74969482421875, -0.548583984375, -0.34747314453125, -0.1463623046875, 0.05474853515625, 0.255859375, 0.45697021484375, 0.6580810546875, 0.85919189453125, 1.060302734375, 1.26141357421875, 1.4625244140625, 1.66363525390625, 1.86474609375, 2.06585693359375, 2.2669677734375, 2.46807861328125, 2.669189453125, 2.87030029296875, 3.0714111328125, 3.27252197265625, 3.4736328125, 3.67474365234375, 3.8758544921875, 4.07696533203125, 4.278076171875, 4.47918701171875, 4.6802978515625, 4.88140869140625, 5.08251953125, 5.28363037109375, 5.4847412109375, 5.68585205078125, 5.886962890625, 6.08807373046875, 6.2891845703125, 6.49029541015625, 6.69140625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 5.0, 5.0, 5.0, 6.0, 6.0, 8.0, 17.0, 18.0, 37.0, 43.0, 94.0, 266.0, 263.0, 95.0, 45.0, 36.0, 18.0, 9.0, 7.0, 10.0, 7.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.0006971359252929688, -0.0006792396306991577, -0.0006613433361053467, -0.0006434470415115356, -0.0006255507469177246, -0.0006076544523239136, -0.0005897581577301025, -0.0005718618631362915, -0.0005539655685424805, -0.0005360692739486694, -0.0005181729793548584, -0.0005002766847610474, -0.00048238039016723633, -0.0004644840955734253, -0.00044658780097961426, -0.0004286915063858032, -0.0004107952117919922, -0.00039289891719818115, -0.0003750026226043701, -0.0003571063280105591, -0.00033921003341674805, -0.000321313738822937, -0.000303417444229126, -0.00028552114963531494, -0.0002676248550415039, -0.00024972856044769287, -0.00023183226585388184, -0.0002139359712600708, -0.00019603967666625977, -0.00017814338207244873, -0.0001602470874786377, -0.00014235079288482666, -0.00012445449829101562, -0.00010655820369720459, -8.866190910339355e-05, -7.076561450958252e-05, -5.2869319915771484e-05, -3.497302532196045e-05, -1.7076730728149414e-05, 8.195638656616211e-07, 1.8715858459472656e-05, 3.661215305328369e-05, 5.4508447647094727e-05, 7.240474224090576e-05, 9.03010368347168e-05, 0.00010819733142852783, 0.00012609362602233887, 0.0001439899206161499, 0.00016188621520996094, 0.00017978250980377197, 0.000197678804397583, 0.00021557509899139404, 0.00023347139358520508, 0.0002513676881790161, 0.00026926398277282715, 0.0002871602773666382, 0.0003050565719604492, 0.00032295286655426025, 0.0003408491611480713, 0.0003587454557418823, 0.00037664175033569336, 0.0003945380449295044, 0.00041243433952331543, 0.00043033063411712646, 0.0004482269287109375]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 9.0, 21.0, 21.0, 37.0, 68.0, 111.0, 264.0, 640.0, 2366.0, 11492.0, 191275.0, 815513.0, 21418.0, 3744.0, 931.0, 321.0, 143.0, 76.0, 44.0, 32.0, 14.0, 7.0, 8.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.05859375, -4.84918212890625, -4.6397705078125, -4.43035888671875, -4.220947265625, -4.01153564453125, -3.8021240234375, -3.59271240234375, -3.38330078125, -3.17388916015625, -2.9644775390625, -2.75506591796875, -2.545654296875, -2.33624267578125, -2.1268310546875, -1.91741943359375, -1.7080078125, -1.49859619140625, -1.2891845703125, -1.07977294921875, -0.870361328125, -0.66094970703125, -0.4515380859375, -0.24212646484375, -0.03271484375, 0.17669677734375, 0.3861083984375, 0.59552001953125, 0.804931640625, 1.01434326171875, 1.2237548828125, 1.43316650390625, 1.642578125, 1.85198974609375, 2.0614013671875, 2.27081298828125, 2.480224609375, 2.68963623046875, 2.8990478515625, 3.10845947265625, 3.31787109375, 3.52728271484375, 3.7366943359375, 3.94610595703125, 4.155517578125, 4.36492919921875, 4.5743408203125, 4.78375244140625, 4.9931640625, 5.20257568359375, 5.4119873046875, 5.62139892578125, 5.830810546875, 6.04022216796875, 6.2496337890625, 6.45904541015625, 6.66845703125, 6.87786865234375, 7.0872802734375, 7.29669189453125, 7.506103515625, 7.71551513671875, 7.9249267578125, 8.13433837890625, 8.34375]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 7.0, 5.0, 5.0, 4.0, 9.0, 14.0, 12.0, 16.0, 16.0, 32.0, 54.0, 94.0, 156.0, 167.0, 130.0, 85.0, 60.0, 30.0, 27.0, 19.0, 11.0, 9.0, 6.0, 8.0, 4.0, 4.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.30859375, -2.23291015625, -2.1572265625, -2.08154296875, -2.005859375, -1.93017578125, -1.8544921875, -1.77880859375, -1.703125, -1.62744140625, -1.5517578125, -1.47607421875, -1.400390625, -1.32470703125, -1.2490234375, -1.17333984375, -1.09765625, -1.02197265625, -0.9462890625, -0.87060546875, -0.794921875, -0.71923828125, -0.6435546875, -0.56787109375, -0.4921875, -0.41650390625, -0.3408203125, -0.26513671875, -0.189453125, -0.11376953125, -0.0380859375, 0.03759765625, 0.11328125, 0.18896484375, 0.2646484375, 0.34033203125, 0.416015625, 0.49169921875, 0.5673828125, 0.64306640625, 0.71875, 0.79443359375, 0.8701171875, 0.94580078125, 1.021484375, 1.09716796875, 1.1728515625, 1.24853515625, 1.32421875, 1.39990234375, 1.4755859375, 1.55126953125, 1.626953125, 1.70263671875, 1.7783203125, 1.85400390625, 1.9296875, 2.00537109375, 2.0810546875, 2.15673828125, 2.232421875, 2.30810546875, 2.3837890625, 2.45947265625, 2.53515625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 7.0, 10.0, 22.0, 48.0, 50.0, 111.0, 139.0, 173.0, 145.0, 106.0, 79.0, 53.0, 26.0, 18.0, 8.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-56.092018127441406, -54.839561462402344, -53.58710479736328, -52.33464813232422, -51.08218765258789, -49.82973098754883, -48.577274322509766, -47.3248176574707, -46.07236099243164, -44.81990432739258, -43.567447662353516, -42.31498718261719, -41.062530517578125, -39.81007385253906, -38.5576171875, -37.30516052246094, -36.052703857421875, -34.80024719238281, -33.54779052734375, -32.29533386230469, -31.042875289916992, -29.790416717529297, -28.537960052490234, -27.285503387451172, -26.033042907714844, -24.78058624267578, -23.528127670288086, -22.275671005249023, -21.02321434020996, -19.770755767822266, -18.518299102783203, -17.26584243774414, -16.013385772705078, -14.7609281539917, -13.508471488952637, -12.256013870239258, -11.003557205200195, -9.751099586486816, -8.498641967773438, -7.246185302734375, -5.993727684020996, -4.741270542144775, -3.4888131618499756, -2.236355781555176, -0.9838986396789551, 0.2685585021972656, 1.5210161209106445, 2.773472785949707, 4.025930404663086, 5.278387546539307, 6.530844688415527, 7.783302307128906, 9.035758972167969, 10.288216590881348, 11.540674209594727, 12.793130874633789, 14.045588493347168, 15.298046112060547, 16.55050277709961, 17.802959442138672, 19.055418014526367, 20.30787467956543, 21.560333251953125, 22.812789916992188, 24.06524658203125]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 4.0, 2.0, 4.0, 8.0, 9.0, 12.0, 19.0, 12.0, 21.0, 26.0, 30.0, 39.0, 31.0, 37.0, 50.0, 33.0, 46.0, 41.0, 37.0, 41.0, 44.0, 50.0, 50.0, 42.0, 36.0, 51.0, 34.0, 25.0, 24.0, 30.0, 19.0, 15.0, 16.0, 16.0, 6.0, 13.0, 11.0, 4.0, 7.0, 1.0, 3.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-19.359045028686523, -18.80318260192871, -18.2473201751709, -17.691455841064453, -17.13559341430664, -16.579730987548828, -16.023868560791016, -15.468005180358887, -14.912141799926758, -14.356279373168945, -13.800415992736816, -13.244553565979004, -12.688690185546875, -12.132827758789062, -11.57696533203125, -11.021101951599121, -10.465239524841309, -9.909377098083496, -9.353513717651367, -8.797651290893555, -8.241787910461426, -7.685925483703613, -7.130062580108643, -6.574199676513672, -6.018336772918701, -5.4624738693237305, -4.90661096572876, -4.350748062133789, -3.7948853969573975, -3.2390224933624268, -2.683159828186035, -2.1272969245910645, -1.5714340209960938, -1.015571117401123, -0.4597083330154419, 0.09615445137023926, 0.65201735496521, 1.2078802585601807, 1.7637429237365723, 2.319605827331543, 2.8754687309265137, 3.4313316345214844, 3.987194538116455, 4.543057441711426, 5.098919868469238, 5.654783248901367, 6.21064567565918, 6.76650857925415, 7.322371482849121, 7.878234386444092, 8.434097290039062, 8.989959716796875, 9.545823097229004, 10.101685523986816, 10.657548904418945, 11.213411331176758, 11.76927375793457, 12.325136184692383, 12.880999565124512, 13.436861991882324, 13.992725372314453, 14.548587799072266, 15.104450225830078, 15.660313606262207, 16.216176986694336]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 7.0, 8.0, 7.0, 13.0, 23.0, 35.0, 58.0, 120.0, 207.0, 310.0, 547.0, 1297.0, 3661.0, 15961.0, 171517.0, 3912361.0, 74122.0, 9494.0, 2436.0, 911.0, 474.0, 215.0, 139.0, 105.0, 70.0, 55.0, 42.0, 31.0, 17.0, 15.0, 12.0, 3.0, 7.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.7578125, -8.4871826171875, -8.216552734375, -7.9459228515625, -7.67529296875, -7.4046630859375, -7.134033203125, -6.8634033203125, -6.5927734375, -6.3221435546875, -6.051513671875, -5.7808837890625, -5.51025390625, -5.2396240234375, -4.968994140625, -4.6983642578125, -4.427734375, -4.1571044921875, -3.886474609375, -3.6158447265625, -3.34521484375, -3.0745849609375, -2.803955078125, -2.5333251953125, -2.2626953125, -1.9920654296875, -1.721435546875, -1.4508056640625, -1.18017578125, -0.9095458984375, -0.638916015625, -0.3682861328125, -0.09765625, 0.1729736328125, 0.443603515625, 0.7142333984375, 0.98486328125, 1.2554931640625, 1.526123046875, 1.7967529296875, 2.0673828125, 2.3380126953125, 2.608642578125, 2.8792724609375, 3.14990234375, 3.4205322265625, 3.691162109375, 3.9617919921875, 4.232421875, 4.5030517578125, 4.773681640625, 5.0443115234375, 5.31494140625, 5.5855712890625, 5.856201171875, 6.1268310546875, 6.3974609375, 6.6680908203125, 6.938720703125, 7.2093505859375, 7.47998046875, 7.7506103515625, 8.021240234375, 8.2918701171875, 8.5625]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 5.0, 2.0, 4.0, 11.0, 14.0, 16.0, 14.0, 22.0, 22.0, 27.0, 32.0, 36.0, 36.0, 43.0, 45.0, 39.0, 48.0, 60.0, 50.0, 49.0, 55.0, 51.0, 44.0, 43.0, 30.0, 33.0, 33.0, 31.0, 22.0, 25.0, 11.0, 17.0, 6.0, 9.0, 7.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.73388671875, -0.70703125, -0.68017578125, -0.6533203125, -0.62646484375, -0.599609375, -0.57275390625, -0.5458984375, -0.51904296875, -0.4921875, -0.46533203125, -0.4384765625, -0.41162109375, -0.384765625, -0.35791015625, -0.3310546875, -0.30419921875, -0.27734375, -0.25048828125, -0.2236328125, -0.19677734375, -0.169921875, -0.14306640625, -0.1162109375, -0.08935546875, -0.0625, -0.03564453125, -0.0087890625, 0.01806640625, 0.044921875, 0.07177734375, 0.0986328125, 0.12548828125, 0.15234375, 0.17919921875, 0.2060546875, 0.23291015625, 0.259765625, 0.28662109375, 0.3134765625, 0.34033203125, 0.3671875, 0.39404296875, 0.4208984375, 0.44775390625, 0.474609375, 0.50146484375, 0.5283203125, 0.55517578125, 0.58203125, 0.60888671875, 0.6357421875, 0.66259765625, 0.689453125, 0.71630859375, 0.7431640625, 0.77001953125, 0.796875, 0.82373046875, 0.8505859375, 0.87744140625, 0.904296875, 0.93115234375, 0.9580078125, 0.98486328125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 4.0, 6.0, 11.0, 8.0, 6.0, 23.0, 33.0, 37.0, 53.0, 58.0, 70.0, 114.0, 169.0, 242.0, 424.0, 673.0, 1499.0, 3745.0, 15265.0, 129268.0, 3885352.0, 134323.0, 15527.0, 4015.0, 1483.0, 673.0, 384.0, 230.0, 184.0, 98.0, 78.0, 68.0, 40.0, 27.0, 27.0, 24.0, 6.0, 15.0, 4.0, 8.0, 2.0, 2.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.8125, -7.5477294921875, -7.282958984375, -7.0181884765625, -6.75341796875, -6.4886474609375, -6.223876953125, -5.9591064453125, -5.6943359375, -5.4295654296875, -5.164794921875, -4.9000244140625, -4.63525390625, -4.3704833984375, -4.105712890625, -3.8409423828125, -3.576171875, -3.3114013671875, -3.046630859375, -2.7818603515625, -2.51708984375, -2.2523193359375, -1.987548828125, -1.7227783203125, -1.4580078125, -1.1932373046875, -0.928466796875, -0.6636962890625, -0.39892578125, -0.1341552734375, 0.130615234375, 0.3953857421875, 0.66015625, 0.9249267578125, 1.189697265625, 1.4544677734375, 1.71923828125, 1.9840087890625, 2.248779296875, 2.5135498046875, 2.7783203125, 3.0430908203125, 3.307861328125, 3.5726318359375, 3.83740234375, 4.1021728515625, 4.366943359375, 4.6317138671875, 4.896484375, 5.1612548828125, 5.426025390625, 5.6907958984375, 5.95556640625, 6.2203369140625, 6.485107421875, 6.7498779296875, 7.0146484375, 7.2794189453125, 7.544189453125, 7.8089599609375, 8.07373046875, 8.3385009765625, 8.603271484375, 8.8680419921875, 9.1328125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 6.0, 10.0, 25.0, 34.0, 50.0, 89.0, 288.0, 1626.0, 1474.0, 259.0, 96.0, 44.0, 17.0, 14.0, 17.0, 8.0, 6.0, 2.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.095703125, -2.998931884765625, -2.90216064453125, -2.805389404296875, -2.7086181640625, -2.611846923828125, -2.51507568359375, -2.418304443359375, -2.321533203125, -2.224761962890625, -2.12799072265625, -2.031219482421875, -1.9344482421875, -1.837677001953125, -1.74090576171875, -1.644134521484375, -1.54736328125, -1.450592041015625, -1.35382080078125, -1.257049560546875, -1.1602783203125, -1.063507080078125, -0.96673583984375, -0.869964599609375, -0.773193359375, -0.676422119140625, -0.57965087890625, -0.482879638671875, -0.3861083984375, -0.289337158203125, -0.19256591796875, -0.095794677734375, 0.0009765625, 0.097747802734375, 0.19451904296875, 0.291290283203125, 0.3880615234375, 0.484832763671875, 0.58160400390625, 0.678375244140625, 0.775146484375, 0.871917724609375, 0.96868896484375, 1.065460205078125, 1.1622314453125, 1.259002685546875, 1.35577392578125, 1.452545166015625, 1.54931640625, 1.646087646484375, 1.74285888671875, 1.839630126953125, 1.9364013671875, 2.033172607421875, 2.12994384765625, 2.226715087890625, 2.323486328125, 2.420257568359375, 2.51702880859375, 2.613800048828125, 2.7105712890625, 2.807342529296875, 2.90411376953125, 3.000885009765625, 3.09765625]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 6.0, 7.0, 5.0, 16.0, 58.0, 101.0, 240.0, 310.0, 172.0, 49.0, 20.0, 9.0, 1.0, 4.0, 2.0, 0.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.20721435546875, -29.35400390625, -28.500791549682617, -27.647581100463867, -26.794370651245117, -25.941158294677734, -25.087947845458984, -24.234737396240234, -23.381526947021484, -22.528316497802734, -21.67510414123535, -20.8218936920166, -19.96868324279785, -19.11547088623047, -18.26226043701172, -17.40904998779297, -16.555837631225586, -15.70262622833252, -14.84941577911377, -13.996204376220703, -13.142993927001953, -12.289782524108887, -11.43657112121582, -10.58336067199707, -9.730149269104004, -8.876937866210938, -8.023727416992188, -7.170516014099121, -6.317305088043213, -5.464094161987305, -4.610882759094238, -3.75767183303833, -2.904460906982422, -2.0512499809265137, -1.1980388164520264, -0.34482765197753906, 0.5083832740783691, 1.3615942001342773, 2.2148056030273438, 3.068016529083252, 3.92122745513916, 4.774438381195068, 5.627649307250977, 6.480860710144043, 7.334071636199951, 8.18728256225586, 9.040493965148926, 9.893705368041992, 10.746915817260742, 11.600127220153809, 12.453337669372559, 13.306549072265625, 14.159759521484375, 15.012970924377441, 15.866182327270508, 16.719392776489258, 17.57260513305664, 18.42581558227539, 19.279027938842773, 20.132238388061523, 20.985448837280273, 21.838661193847656, 22.691871643066406, 23.545082092285156, 24.398292541503906]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 7.0, 5.0, 6.0, 5.0, 8.0, 11.0, 16.0, 14.0, 27.0, 17.0, 37.0, 32.0, 44.0, 40.0, 65.0, 49.0, 49.0, 55.0, 60.0, 57.0, 51.0, 45.0, 41.0, 38.0, 38.0, 26.0, 20.0, 30.0, 27.0, 17.0, 21.0, 10.0, 7.0, 8.0, 4.0, 6.0, 6.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-6.509624004364014, -6.294403076171875, -6.079182147979736, -5.863961219787598, -5.648739814758301, -5.43351936340332, -5.218297958374023, -5.003077030181885, -4.787856101989746, -4.572635173797607, -4.357414245605469, -4.14219331741333, -3.9269721508026123, -3.7117512226104736, -3.496530055999756, -3.281309127807617, -3.0660881996154785, -2.85086727142334, -2.635646343231201, -2.4204251766204834, -2.2052042484283447, -1.989983320236206, -1.7747622728347778, -1.5595412254333496, -1.344320297241211, -1.1290993690490723, -0.913878321647644, -0.6986573338508606, -0.48343634605407715, -0.2682154178619385, -0.052994370460510254, 0.16222667694091797, 0.37744760513305664, 0.5926685929298401, 0.8078895807266235, 1.0231106281280518, 1.2383315563201904, 1.453552484512329, 1.6687735319137573, 1.8839945793151855, 2.099215507507324, 2.314436435699463, 2.5296573638916016, 2.7448785305023193, 2.960099458694458, 3.1753203868865967, 3.3905415534973145, 3.605762481689453, 3.820983409881592, 4.0362043380737305, 4.251425266265869, 4.466646194458008, 4.681867599487305, 4.897088050842285, 5.112309455871582, 5.327530384063721, 5.542751312255859, 5.757972240447998, 5.973193168640137, 6.188414096832275, 6.403635025024414, 6.618856430053711, 6.83407735824585, 7.049298286437988, 7.264519214630127]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 5.0, 4.0, 4.0, 11.0, 5.0, 20.0, 18.0, 30.0, 36.0, 41.0, 71.0, 83.0, 149.0, 255.0, 357.0, 708.0, 1575.0, 3842.0, 12971.0, 58486.0, 323976.0, 515527.0, 99906.0, 20672.0, 5603.0, 2021.0, 939.0, 466.0, 279.0, 135.0, 110.0, 67.0, 48.0, 38.0, 23.0, 14.0, 16.0, 13.0, 5.0, 9.0, 7.0, 1.0, 4.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.484375, -5.282470703125, -5.08056640625, -4.878662109375, -4.6767578125, -4.474853515625, -4.27294921875, -4.071044921875, -3.869140625, -3.667236328125, -3.46533203125, -3.263427734375, -3.0615234375, -2.859619140625, -2.65771484375, -2.455810546875, -2.25390625, -2.052001953125, -1.85009765625, -1.648193359375, -1.4462890625, -1.244384765625, -1.04248046875, -0.840576171875, -0.638671875, -0.436767578125, -0.23486328125, -0.032958984375, 0.1689453125, 0.370849609375, 0.57275390625, 0.774658203125, 0.9765625, 1.178466796875, 1.38037109375, 1.582275390625, 1.7841796875, 1.986083984375, 2.18798828125, 2.389892578125, 2.591796875, 2.793701171875, 2.99560546875, 3.197509765625, 3.3994140625, 3.601318359375, 3.80322265625, 4.005126953125, 4.20703125, 4.408935546875, 4.61083984375, 4.812744140625, 5.0146484375, 5.216552734375, 5.41845703125, 5.620361328125, 5.822265625, 6.024169921875, 6.22607421875, 6.427978515625, 6.6298828125, 6.831787109375, 7.03369140625, 7.235595703125, 7.4375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 1.0, 8.0, 9.0, 16.0, 16.0, 19.0, 24.0, 21.0, 28.0, 44.0, 50.0, 47.0, 64.0, 55.0, 61.0, 52.0, 59.0, 55.0, 61.0, 47.0, 55.0, 48.0, 42.0, 27.0, 15.0, 18.0, 21.0, 14.0, 9.0, 4.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.81494140625, -0.7830429077148438, -0.7511444091796875, -0.7192459106445312, -0.687347412109375, -0.6554489135742188, -0.6235504150390625, -0.5916519165039062, -0.55975341796875, -0.5278549194335938, -0.4959564208984375, -0.46405792236328125, -0.432159423828125, -0.40026092529296875, -0.3683624267578125, -0.33646392822265625, -0.3045654296875, -0.27266693115234375, -0.2407684326171875, -0.20886993408203125, -0.176971435546875, -0.14507293701171875, -0.1131744384765625, -0.08127593994140625, -0.04937744140625, -0.01747894287109375, 0.0144195556640625, 0.04631805419921875, 0.078216552734375, 0.11011505126953125, 0.1420135498046875, 0.17391204833984375, 0.205810546875, 0.23770904541015625, 0.2696075439453125, 0.30150604248046875, 0.333404541015625, 0.36530303955078125, 0.3972015380859375, 0.42910003662109375, 0.46099853515625, 0.49289703369140625, 0.5247955322265625, 0.5566940307617188, 0.588592529296875, 0.6204910278320312, 0.6523895263671875, 0.6842880249023438, 0.7161865234375, 0.7480850219726562, 0.7799835205078125, 0.8118820190429688, 0.843780517578125, 0.8756790161132812, 0.9075775146484375, 0.9394760131835938, 0.97137451171875, 1.0032730102539062, 1.0351715087890625, 1.0670700073242188, 1.098968505859375, 1.1308670043945312, 1.1627655029296875, 1.1946640014648438, 1.2265625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 7.0, 10.0, 11.0, 12.0, 16.0, 20.0, 22.0, 38.0, 57.0, 96.0, 123.0, 183.0, 276.0, 510.0, 934.0, 1916.0, 4547.0, 11324.0, 31432.0, 94264.0, 302785.0, 396779.0, 133966.0, 42702.0, 15378.0, 5916.0, 2509.0, 1115.0, 630.0, 333.0, 224.0, 130.0, 76.0, 55.0, 49.0, 33.0, 15.0, 24.0, 15.0, 4.0, 6.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.9765625, -2.870819091796875, -2.76507568359375, -2.659332275390625, -2.5535888671875, -2.447845458984375, -2.34210205078125, -2.236358642578125, -2.130615234375, -2.024871826171875, -1.91912841796875, -1.813385009765625, -1.7076416015625, -1.601898193359375, -1.49615478515625, -1.390411376953125, -1.28466796875, -1.178924560546875, -1.07318115234375, -0.967437744140625, -0.8616943359375, -0.755950927734375, -0.65020751953125, -0.544464111328125, -0.438720703125, -0.332977294921875, -0.22723388671875, -0.121490478515625, -0.0157470703125, 0.089996337890625, 0.19573974609375, 0.301483154296875, 0.4072265625, 0.512969970703125, 0.61871337890625, 0.724456787109375, 0.8302001953125, 0.935943603515625, 1.04168701171875, 1.147430419921875, 1.253173828125, 1.358917236328125, 1.46466064453125, 1.570404052734375, 1.6761474609375, 1.781890869140625, 1.88763427734375, 1.993377685546875, 2.09912109375, 2.204864501953125, 2.31060791015625, 2.416351318359375, 2.5220947265625, 2.627838134765625, 2.73358154296875, 2.839324951171875, 2.945068359375, 3.050811767578125, 3.15655517578125, 3.262298583984375, 3.3680419921875, 3.473785400390625, 3.57952880859375, 3.685272216796875, 3.791015625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 0.0, 3.0, 5.0, 0.0, 3.0, 3.0, 7.0, 4.0, 7.0, 5.0, 7.0, 10.0, 13.0, 9.0, 21.0, 21.0, 15.0, 19.0, 25.0, 26.0, 33.0, 35.0, 41.0, 36.0, 36.0, 46.0, 35.0, 41.0, 49.0, 40.0, 32.0, 31.0, 42.0, 30.0, 37.0, 33.0, 26.0, 37.0, 15.0, 19.0, 22.0, 15.0, 11.0, 10.0, 7.0, 12.0, 7.0, 5.0, 7.0, 4.0, 5.0, 2.0, 1.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-2.552734375, -2.473236083984375, -2.39373779296875, -2.314239501953125, -2.2347412109375, -2.155242919921875, -2.07574462890625, -1.996246337890625, -1.916748046875, -1.837249755859375, -1.75775146484375, -1.678253173828125, -1.5987548828125, -1.519256591796875, -1.43975830078125, -1.360260009765625, -1.28076171875, -1.201263427734375, -1.12176513671875, -1.042266845703125, -0.9627685546875, -0.883270263671875, -0.80377197265625, -0.724273681640625, -0.644775390625, -0.565277099609375, -0.48577880859375, -0.406280517578125, -0.3267822265625, -0.247283935546875, -0.16778564453125, -0.088287353515625, -0.0087890625, 0.070709228515625, 0.15020751953125, 0.229705810546875, 0.3092041015625, 0.388702392578125, 0.46820068359375, 0.547698974609375, 0.627197265625, 0.706695556640625, 0.78619384765625, 0.865692138671875, 0.9451904296875, 1.024688720703125, 1.10418701171875, 1.183685302734375, 1.26318359375, 1.342681884765625, 1.42218017578125, 1.501678466796875, 1.5811767578125, 1.660675048828125, 1.74017333984375, 1.819671630859375, 1.899169921875, 1.978668212890625, 2.05816650390625, 2.137664794921875, 2.2171630859375, 2.296661376953125, 2.37615966796875, 2.455657958984375, 2.53515625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 9.0, 9.0, 17.0, 14.0, 30.0, 53.0, 79.0, 153.0, 295.0, 630.0, 1471.0, 4130.0, 13801.0, 64366.0, 649455.0, 264930.0, 35547.0, 8679.0, 2799.0, 1071.0, 448.0, 260.0, 131.0, 67.0, 45.0, 29.0, 17.0, 9.0, 4.0, 7.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1875, -2.099365234375, -2.01123046875, -1.923095703125, -1.8349609375, -1.746826171875, -1.65869140625, -1.570556640625, -1.482421875, -1.394287109375, -1.30615234375, -1.218017578125, -1.1298828125, -1.041748046875, -0.95361328125, -0.865478515625, -0.77734375, -0.689208984375, -0.60107421875, -0.512939453125, -0.4248046875, -0.336669921875, -0.24853515625, -0.160400390625, -0.072265625, 0.015869140625, 0.10400390625, 0.192138671875, 0.2802734375, 0.368408203125, 0.45654296875, 0.544677734375, 0.6328125, 0.720947265625, 0.80908203125, 0.897216796875, 0.9853515625, 1.073486328125, 1.16162109375, 1.249755859375, 1.337890625, 1.426025390625, 1.51416015625, 1.602294921875, 1.6904296875, 1.778564453125, 1.86669921875, 1.954833984375, 2.04296875, 2.131103515625, 2.21923828125, 2.307373046875, 2.3955078125, 2.483642578125, 2.57177734375, 2.659912109375, 2.748046875, 2.836181640625, 2.92431640625, 3.012451171875, 3.1005859375, 3.188720703125, 3.27685546875, 3.364990234375, 3.453125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 5.0, 9.0, 7.0, 12.0, 17.0, 18.0, 28.0, 63.0, 161.0, 424.0, 119.0, 46.0, 26.0, 23.0, 15.0, 14.0, 4.0, 6.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005025863647460938, -0.0004810541868209839, -0.000459522008895874, -0.00043798983097076416, -0.0004164576530456543, -0.00039492547512054443, -0.00037339329719543457, -0.0003518611192703247, -0.00033032894134521484, -0.000308796763420105, -0.0002872645854949951, -0.00026573240756988525, -0.0002442002296447754, -0.00022266805171966553, -0.00020113587379455566, -0.0001796036958694458, -0.00015807151794433594, -0.00013653934001922607, -0.00011500716209411621, -9.347498416900635e-05, -7.194280624389648e-05, -5.041062831878662e-05, -2.8878450393676758e-05, -7.3462724685668945e-06, 1.4185905456542969e-05, 3.571808338165283e-05, 5.7250261306762695e-05, 7.878243923187256e-05, 0.00010031461715698242, 0.00012184679508209229, 0.00014337897300720215, 0.000164911150932312, 0.00018644332885742188, 0.00020797550678253174, 0.0002295076847076416, 0.00025103986263275146, 0.00027257204055786133, 0.0002941042184829712, 0.00031563639640808105, 0.0003371685743331909, 0.0003587007522583008, 0.00038023293018341064, 0.0004017651081085205, 0.00042329728603363037, 0.00044482946395874023, 0.0004663616418838501, 0.00048789381980895996, 0.0005094259977340698, 0.0005309581756591797, 0.0005524903535842896, 0.0005740225315093994, 0.0005955547094345093, 0.0006170868873596191, 0.000638619065284729, 0.0006601512432098389, 0.0006816834211349487, 0.0007032155990600586, 0.0007247477769851685, 0.0007462799549102783, 0.0007678121328353882, 0.000789344310760498, 0.0008108764886856079, 0.0008324086666107178, 0.0008539408445358276, 0.0008754730224609375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 7.0, 10.0, 16.0, 26.0, 48.0, 85.0, 100.0, 235.0, 465.0, 1117.0, 3432.0, 14086.0, 78659.0, 816688.0, 109187.0, 17848.0, 4148.0, 1277.0, 522.0, 253.0, 147.0, 92.0, 41.0, 24.0, 16.0, 8.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.794921875, -2.685638427734375, -2.57635498046875, -2.467071533203125, -2.3577880859375, -2.248504638671875, -2.13922119140625, -2.029937744140625, -1.920654296875, -1.811370849609375, -1.70208740234375, -1.592803955078125, -1.4835205078125, -1.374237060546875, -1.26495361328125, -1.155670166015625, -1.04638671875, -0.937103271484375, -0.82781982421875, -0.718536376953125, -0.6092529296875, -0.499969482421875, -0.39068603515625, -0.281402587890625, -0.172119140625, -0.062835693359375, 0.04644775390625, 0.155731201171875, 0.2650146484375, 0.374298095703125, 0.48358154296875, 0.592864990234375, 0.7021484375, 0.811431884765625, 0.92071533203125, 1.029998779296875, 1.1392822265625, 1.248565673828125, 1.35784912109375, 1.467132568359375, 1.576416015625, 1.685699462890625, 1.79498291015625, 1.904266357421875, 2.0135498046875, 2.122833251953125, 2.23211669921875, 2.341400146484375, 2.45068359375, 2.559967041015625, 2.66925048828125, 2.778533935546875, 2.8878173828125, 2.997100830078125, 3.10638427734375, 3.215667724609375, 3.324951171875, 3.434234619140625, 3.54351806640625, 3.652801513671875, 3.7620849609375, 3.871368408203125, 3.98065185546875, 4.089935302734375, 4.19921875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 7.0, 7.0, 10.0, 11.0, 11.0, 9.0, 19.0, 23.0, 39.0, 76.0, 129.0, 209.0, 191.0, 103.0, 54.0, 22.0, 20.0, 11.0, 16.0, 8.0, 10.0, 6.0, 2.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.083984375, -2.002838134765625, -1.92169189453125, -1.840545654296875, -1.7593994140625, -1.678253173828125, -1.59710693359375, -1.515960693359375, -1.434814453125, -1.353668212890625, -1.27252197265625, -1.191375732421875, -1.1102294921875, -1.029083251953125, -0.94793701171875, -0.866790771484375, -0.78564453125, -0.704498291015625, -0.62335205078125, -0.542205810546875, -0.4610595703125, -0.379913330078125, -0.29876708984375, -0.217620849609375, -0.136474609375, -0.055328369140625, 0.02581787109375, 0.106964111328125, 0.1881103515625, 0.269256591796875, 0.35040283203125, 0.431549072265625, 0.5126953125, 0.593841552734375, 0.67498779296875, 0.756134033203125, 0.8372802734375, 0.918426513671875, 0.99957275390625, 1.080718994140625, 1.161865234375, 1.243011474609375, 1.32415771484375, 1.405303955078125, 1.4864501953125, 1.567596435546875, 1.64874267578125, 1.729888916015625, 1.81103515625, 1.892181396484375, 1.97332763671875, 2.054473876953125, 2.1356201171875, 2.216766357421875, 2.29791259765625, 2.379058837890625, 2.460205078125, 2.541351318359375, 2.62249755859375, 2.703643798828125, 2.7847900390625, 2.865936279296875, 2.94708251953125, 3.028228759765625, 3.109375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 9.0, 6.0, 16.0, 47.0, 97.0, 168.0, 241.0, 221.0, 120.0, 52.0, 22.0, 7.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-85.15440368652344, -83.44251251220703, -81.73062133789062, -80.01873779296875, -78.30684661865234, -76.59495544433594, -74.88306427001953, -73.17117309570312, -71.45928955078125, -69.74739837646484, -68.03550720214844, -66.32362365722656, -64.61173248291016, -62.89984130859375, -61.187950134277344, -59.4760627746582, -57.76416778564453, -56.052276611328125, -54.340389251708984, -52.62849807739258, -50.91661071777344, -49.20471954345703, -47.492828369140625, -45.780941009521484, -44.069053649902344, -42.35716247558594, -40.6452751159668, -38.93338394165039, -37.22149658203125, -35.509605407714844, -33.79771423339844, -32.0858268737793, -30.373937606811523, -28.66204833984375, -26.950159072875977, -25.238269805908203, -23.526378631591797, -21.814489364624023, -20.10260009765625, -18.390708923339844, -16.678821563720703, -14.96693229675293, -13.25504207611084, -11.543152809143066, -9.831262588500977, -8.119373321533203, -6.40748405456543, -4.69559383392334, -2.98370361328125, -1.271813988685608, 0.4400756359100342, 2.1519651412963867, 3.8638548851013184, 5.57574462890625, 7.287633895874023, 8.999524116516113, 10.711413383483887, 12.42330265045166, 14.13519287109375, 15.847082138061523, 17.558971405029297, 19.270862579345703, 20.982749938964844, 22.69464111328125, 24.406530380249023]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 4.0, 8.0, 2.0, 16.0, 10.0, 19.0, 23.0, 21.0, 29.0, 41.0, 43.0, 35.0, 36.0, 51.0, 35.0, 52.0, 50.0, 44.0, 41.0, 52.0, 39.0, 45.0, 52.0, 35.0, 36.0, 28.0, 23.0, 24.0, 20.0, 17.0, 14.0, 16.0, 6.0, 9.0, 7.0, 7.0, 3.0, 7.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-17.921579360961914, -17.432241439819336, -16.942903518676758, -16.45356559753418, -15.964228630065918, -15.474891662597656, -14.985553741455078, -14.4962158203125, -14.006877899169922, -13.517539978027344, -13.028203010559082, -12.538865089416504, -12.049527168273926, -11.560190200805664, -11.070852279663086, -10.581514358520508, -10.09217643737793, -9.602838516235352, -9.11350154876709, -8.624163627624512, -8.134825706481934, -7.645488262176514, -7.156150817871094, -6.666812896728516, -6.177475929260254, -5.688138484954834, -5.198800563812256, -4.709463119506836, -4.220125198364258, -3.730787754058838, -3.241450071334839, -2.75211238861084, -2.2627744674682617, -1.7734367847442627, -1.2840991020202637, -0.7947615385055542, -0.3054238557815552, 0.1839137077331543, 0.6732513904571533, 1.1625890731811523, 1.6519267559051514, 2.1412644386291504, 2.6306021213531494, 3.1199398040771484, 3.6092772483825684, 4.098614692687988, 4.587952613830566, 5.0772905349731445, 5.5666279792785645, 6.055965423583984, 6.5453033447265625, 7.034640789031982, 7.5239787101745605, 8.01331615447998, 8.502654075622559, 8.99199104309082, 9.481328964233398, 9.970666885375977, 10.460003852844238, 10.949341773986816, 11.438679695129395, 11.928016662597656, 12.417354583740234, 12.906692504882812, 13.39603042602539]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 10.0, 8.0, 10.0, 25.0, 47.0, 96.0, 170.0, 365.0, 804.0, 2690.0, 16182.0, 3841798.0, 319259.0, 9438.0, 1943.0, 703.0, 322.0, 174.0, 109.0, 56.0, 27.0, 21.0, 15.0, 9.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.9375, -12.318359375, -11.69921875, -11.080078125, -10.4609375, -9.841796875, -9.22265625, -8.603515625, -7.984375, -7.365234375, -6.74609375, -6.126953125, -5.5078125, -4.888671875, -4.26953125, -3.650390625, -3.03125, -2.412109375, -1.79296875, -1.173828125, -0.5546875, 0.064453125, 0.68359375, 1.302734375, 1.921875, 2.541015625, 3.16015625, 3.779296875, 4.3984375, 5.017578125, 5.63671875, 6.255859375, 6.875, 7.494140625, 8.11328125, 8.732421875, 9.3515625, 9.970703125, 10.58984375, 11.208984375, 11.828125, 12.447265625, 13.06640625, 13.685546875, 14.3046875, 14.923828125, 15.54296875, 16.162109375, 16.78125, 17.400390625, 18.01953125, 18.638671875, 19.2578125, 19.876953125, 20.49609375, 21.115234375, 21.734375, 22.353515625, 22.97265625, 23.591796875, 24.2109375, 24.830078125, 25.44921875, 26.068359375, 26.6875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 6.0, 0.0, 1.0, 0.0, 1.0, 5.0, 6.0, 1.0, 6.0, 8.0, 10.0, 14.0, 12.0, 22.0, 29.0, 28.0, 44.0, 48.0, 48.0, 53.0, 59.0, 44.0, 56.0, 45.0, 48.0, 64.0, 61.0, 49.0, 42.0, 35.0, 34.0, 26.0, 27.0, 20.0, 16.0, 11.0, 8.0, 5.0, 12.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.83203125, -0.8003082275390625, -0.768585205078125, -0.7368621826171875, -0.70513916015625, -0.6734161376953125, -0.641693115234375, -0.6099700927734375, -0.5782470703125, -0.5465240478515625, -0.514801025390625, -0.4830780029296875, -0.45135498046875, -0.4196319580078125, -0.387908935546875, -0.3561859130859375, -0.324462890625, -0.2927398681640625, -0.261016845703125, -0.2292938232421875, -0.19757080078125, -0.1658477783203125, -0.134124755859375, -0.1024017333984375, -0.0706787109375, -0.0389556884765625, -0.007232666015625, 0.0244903564453125, 0.05621337890625, 0.0879364013671875, 0.119659423828125, 0.1513824462890625, 0.18310546875, 0.2148284912109375, 0.246551513671875, 0.2782745361328125, 0.30999755859375, 0.3417205810546875, 0.373443603515625, 0.4051666259765625, 0.4368896484375, 0.4686126708984375, 0.500335693359375, 0.5320587158203125, 0.56378173828125, 0.5955047607421875, 0.627227783203125, 0.6589508056640625, 0.690673828125, 0.7223968505859375, 0.754119873046875, 0.7858428955078125, 0.81756591796875, 0.8492889404296875, 0.881011962890625, 0.9127349853515625, 0.9444580078125, 0.9761810302734375, 1.007904052734375, 1.0396270751953125, 1.07135009765625, 1.1030731201171875, 1.134796142578125, 1.1665191650390625, 1.1982421875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 7.0, 14.0, 13.0, 10.0, 22.0, 26.0, 31.0, 38.0, 53.0, 69.0, 110.0, 144.0, 199.0, 316.0, 443.0, 779.0, 1527.0, 3207.0, 8612.0, 30712.0, 187621.0, 3757744.0, 159987.0, 27808.0, 8010.0, 3057.0, 1439.0, 797.0, 446.0, 284.0, 210.0, 148.0, 123.0, 72.0, 48.0, 49.0, 29.0, 22.0, 19.0, 12.0, 8.0, 9.0, 4.0, 3.0, 6.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-8.03125, -7.8048095703125, -7.578369140625, -7.3519287109375, -7.12548828125, -6.8990478515625, -6.672607421875, -6.4461669921875, -6.2197265625, -5.9932861328125, -5.766845703125, -5.5404052734375, -5.31396484375, -5.0875244140625, -4.861083984375, -4.6346435546875, -4.408203125, -4.1817626953125, -3.955322265625, -3.7288818359375, -3.50244140625, -3.2760009765625, -3.049560546875, -2.8231201171875, -2.5966796875, -2.3702392578125, -2.143798828125, -1.9173583984375, -1.69091796875, -1.4644775390625, -1.238037109375, -1.0115966796875, -0.78515625, -0.5587158203125, -0.332275390625, -0.1058349609375, 0.12060546875, 0.3470458984375, 0.573486328125, 0.7999267578125, 1.0263671875, 1.2528076171875, 1.479248046875, 1.7056884765625, 1.93212890625, 2.1585693359375, 2.385009765625, 2.6114501953125, 2.837890625, 3.0643310546875, 3.290771484375, 3.5172119140625, 3.74365234375, 3.9700927734375, 4.196533203125, 4.4229736328125, 4.6494140625, 4.8758544921875, 5.102294921875, 5.3287353515625, 5.55517578125, 5.7816162109375, 6.008056640625, 6.2344970703125, 6.4609375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 8.0, 12.0, 16.0, 20.0, 29.0, 40.0, 79.0, 179.0, 535.0, 2467.0, 359.0, 140.0, 68.0, 36.0, 22.0, 21.0, 10.0, 9.0, 6.0, 7.0, 3.0, 3.0, 1.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.63671875, -2.549957275390625, -2.46319580078125, -2.376434326171875, -2.2896728515625, -2.202911376953125, -2.11614990234375, -2.029388427734375, -1.942626953125, -1.855865478515625, -1.76910400390625, -1.682342529296875, -1.5955810546875, -1.508819580078125, -1.42205810546875, -1.335296630859375, -1.24853515625, -1.161773681640625, -1.07501220703125, -0.988250732421875, -0.9014892578125, -0.814727783203125, -0.72796630859375, -0.641204833984375, -0.554443359375, -0.467681884765625, -0.38092041015625, -0.294158935546875, -0.2073974609375, -0.120635986328125, -0.03387451171875, 0.052886962890625, 0.1396484375, 0.226409912109375, 0.31317138671875, 0.399932861328125, 0.4866943359375, 0.573455810546875, 0.66021728515625, 0.746978759765625, 0.833740234375, 0.920501708984375, 1.00726318359375, 1.094024658203125, 1.1807861328125, 1.267547607421875, 1.35430908203125, 1.441070556640625, 1.52783203125, 1.614593505859375, 1.70135498046875, 1.788116455078125, 1.8748779296875, 1.961639404296875, 2.04840087890625, 2.135162353515625, 2.221923828125, 2.308685302734375, 2.39544677734375, 2.482208251953125, 2.5689697265625, 2.655731201171875, 2.74249267578125, 2.829254150390625, 2.916015625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 5.0, 2.0, 11.0, 12.0, 26.0, 65.0, 130.0, 214.0, 218.0, 171.0, 80.0, 33.0, 17.0, 4.0, 4.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.114950180053711, -13.449872970581055, -12.784795761108398, -12.119719505310059, -11.454642295837402, -10.789565086364746, -10.124488830566406, -9.45941162109375, -8.794334411621094, -8.129257202148438, -7.4641804695129395, -6.799103736877441, -6.134026527404785, -5.468949317932129, -4.803872585296631, -4.138795852661133, -3.4737186431884766, -2.8086416721343994, -2.1435647010803223, -1.4784877300262451, -0.813410758972168, -0.14833378791809082, 0.5167431831359863, 1.1818199157714844, 1.8468971252441406, 2.5119740962982178, 3.177051067352295, 3.842128038406372, 4.507205009460449, 5.1722822189331055, 5.8373589515686035, 6.502435684204102, 7.167514801025391, 7.832592010498047, 8.497669219970703, 9.162745475769043, 9.8278226852417, 10.492899894714355, 11.157976150512695, 11.823053359985352, 12.488130569458008, 13.153207778930664, 13.81828498840332, 14.48336124420166, 15.148438453674316, 15.813515663146973, 16.478591918945312, 17.14366912841797, 17.808746337890625, 18.47382354736328, 19.138900756835938, 19.803977966308594, 20.46905517578125, 21.134130477905273, 21.79920768737793, 22.464284896850586, 23.129362106323242, 23.7944393157959, 24.459516525268555, 25.12459373474121, 25.789669036865234, 26.45474624633789, 27.119823455810547, 27.784900665283203, 28.44997787475586]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 5.0, 1.0, 2.0, 6.0, 5.0, 11.0, 13.0, 16.0, 15.0, 29.0, 31.0, 32.0, 38.0, 43.0, 39.0, 50.0, 52.0, 51.0, 45.0, 62.0, 61.0, 56.0, 47.0, 45.0, 33.0, 42.0, 24.0, 23.0, 30.0, 21.0, 13.0, 11.0, 13.0, 8.0, 5.0, 6.0, 2.0, 7.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.027642250061035, -5.8280744552612305, -5.628506660461426, -5.428938865661621, -5.229371070861816, -5.029803276062012, -4.830235481262207, -4.630667686462402, -4.431099891662598, -4.231532096862793, -4.031964302062988, -3.8323965072631836, -3.632828712463379, -3.433260917663574, -3.2336928844451904, -3.0341250896453857, -2.834557056427002, -2.6349892616271973, -2.4354214668273926, -2.235853672027588, -2.036285877227783, -1.836717963218689, -1.6371500492095947, -1.43758225440979, -1.2380144596099854, -1.0384466648101807, -0.8388788104057312, -0.6393109560012817, -0.43974316120147705, -0.24017536640167236, -0.040607452392578125, 0.15896034240722656, 0.35852813720703125, 0.5580959320068359, 0.7576637864112854, 0.9572316408157349, 1.1567994356155396, 1.3563672304153442, 1.5559351444244385, 1.7555029392242432, 1.9550707340240479, 2.1546385288238525, 2.3542063236236572, 2.553774356842041, 2.7533421516418457, 2.9529099464416504, 3.152477741241455, 3.3520455360412598, 3.5516133308410645, 3.751181125640869, 3.950748920440674, 4.1503167152404785, 4.349884510040283, 4.549452304840088, 4.749020576477051, 4.9485883712768555, 5.14815616607666, 5.347723960876465, 5.5472917556762695, 5.746859550476074, 5.946427345275879, 6.145995140075684, 6.345562934875488, 6.545130729675293, 6.744698524475098]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 7.0, 7.0, 7.0, 13.0, 23.0, 38.0, 58.0, 123.0, 217.0, 484.0, 1189.0, 3697.0, 17807.0, 141723.0, 701777.0, 156067.0, 19114.0, 3961.0, 1256.0, 485.0, 228.0, 106.0, 65.0, 43.0, 27.0, 16.0, 4.0, 2.0, 9.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-14.53125, -14.1812744140625, -13.831298828125, -13.4813232421875, -13.13134765625, -12.7813720703125, -12.431396484375, -12.0814208984375, -11.7314453125, -11.3814697265625, -11.031494140625, -10.6815185546875, -10.33154296875, -9.9815673828125, -9.631591796875, -9.2816162109375, -8.931640625, -8.5816650390625, -8.231689453125, -7.8817138671875, -7.53173828125, -7.1817626953125, -6.831787109375, -6.4818115234375, -6.1318359375, -5.7818603515625, -5.431884765625, -5.0819091796875, -4.73193359375, -4.3819580078125, -4.031982421875, -3.6820068359375, -3.33203125, -2.9820556640625, -2.632080078125, -2.2821044921875, -1.93212890625, -1.5821533203125, -1.232177734375, -0.8822021484375, -0.5322265625, -0.1822509765625, 0.167724609375, 0.5177001953125, 0.86767578125, 1.2176513671875, 1.567626953125, 1.9176025390625, 2.267578125, 2.6175537109375, 2.967529296875, 3.3175048828125, 3.66748046875, 4.0174560546875, 4.367431640625, 4.7174072265625, 5.0673828125, 5.4173583984375, 5.767333984375, 6.1173095703125, 6.46728515625, 6.8172607421875, 7.167236328125, 7.5172119140625, 7.8671875]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 5.0, 5.0, 6.0, 8.0, 6.0, 23.0, 20.0, 34.0, 28.0, 38.0, 45.0, 48.0, 56.0, 46.0, 66.0, 56.0, 58.0, 49.0, 56.0, 57.0, 37.0, 42.0, 35.0, 37.0, 26.0, 33.0, 19.0, 16.0, 9.0, 10.0, 10.0, 9.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.82861328125, -0.7946395874023438, -0.7606658935546875, -0.7266921997070312, -0.692718505859375, -0.6587448120117188, -0.6247711181640625, -0.5907974243164062, -0.55682373046875, -0.5228500366210938, -0.4888763427734375, -0.45490264892578125, -0.420928955078125, -0.38695526123046875, -0.3529815673828125, -0.31900787353515625, -0.2850341796875, -0.25106048583984375, -0.2170867919921875, -0.18311309814453125, -0.149139404296875, -0.11516571044921875, -0.0811920166015625, -0.04721832275390625, -0.01324462890625, 0.02072906494140625, 0.0547027587890625, 0.08867645263671875, 0.122650146484375, 0.15662384033203125, 0.1905975341796875, 0.22457122802734375, 0.258544921875, 0.29251861572265625, 0.3264923095703125, 0.36046600341796875, 0.394439697265625, 0.42841339111328125, 0.4623870849609375, 0.49636077880859375, 0.53033447265625, 0.5643081665039062, 0.5982818603515625, 0.6322555541992188, 0.666229248046875, 0.7002029418945312, 0.7341766357421875, 0.7681503295898438, 0.8021240234375, 0.8360977172851562, 0.8700714111328125, 0.9040451049804688, 0.938018798828125, 0.9719924926757812, 1.0059661865234375, 1.0399398803710938, 1.07391357421875, 1.1078872680664062, 1.1418609619140625, 1.1758346557617188, 1.209808349609375, 1.2437820434570312, 1.2777557373046875, 1.3117294311523438, 1.345703125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 1.0, 3.0, 4.0, 14.0, 18.0, 16.0, 22.0, 38.0, 56.0, 84.0, 109.0, 183.0, 261.0, 349.0, 557.0, 878.0, 1459.0, 2627.0, 4952.0, 10199.0, 22161.0, 52999.0, 125126.0, 283392.0, 301396.0, 136763.0, 57542.0, 24221.0, 10970.0, 5292.0, 2755.0, 1492.0, 904.0, 554.0, 363.0, 251.0, 167.0, 111.0, 62.0, 56.0, 43.0, 34.0, 20.0, 23.0, 12.0, 7.0, 7.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.84765625, -2.755950927734375, -2.66424560546875, -2.572540283203125, -2.4808349609375, -2.389129638671875, -2.29742431640625, -2.205718994140625, -2.114013671875, -2.022308349609375, -1.93060302734375, -1.838897705078125, -1.7471923828125, -1.655487060546875, -1.56378173828125, -1.472076416015625, -1.38037109375, -1.288665771484375, -1.19696044921875, -1.105255126953125, -1.0135498046875, -0.921844482421875, -0.83013916015625, -0.738433837890625, -0.646728515625, -0.555023193359375, -0.46331787109375, -0.371612548828125, -0.2799072265625, -0.188201904296875, -0.09649658203125, -0.004791259765625, 0.0869140625, 0.178619384765625, 0.27032470703125, 0.362030029296875, 0.4537353515625, 0.545440673828125, 0.63714599609375, 0.728851318359375, 0.820556640625, 0.912261962890625, 1.00396728515625, 1.095672607421875, 1.1873779296875, 1.279083251953125, 1.37078857421875, 1.462493896484375, 1.55419921875, 1.645904541015625, 1.73760986328125, 1.829315185546875, 1.9210205078125, 2.012725830078125, 2.10443115234375, 2.196136474609375, 2.287841796875, 2.379547119140625, 2.47125244140625, 2.562957763671875, 2.6546630859375, 2.746368408203125, 2.83807373046875, 2.929779052734375, 3.021484375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 5.0, 1.0, 1.0, 6.0, 1.0, 10.0, 12.0, 13.0, 12.0, 5.0, 16.0, 13.0, 15.0, 29.0, 39.0, 27.0, 40.0, 40.0, 50.0, 49.0, 50.0, 60.0, 41.0, 38.0, 46.0, 51.0, 48.0, 32.0, 41.0, 33.0, 23.0, 28.0, 24.0, 19.0, 20.0, 10.0, 15.0, 10.0, 6.0, 10.0, 8.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.19140625, -4.056640625, -3.921875, -3.787109375, -3.65234375, -3.517578125, -3.3828125, -3.248046875, -3.11328125, -2.978515625, -2.84375, -2.708984375, -2.57421875, -2.439453125, -2.3046875, -2.169921875, -2.03515625, -1.900390625, -1.765625, -1.630859375, -1.49609375, -1.361328125, -1.2265625, -1.091796875, -0.95703125, -0.822265625, -0.6875, -0.552734375, -0.41796875, -0.283203125, -0.1484375, -0.013671875, 0.12109375, 0.255859375, 0.390625, 0.525390625, 0.66015625, 0.794921875, 0.9296875, 1.064453125, 1.19921875, 1.333984375, 1.46875, 1.603515625, 1.73828125, 1.873046875, 2.0078125, 2.142578125, 2.27734375, 2.412109375, 2.546875, 2.681640625, 2.81640625, 2.951171875, 3.0859375, 3.220703125, 3.35546875, 3.490234375, 3.625, 3.759765625, 3.89453125, 4.029296875, 4.1640625, 4.298828125, 4.43359375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 8.0, 12.0, 12.0, 16.0, 14.0, 29.0, 50.0, 66.0, 105.0, 167.0, 238.0, 414.0, 895.0, 1811.0, 4597.0, 13876.0, 61985.0, 732577.0, 189652.0, 28242.0, 8073.0, 2941.0, 1247.0, 659.0, 302.0, 196.0, 123.0, 82.0, 55.0, 31.0, 23.0, 22.0, 15.0, 6.0, 5.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.73828125, -6.51922607421875, -6.3001708984375, -6.08111572265625, -5.862060546875, -5.64300537109375, -5.4239501953125, -5.20489501953125, -4.98583984375, -4.76678466796875, -4.5477294921875, -4.32867431640625, -4.109619140625, -3.89056396484375, -3.6715087890625, -3.45245361328125, -3.2333984375, -3.01434326171875, -2.7952880859375, -2.57623291015625, -2.357177734375, -2.13812255859375, -1.9190673828125, -1.70001220703125, -1.48095703125, -1.26190185546875, -1.0428466796875, -0.82379150390625, -0.604736328125, -0.38568115234375, -0.1666259765625, 0.05242919921875, 0.271484375, 0.49053955078125, 0.7095947265625, 0.92864990234375, 1.147705078125, 1.36676025390625, 1.5858154296875, 1.80487060546875, 2.02392578125, 2.24298095703125, 2.4620361328125, 2.68109130859375, 2.900146484375, 3.11920166015625, 3.3382568359375, 3.55731201171875, 3.7763671875, 3.99542236328125, 4.2144775390625, 4.43353271484375, 4.652587890625, 4.87164306640625, 5.0906982421875, 5.30975341796875, 5.52880859375, 5.74786376953125, 5.9669189453125, 6.18597412109375, 6.405029296875, 6.62408447265625, 6.8431396484375, 7.06219482421875, 7.28125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 9.0, 10.0, 12.0, 23.0, 51.0, 78.0, 131.0, 366.0, 130.0, 80.0, 47.0, 23.0, 17.0, 12.0, 2.0, 6.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00148773193359375, -0.0014535412192344666, -0.001419350504875183, -0.0013851597905158997, -0.0013509690761566162, -0.0013167783617973328, -0.0012825876474380493, -0.0012483969330787659, -0.0012142062187194824, -0.001180015504360199, -0.0011458247900009155, -0.001111634075641632, -0.0010774433612823486, -0.0010432526469230652, -0.0010090619325637817, -0.0009748712182044983, -0.0009406805038452148, -0.0009064897894859314, -0.000872299075126648, -0.0008381083607673645, -0.0008039176464080811, -0.0007697269320487976, -0.0007355362176895142, -0.0007013455033302307, -0.0006671547889709473, -0.0006329640746116638, -0.0005987733602523804, -0.0005645826458930969, -0.0005303919315338135, -0.00049620121717453, -0.0004620105028152466, -0.00042781978845596313, -0.0003936290740966797, -0.00035943835973739624, -0.0003252476453781128, -0.00029105693101882935, -0.0002568662166595459, -0.00022267550230026245, -0.000188484787940979, -0.00015429407358169556, -0.00012010335922241211, -8.591264486312866e-05, -5.1721930503845215e-05, -1.7531216144561768e-05, 1.665949821472168e-05, 5.085021257400513e-05, 8.504092693328857e-05, 0.00011923164129257202, 0.00015342235565185547, 0.00018761307001113892, 0.00022180378437042236, 0.0002559944987297058, 0.00029018521308898926, 0.0003243759274482727, 0.00035856664180755615, 0.0003927573561668396, 0.00042694807052612305, 0.0004611387848854065, 0.0004953294992446899, 0.0005295202136039734, 0.0005637109279632568, 0.0005979016423225403, 0.0006320923566818237, 0.0006662830710411072, 0.0007004737854003906]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 7.0, 2.0, 14.0, 10.0, 17.0, 25.0, 40.0, 71.0, 125.0, 219.0, 417.0, 912.0, 2112.0, 5688.0, 21778.0, 176540.0, 773864.0, 50869.0, 9961.0, 3213.0, 1344.0, 604.0, 306.0, 165.0, 86.0, 56.0, 29.0, 16.0, 22.0, 13.0, 10.0, 5.0, 7.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-10.8828125, -10.590576171875, -10.29833984375, -10.006103515625, -9.7138671875, -9.421630859375, -9.12939453125, -8.837158203125, -8.544921875, -8.252685546875, -7.96044921875, -7.668212890625, -7.3759765625, -7.083740234375, -6.79150390625, -6.499267578125, -6.20703125, -5.914794921875, -5.62255859375, -5.330322265625, -5.0380859375, -4.745849609375, -4.45361328125, -4.161376953125, -3.869140625, -3.576904296875, -3.28466796875, -2.992431640625, -2.7001953125, -2.407958984375, -2.11572265625, -1.823486328125, -1.53125, -1.239013671875, -0.94677734375, -0.654541015625, -0.3623046875, -0.070068359375, 0.22216796875, 0.514404296875, 0.806640625, 1.098876953125, 1.39111328125, 1.683349609375, 1.9755859375, 2.267822265625, 2.56005859375, 2.852294921875, 3.14453125, 3.436767578125, 3.72900390625, 4.021240234375, 4.3134765625, 4.605712890625, 4.89794921875, 5.190185546875, 5.482421875, 5.774658203125, 6.06689453125, 6.359130859375, 6.6513671875, 6.943603515625, 7.23583984375, 7.528076171875, 7.8203125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 5.0, 4.0, 4.0, 7.0, 10.0, 10.0, 9.0, 10.0, 18.0, 19.0, 20.0, 48.0, 79.0, 165.0, 300.0, 108.0, 61.0, 28.0, 27.0, 14.0, 13.0, 11.0, 7.0, 7.0, 6.0, 3.0, 3.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.125, -9.8302001953125, -9.535400390625, -9.2406005859375, -8.94580078125, -8.6510009765625, -8.356201171875, -8.0614013671875, -7.7666015625, -7.4718017578125, -7.177001953125, -6.8822021484375, -6.58740234375, -6.2926025390625, -5.997802734375, -5.7030029296875, -5.408203125, -5.1134033203125, -4.818603515625, -4.5238037109375, -4.22900390625, -3.9342041015625, -3.639404296875, -3.3446044921875, -3.0498046875, -2.7550048828125, -2.460205078125, -2.1654052734375, -1.87060546875, -1.5758056640625, -1.281005859375, -0.9862060546875, -0.69140625, -0.3966064453125, -0.101806640625, 0.1929931640625, 0.48779296875, 0.7825927734375, 1.077392578125, 1.3721923828125, 1.6669921875, 1.9617919921875, 2.256591796875, 2.5513916015625, 2.84619140625, 3.1409912109375, 3.435791015625, 3.7305908203125, 4.025390625, 4.3201904296875, 4.614990234375, 4.9097900390625, 5.20458984375, 5.4993896484375, 5.794189453125, 6.0889892578125, 6.3837890625, 6.6785888671875, 6.973388671875, 7.2681884765625, 7.56298828125, 7.8577880859375, 8.152587890625, 8.4473876953125, 8.7421875]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 9.0, 18.0, 32.0, 79.0, 160.0, 263.0, 234.0, 127.0, 50.0, 23.0, 8.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.15533447265625, -72.27813720703125, -68.40093231201172, -64.52373504638672, -60.64653015136719, -56.76933288574219, -52.89213180541992, -49.014930725097656, -45.13772964477539, -41.260528564453125, -37.38332748413086, -33.506126403808594, -29.62892723083496, -25.751726150512695, -21.874526977539062, -17.997325897216797, -14.120124816894531, -10.242923736572266, -6.365723609924316, -2.488523483276367, 1.3886775970458984, 5.265878677368164, 9.143077850341797, 13.020278930664062, 16.897480010986328, 20.774681091308594, 24.65188217163086, 28.529081344604492, 32.406280517578125, 36.283485412597656, 40.160682678222656, 44.03788375854492, 47.91508483886719, 51.79228591918945, 55.66948699951172, 59.54668426513672, 63.42388916015625, 67.30108642578125, 71.17828369140625, 75.05548858642578, 78.93269348144531, 82.80989074707031, 86.68709564208984, 90.56429290771484, 94.44149780273438, 98.31869506835938, 102.19589233398438, 106.0730972290039, 109.9502944946289, 113.8274917602539, 117.70469665527344, 121.58189392089844, 125.45909881591797, 129.3363037109375, 133.2135009765625, 137.0906982421875, 140.9678955078125, 144.8450927734375, 148.7222900390625, 152.59950256347656, 156.47669982910156, 160.35389709472656, 164.23109436035156, 168.10830688476562, 171.98550415039062]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 7.0, 0.0, 1.0, 7.0, 6.0, 13.0, 7.0, 14.0, 19.0, 15.0, 19.0, 27.0, 27.0, 34.0, 31.0, 42.0, 34.0, 32.0, 38.0, 36.0, 43.0, 47.0, 39.0, 45.0, 39.0, 39.0, 42.0, 29.0, 25.0, 38.0, 36.0, 31.0, 23.0, 21.0, 22.0, 17.0, 6.0, 17.0, 7.0, 5.0, 10.0, 6.0, 3.0, 2.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-33.76896667480469, -32.675357818603516, -31.581745147705078, -30.488136291503906, -29.3945255279541, -28.300914764404297, -27.207305908203125, -26.11369514465332, -25.020084381103516, -23.92647361755371, -22.832862854003906, -21.739253997802734, -20.64564323425293, -19.552032470703125, -18.458423614501953, -17.36481285095215, -16.271202087402344, -15.177591323852539, -14.08398151397705, -12.990371704101562, -11.896760940551758, -10.803150177001953, -9.709540367126465, -8.615930557250977, -7.522319793701172, -6.428709506988525, -5.335099220275879, -4.241488933563232, -3.147878646850586, -2.0542683601379395, -0.960658073425293, 0.13295221328735352, 1.2265586853027344, 2.320168972015381, 3.4137792587280273, 4.507389545440674, 5.60099983215332, 6.694610118865967, 7.788220405578613, 8.881830215454102, 9.975440979003906, 11.069051742553711, 12.1626615524292, 13.256271362304688, 14.349882125854492, 15.443492889404297, 16.53710174560547, 17.630712509155273, 18.724323272705078, 19.817934036254883, 20.911544799804688, 22.00515365600586, 23.098764419555664, 24.19237518310547, 25.28598403930664, 26.379594802856445, 27.47320556640625, 28.566816329956055, 29.66042709350586, 30.75403594970703, 31.847646713256836, 32.94125747680664, 34.03486633300781, 35.12847900390625, 36.22208786010742]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 3.0, 6.0, 15.0, 18.0, 21.0, 30.0, 38.0, 78.0, 163.0, 281.0, 568.0, 1140.0, 2362.0, 6124.0, 18660.0, 81058.0, 3473173.0, 541970.0, 47660.0, 12669.0, 4521.0, 1815.0, 872.0, 407.0, 230.0, 160.0, 74.0, 48.0, 33.0, 27.0, 17.0, 13.0, 9.0, 5.0, 7.0, 5.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.375, -10.05908203125, -9.7431640625, -9.42724609375, -9.111328125, -8.79541015625, -8.4794921875, -8.16357421875, -7.84765625, -7.53173828125, -7.2158203125, -6.89990234375, -6.583984375, -6.26806640625, -5.9521484375, -5.63623046875, -5.3203125, -5.00439453125, -4.6884765625, -4.37255859375, -4.056640625, -3.74072265625, -3.4248046875, -3.10888671875, -2.79296875, -2.47705078125, -2.1611328125, -1.84521484375, -1.529296875, -1.21337890625, -0.8974609375, -0.58154296875, -0.265625, 0.05029296875, 0.3662109375, 0.68212890625, 0.998046875, 1.31396484375, 1.6298828125, 1.94580078125, 2.26171875, 2.57763671875, 2.8935546875, 3.20947265625, 3.525390625, 3.84130859375, 4.1572265625, 4.47314453125, 4.7890625, 5.10498046875, 5.4208984375, 5.73681640625, 6.052734375, 6.36865234375, 6.6845703125, 7.00048828125, 7.31640625, 7.63232421875, 7.9482421875, 8.26416015625, 8.580078125, 8.89599609375, 9.2119140625, 9.52783203125, 9.84375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 4.0, 4.0, 5.0, 7.0, 9.0, 6.0, 5.0, 11.0, 23.0, 33.0, 29.0, 34.0, 46.0, 43.0, 55.0, 48.0, 57.0, 68.0, 63.0, 52.0, 50.0, 54.0, 45.0, 50.0, 27.0, 41.0, 23.0, 28.0, 24.0, 16.0, 12.0, 6.0, 10.0, 8.0, 5.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.291015625, -1.2422943115234375, -1.193572998046875, -1.1448516845703125, -1.09613037109375, -1.0474090576171875, -0.998687744140625, -0.9499664306640625, -0.9012451171875, -0.8525238037109375, -0.803802490234375, -0.7550811767578125, -0.70635986328125, -0.6576385498046875, -0.608917236328125, -0.5601959228515625, -0.511474609375, -0.4627532958984375, -0.414031982421875, -0.3653106689453125, -0.31658935546875, -0.2678680419921875, -0.219146728515625, -0.1704254150390625, -0.1217041015625, -0.0729827880859375, -0.024261474609375, 0.0244598388671875, 0.07318115234375, 0.1219024658203125, 0.170623779296875, 0.2193450927734375, 0.26806640625, 0.3167877197265625, 0.365509033203125, 0.4142303466796875, 0.46295166015625, 0.5116729736328125, 0.560394287109375, 0.6091156005859375, 0.6578369140625, 0.7065582275390625, 0.755279541015625, 0.8040008544921875, 0.85272216796875, 0.9014434814453125, 0.950164794921875, 0.9988861083984375, 1.047607421875, 1.0963287353515625, 1.145050048828125, 1.1937713623046875, 1.24249267578125, 1.2912139892578125, 1.339935302734375, 1.3886566162109375, 1.4373779296875, 1.4860992431640625, 1.534820556640625, 1.5835418701171875, 1.63226318359375, 1.6809844970703125, 1.729705810546875, 1.7784271240234375, 1.8271484375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 1.0, 8.0, 0.0, 7.0, 8.0, 9.0, 7.0, 9.0, 15.0, 19.0, 29.0, 31.0, 46.0, 57.0, 90.0, 143.0, 203.0, 236.0, 443.0, 660.0, 1014.0, 1914.0, 3500.0, 7041.0, 15543.0, 41236.0, 160763.0, 3227773.0, 604661.0, 80613.0, 25989.0, 10554.0, 5071.0, 2633.0, 1425.0, 838.0, 551.0, 349.0, 259.0, 152.0, 89.0, 80.0, 58.0, 41.0, 33.0, 20.0, 18.0, 14.0, 6.0, 12.0, 7.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-6.62890625, -6.41351318359375, -6.1981201171875, -5.98272705078125, -5.767333984375, -5.55194091796875, -5.3365478515625, -5.12115478515625, -4.90576171875, -4.69036865234375, -4.4749755859375, -4.25958251953125, -4.044189453125, -3.82879638671875, -3.6134033203125, -3.39801025390625, -3.1826171875, -2.96722412109375, -2.7518310546875, -2.53643798828125, -2.321044921875, -2.10565185546875, -1.8902587890625, -1.67486572265625, -1.45947265625, -1.24407958984375, -1.0286865234375, -0.81329345703125, -0.597900390625, -0.38250732421875, -0.1671142578125, 0.04827880859375, 0.263671875, 0.47906494140625, 0.6944580078125, 0.90985107421875, 1.125244140625, 1.34063720703125, 1.5560302734375, 1.77142333984375, 1.98681640625, 2.20220947265625, 2.4176025390625, 2.63299560546875, 2.848388671875, 3.06378173828125, 3.2791748046875, 3.49456787109375, 3.7099609375, 3.92535400390625, 4.1407470703125, 4.35614013671875, 4.571533203125, 4.78692626953125, 5.0023193359375, 5.21771240234375, 5.43310546875, 5.64849853515625, 5.8638916015625, 6.07928466796875, 6.294677734375, 6.51007080078125, 6.7254638671875, 6.94085693359375, 7.15625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 10.0, 7.0, 21.0, 17.0, 28.0, 41.0, 75.0, 152.0, 371.0, 2285.0, 669.0, 180.0, 81.0, 44.0, 26.0, 20.0, 15.0, 10.0, 5.0, 3.0, 5.0, 2.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.4296875, -6.25421142578125, -6.0787353515625, -5.90325927734375, -5.727783203125, -5.55230712890625, -5.3768310546875, -5.20135498046875, -5.02587890625, -4.85040283203125, -4.6749267578125, -4.49945068359375, -4.323974609375, -4.14849853515625, -3.9730224609375, -3.79754638671875, -3.6220703125, -3.44659423828125, -3.2711181640625, -3.09564208984375, -2.920166015625, -2.74468994140625, -2.5692138671875, -2.39373779296875, -2.21826171875, -2.04278564453125, -1.8673095703125, -1.69183349609375, -1.516357421875, -1.34088134765625, -1.1654052734375, -0.98992919921875, -0.814453125, -0.63897705078125, -0.4635009765625, -0.28802490234375, -0.112548828125, 0.06292724609375, 0.2384033203125, 0.41387939453125, 0.58935546875, 0.76483154296875, 0.9403076171875, 1.11578369140625, 1.291259765625, 1.46673583984375, 1.6422119140625, 1.81768798828125, 1.9931640625, 2.16864013671875, 2.3441162109375, 2.51959228515625, 2.695068359375, 2.87054443359375, 3.0460205078125, 3.22149658203125, 3.39697265625, 3.57244873046875, 3.7479248046875, 3.92340087890625, 4.098876953125, 4.27435302734375, 4.4498291015625, 4.62530517578125, 4.80078125]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 13.0, 16.0, 37.0, 77.0, 180.0, 270.0, 225.0, 124.0, 29.0, 12.0, 9.0, 1.0, 0.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.36759567260742, -39.81059265136719, -38.25358581542969, -36.69658279418945, -35.13957977294922, -33.58257293701172, -32.025569915771484, -30.468564987182617, -28.91156005859375, -27.354555130004883, -25.797550201416016, -24.24054718017578, -22.683542251586914, -21.126537322998047, -19.569534301757812, -18.012529373168945, -16.455524444580078, -14.898519515991211, -13.34151554107666, -11.78451156616211, -10.227506637573242, -8.670501708984375, -7.113497734069824, -5.556493759155273, -3.9994888305664062, -2.4424843788146973, -0.8854799270629883, 0.6715245246887207, 2.2285289764404297, 3.7855334281921387, 5.342537879943848, 6.899541854858398, 8.456550598144531, 10.013555526733398, 11.57055950164795, 13.1275634765625, 14.684568405151367, 16.241573333740234, 17.79857635498047, 19.355581283569336, 20.912586212158203, 22.46959114074707, 24.026596069335938, 25.583599090576172, 27.14060401916504, 28.697608947753906, 30.25461196899414, 31.811616897583008, 33.368621826171875, 34.92562484741211, 36.48263168334961, 38.039634704589844, 39.596641540527344, 41.15364456176758, 42.71064758300781, 44.26765441894531, 45.82465744018555, 47.38166046142578, 48.93866729736328, 50.495670318603516, 52.05267333984375, 53.60968017578125, 55.166683197021484, 56.72368621826172, 58.28069305419922]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 5.0, 11.0, 6.0, 10.0, 20.0, 25.0, 19.0, 28.0, 42.0, 45.0, 56.0, 66.0, 65.0, 64.0, 67.0, 62.0, 68.0, 55.0, 47.0, 51.0, 44.0, 30.0, 26.0, 19.0, 15.0, 14.0, 10.0, 13.0, 9.0, 7.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.784072875976562, -16.225439071655273, -15.666804313659668, -15.108170509338379, -14.54953670501709, -13.990901947021484, -13.432268142700195, -12.873634338378906, -12.315000534057617, -11.756366729736328, -11.197731971740723, -10.639098167419434, -10.080464363098145, -9.521829605102539, -8.96319580078125, -8.404561996459961, -7.8459272384643555, -7.287292957305908, -6.728659152984619, -6.170024871826172, -5.611391067504883, -5.0527567863464355, -4.494122505187988, -3.93548846244812, -3.376854419708252, -2.818220376968384, -2.2595863342285156, -1.7009520530700684, -1.1423180103302002, -0.583683967590332, -0.025049686431884766, 0.5335843563079834, 1.0922183990478516, 1.6508524417877197, 2.209486484527588, 2.768120765686035, 3.3267548084259033, 3.8853888511657715, 4.444023132324219, 5.002656936645508, 5.561291217803955, 6.119925498962402, 6.678559303283691, 7.237193584442139, 7.795827865600586, 8.354461669921875, 8.913095474243164, 9.47173023223877, 10.030364036560059, 10.588997840881348, 11.147632598876953, 11.706266403198242, 12.264900207519531, 12.82353401184082, 13.382168769836426, 13.940802574157715, 14.49943733215332, 15.05807113647461, 15.616705894470215, 16.175338745117188, 16.73397445678711, 17.2926082611084, 17.851242065429688, 18.409875869750977, 18.968509674072266]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 6.0, 7.0, 6.0, 8.0, 19.0, 16.0, 46.0, 36.0, 63.0, 91.0, 148.0, 241.0, 387.0, 625.0, 1202.0, 2357.0, 4873.0, 11490.0, 29456.0, 82827.0, 227589.0, 358347.0, 207021.0, 75170.0, 26344.0, 10617.0, 4609.0, 2186.0, 1137.0, 655.0, 366.0, 219.0, 131.0, 71.0, 60.0, 40.0, 24.0, 14.0, 16.0, 12.0, 5.0, 6.0, 3.0, 4.0, 2.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.11328125, -4.927001953125, -4.74072265625, -4.554443359375, -4.3681640625, -4.181884765625, -3.99560546875, -3.809326171875, -3.623046875, -3.436767578125, -3.25048828125, -3.064208984375, -2.8779296875, -2.691650390625, -2.50537109375, -2.319091796875, -2.1328125, -1.946533203125, -1.76025390625, -1.573974609375, -1.3876953125, -1.201416015625, -1.01513671875, -0.828857421875, -0.642578125, -0.456298828125, -0.27001953125, -0.083740234375, 0.1025390625, 0.288818359375, 0.47509765625, 0.661376953125, 0.84765625, 1.033935546875, 1.22021484375, 1.406494140625, 1.5927734375, 1.779052734375, 1.96533203125, 2.151611328125, 2.337890625, 2.524169921875, 2.71044921875, 2.896728515625, 3.0830078125, 3.269287109375, 3.45556640625, 3.641845703125, 3.828125, 4.014404296875, 4.20068359375, 4.386962890625, 4.5732421875, 4.759521484375, 4.94580078125, 5.132080078125, 5.318359375, 5.504638671875, 5.69091796875, 5.877197265625, 6.0634765625, 6.249755859375, 6.43603515625, 6.622314453125, 6.80859375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 5.0, 10.0, 6.0, 9.0, 13.0, 5.0, 12.0, 17.0, 28.0, 25.0, 31.0, 43.0, 51.0, 47.0, 44.0, 52.0, 46.0, 56.0, 61.0, 40.0, 44.0, 32.0, 43.0, 43.0, 35.0, 34.0, 27.0, 28.0, 23.0, 9.0, 13.0, 22.0, 10.0, 6.0, 10.0, 7.0, 4.0, 7.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3251953125, -1.281463623046875, -1.23773193359375, -1.194000244140625, -1.1502685546875, -1.106536865234375, -1.06280517578125, -1.019073486328125, -0.975341796875, -0.931610107421875, -0.88787841796875, -0.844146728515625, -0.8004150390625, -0.756683349609375, -0.71295166015625, -0.669219970703125, -0.62548828125, -0.581756591796875, -0.53802490234375, -0.494293212890625, -0.4505615234375, -0.406829833984375, -0.36309814453125, -0.319366455078125, -0.275634765625, -0.231903076171875, -0.18817138671875, -0.144439697265625, -0.1007080078125, -0.056976318359375, -0.01324462890625, 0.030487060546875, 0.07421875, 0.117950439453125, 0.16168212890625, 0.205413818359375, 0.2491455078125, 0.292877197265625, 0.33660888671875, 0.380340576171875, 0.424072265625, 0.467803955078125, 0.51153564453125, 0.555267333984375, 0.5989990234375, 0.642730712890625, 0.68646240234375, 0.730194091796875, 0.77392578125, 0.817657470703125, 0.86138916015625, 0.905120849609375, 0.9488525390625, 0.992584228515625, 1.03631591796875, 1.080047607421875, 1.123779296875, 1.167510986328125, 1.21124267578125, 1.254974365234375, 1.2987060546875, 1.342437744140625, 1.38616943359375, 1.429901123046875, 1.4736328125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 7.0, 11.0, 12.0, 16.0, 30.0, 50.0, 89.0, 155.0, 250.0, 410.0, 879.0, 2085.0, 5855.0, 19927.0, 89884.0, 404221.0, 404419.0, 90438.0, 19926.0, 5740.0, 2142.0, 906.0, 487.0, 249.0, 161.0, 74.0, 39.0, 41.0, 22.0, 14.0, 7.0, 7.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.9609375, -7.712158203125, -7.46337890625, -7.214599609375, -6.9658203125, -6.717041015625, -6.46826171875, -6.219482421875, -5.970703125, -5.721923828125, -5.47314453125, -5.224365234375, -4.9755859375, -4.726806640625, -4.47802734375, -4.229248046875, -3.98046875, -3.731689453125, -3.48291015625, -3.234130859375, -2.9853515625, -2.736572265625, -2.48779296875, -2.239013671875, -1.990234375, -1.741455078125, -1.49267578125, -1.243896484375, -0.9951171875, -0.746337890625, -0.49755859375, -0.248779296875, 0.0, 0.248779296875, 0.49755859375, 0.746337890625, 0.9951171875, 1.243896484375, 1.49267578125, 1.741455078125, 1.990234375, 2.239013671875, 2.48779296875, 2.736572265625, 2.9853515625, 3.234130859375, 3.48291015625, 3.731689453125, 3.98046875, 4.229248046875, 4.47802734375, 4.726806640625, 4.9755859375, 5.224365234375, 5.47314453125, 5.721923828125, 5.970703125, 6.219482421875, 6.46826171875, 6.717041015625, 6.9658203125, 7.214599609375, 7.46337890625, 7.712158203125, 7.9609375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 5.0, 4.0, 3.0, 1.0, 5.0, 9.0, 11.0, 11.0, 21.0, 21.0, 22.0, 24.0, 22.0, 43.0, 42.0, 41.0, 47.0, 42.0, 64.0, 54.0, 61.0, 48.0, 63.0, 46.0, 49.0, 51.0, 35.0, 30.0, 27.0, 24.0, 19.0, 10.0, 15.0, 16.0, 4.0, 4.0, 5.0, 6.0, 2.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.046875, -5.772216796875, -5.49755859375, -5.222900390625, -4.9482421875, -4.673583984375, -4.39892578125, -4.124267578125, -3.849609375, -3.574951171875, -3.30029296875, -3.025634765625, -2.7509765625, -2.476318359375, -2.20166015625, -1.927001953125, -1.65234375, -1.377685546875, -1.10302734375, -0.828369140625, -0.5537109375, -0.279052734375, -0.00439453125, 0.270263671875, 0.544921875, 0.819580078125, 1.09423828125, 1.368896484375, 1.6435546875, 1.918212890625, 2.19287109375, 2.467529296875, 2.7421875, 3.016845703125, 3.29150390625, 3.566162109375, 3.8408203125, 4.115478515625, 4.39013671875, 4.664794921875, 4.939453125, 5.214111328125, 5.48876953125, 5.763427734375, 6.0380859375, 6.312744140625, 6.58740234375, 6.862060546875, 7.13671875, 7.411376953125, 7.68603515625, 7.960693359375, 8.2353515625, 8.510009765625, 8.78466796875, 9.059326171875, 9.333984375, 9.608642578125, 9.88330078125, 10.157958984375, 10.4326171875, 10.707275390625, 10.98193359375, 11.256591796875, 11.53125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 5.0, 8.0, 9.0, 13.0, 17.0, 46.0, 68.0, 95.0, 137.0, 233.0, 446.0, 753.0, 1447.0, 2841.0, 7017.0, 23913.0, 160078.0, 695762.0, 123158.0, 20418.0, 6471.0, 2598.0, 1296.0, 707.0, 353.0, 220.0, 169.0, 91.0, 64.0, 39.0, 29.0, 13.0, 20.0, 4.0, 8.0, 0.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.8984375, -7.66912841796875, -7.4398193359375, -7.21051025390625, -6.981201171875, -6.75189208984375, -6.5225830078125, -6.29327392578125, -6.06396484375, -5.83465576171875, -5.6053466796875, -5.37603759765625, -5.146728515625, -4.91741943359375, -4.6881103515625, -4.45880126953125, -4.2294921875, -4.00018310546875, -3.7708740234375, -3.54156494140625, -3.312255859375, -3.08294677734375, -2.8536376953125, -2.62432861328125, -2.39501953125, -2.16571044921875, -1.9364013671875, -1.70709228515625, -1.477783203125, -1.24847412109375, -1.0191650390625, -0.78985595703125, -0.560546875, -0.33123779296875, -0.1019287109375, 0.12738037109375, 0.356689453125, 0.58599853515625, 0.8153076171875, 1.04461669921875, 1.27392578125, 1.50323486328125, 1.7325439453125, 1.96185302734375, 2.191162109375, 2.42047119140625, 2.6497802734375, 2.87908935546875, 3.1083984375, 3.33770751953125, 3.5670166015625, 3.79632568359375, 4.025634765625, 4.25494384765625, 4.4842529296875, 4.71356201171875, 4.94287109375, 5.17218017578125, 5.4014892578125, 5.63079833984375, 5.860107421875, 6.08941650390625, 6.3187255859375, 6.54803466796875, 6.77734375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 8.0, 5.0, 6.0, 15.0, 14.0, 24.0, 32.0, 56.0, 75.0, 111.0, 157.0, 150.0, 103.0, 76.0, 52.0, 46.0, 20.0, 15.0, 12.0, 5.0, 3.0, 6.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001087188720703125, -0.0010599493980407715, -0.001032710075378418, -0.0010054707527160645, -0.000978231430053711, -0.0009509921073913574, -0.0009237527847290039, -0.0008965134620666504, -0.0008692741394042969, -0.0008420348167419434, -0.0008147954940795898, -0.0007875561714172363, -0.0007603168487548828, -0.0007330775260925293, -0.0007058382034301758, -0.0006785988807678223, -0.0006513595581054688, -0.0006241202354431152, -0.0005968809127807617, -0.0005696415901184082, -0.0005424022674560547, -0.0005151629447937012, -0.00048792362213134766, -0.00046068429946899414, -0.0004334449768066406, -0.0004062056541442871, -0.0003789663314819336, -0.0003517270088195801, -0.00032448768615722656, -0.00029724836349487305, -0.00027000904083251953, -0.00024276971817016602, -0.0002155303955078125, -0.00018829107284545898, -0.00016105175018310547, -0.00013381242752075195, -0.00010657310485839844, -7.933378219604492e-05, -5.2094459533691406e-05, -2.485513687133789e-05, 2.384185791015625e-06, 2.962350845336914e-05, 5.6862831115722656e-05, 8.410215377807617e-05, 0.00011134147644042969, 0.0001385807991027832, 0.00016582012176513672, 0.00019305944442749023, 0.00022029876708984375, 0.00024753808975219727, 0.0002747774124145508, 0.0003020167350769043, 0.0003292560577392578, 0.00035649538040161133, 0.00038373470306396484, 0.00041097402572631836, 0.0004382133483886719, 0.0004654526710510254, 0.0004926919937133789, 0.0005199313163757324, 0.0005471706390380859, 0.0005744099617004395, 0.000601649284362793, 0.0006288886070251465, 0.0006561279296875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 8.0, 8.0, 9.0, 19.0, 24.0, 57.0, 85.0, 161.0, 359.0, 830.0, 2770.0, 12367.0, 135339.0, 829750.0, 56338.0, 7488.0, 1801.0, 615.0, 253.0, 112.0, 54.0, 23.0, 29.0, 20.0, 10.0, 13.0, 6.0, 7.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3046875, -11.9122314453125, -11.519775390625, -11.1273193359375, -10.73486328125, -10.3424072265625, -9.949951171875, -9.5574951171875, -9.1650390625, -8.7725830078125, -8.380126953125, -7.9876708984375, -7.59521484375, -7.2027587890625, -6.810302734375, -6.4178466796875, -6.025390625, -5.6329345703125, -5.240478515625, -4.8480224609375, -4.45556640625, -4.0631103515625, -3.670654296875, -3.2781982421875, -2.8857421875, -2.4932861328125, -2.100830078125, -1.7083740234375, -1.31591796875, -0.9234619140625, -0.531005859375, -0.1385498046875, 0.25390625, 0.6463623046875, 1.038818359375, 1.4312744140625, 1.82373046875, 2.2161865234375, 2.608642578125, 3.0010986328125, 3.3935546875, 3.7860107421875, 4.178466796875, 4.5709228515625, 4.96337890625, 5.3558349609375, 5.748291015625, 6.1407470703125, 6.533203125, 6.9256591796875, 7.318115234375, 7.7105712890625, 8.10302734375, 8.4954833984375, 8.887939453125, 9.2803955078125, 9.6728515625, 10.0653076171875, 10.457763671875, 10.8502197265625, 11.24267578125, 11.6351318359375, 12.027587890625, 12.4200439453125, 12.8125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 9.0, 4.0, 3.0, 7.0, 4.0, 10.0, 14.0, 19.0, 28.0, 55.0, 70.0, 129.0, 170.0, 148.0, 106.0, 86.0, 39.0, 28.0, 18.0, 12.0, 9.0, 9.0, 8.0, 7.0, 5.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-12.640625, -12.34613037109375, -12.0516357421875, -11.75714111328125, -11.462646484375, -11.16815185546875, -10.8736572265625, -10.57916259765625, -10.28466796875, -9.99017333984375, -9.6956787109375, -9.40118408203125, -9.106689453125, -8.81219482421875, -8.5177001953125, -8.22320556640625, -7.9287109375, -7.63421630859375, -7.3397216796875, -7.04522705078125, -6.750732421875, -6.45623779296875, -6.1617431640625, -5.86724853515625, -5.57275390625, -5.27825927734375, -4.9837646484375, -4.68927001953125, -4.394775390625, -4.10028076171875, -3.8057861328125, -3.51129150390625, -3.216796875, -2.92230224609375, -2.6278076171875, -2.33331298828125, -2.038818359375, -1.74432373046875, -1.4498291015625, -1.15533447265625, -0.86083984375, -0.56634521484375, -0.2718505859375, 0.02264404296875, 0.317138671875, 0.61163330078125, 0.9061279296875, 1.20062255859375, 1.4951171875, 1.78961181640625, 2.0841064453125, 2.37860107421875, 2.673095703125, 2.96759033203125, 3.2620849609375, 3.55657958984375, 3.85107421875, 4.14556884765625, 4.4400634765625, 4.73455810546875, 5.029052734375, 5.32354736328125, 5.6180419921875, 5.91253662109375, 6.20703125]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 8.0, 18.0, 52.0, 143.0, 264.0, 261.0, 141.0, 64.0, 35.0, 6.0, 7.0, 7.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-223.3384552001953, -218.7727508544922, -214.20706176757812, -209.641357421875, -205.07566833496094, -200.5099639892578, -195.94427490234375, -191.37857055664062, -186.81288146972656, -182.24717712402344, -177.68148803710938, -173.11578369140625, -168.5500946044922, -163.98439025878906, -159.418701171875, -154.85299682617188, -150.28729248046875, -145.72158813476562, -141.15589904785156, -136.59019470214844, -132.02450561523438, -127.45880889892578, -122.89311218261719, -118.32740783691406, -113.76171875, -109.1960220336914, -104.63032531738281, -100.06462860107422, -95.49893188476562, -90.93323516845703, -86.36753845214844, -81.80183410644531, -77.23614501953125, -72.67044830322266, -68.10475158691406, -63.53905487060547, -58.973358154296875, -54.40766143798828, -49.84196090698242, -45.27626419067383, -40.710567474365234, -36.14487075805664, -31.579174041748047, -27.01347541809082, -22.447778701782227, -17.882081985473633, -13.316383361816406, -8.750686645507812, -4.184989929199219, 0.3807072639465332, 4.946404457092285, 9.512102127075195, 14.077798843383789, 18.643495559692383, 23.20919418334961, 27.774890899658203, 32.3405876159668, 36.90628433227539, 41.471981048583984, 46.037681579589844, 50.60337829589844, 55.16907501220703, 59.734771728515625, 64.30046844482422, 68.86616516113281]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 8.0, 0.0, 2.0, 5.0, 12.0, 7.0, 7.0, 8.0, 10.0, 15.0, 17.0, 25.0, 26.0, 24.0, 33.0, 28.0, 29.0, 51.0, 42.0, 38.0, 40.0, 47.0, 37.0, 35.0, 48.0, 40.0, 38.0, 50.0, 33.0, 34.0, 33.0, 36.0, 22.0, 23.0, 22.0, 13.0, 13.0, 19.0, 10.0, 4.0, 5.0, 5.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-41.61396789550781, -40.37482833862305, -39.13568878173828, -37.89654541015625, -36.657405853271484, -35.41826629638672, -34.17912673950195, -32.93998718261719, -31.700847625732422, -30.461708068847656, -29.222566604614258, -27.983427047729492, -26.744287490844727, -25.505146026611328, -24.266006469726562, -23.026866912841797, -21.7877254486084, -20.548585891723633, -19.309444427490234, -18.07030487060547, -16.831165313720703, -15.592024803161621, -14.352884292602539, -13.113744735717773, -11.874604225158691, -10.63546371459961, -9.396324157714844, -8.157183647155762, -6.918043613433838, -5.678903579711914, -4.439763069152832, -3.2006235122680664, -1.9614830017089844, -0.722342848777771, 0.5167973041534424, 1.7559375762939453, 2.995077610015869, 4.234217643737793, 5.473358154296875, 6.712497711181641, 7.951638221740723, 9.190778732299805, 10.42991828918457, 11.669058799743652, 12.908199310302734, 14.1473388671875, 15.386479377746582, 16.62561798095703, 17.86475944519043, 19.103899002075195, 20.343040466308594, 21.58218002319336, 22.821319580078125, 24.06045913696289, 25.29960060119629, 26.538740158081055, 27.777881622314453, 29.01702117919922, 30.256162643432617, 31.495302200317383, 32.73444366455078, 33.97358322143555, 35.21272277832031, 36.45186233520508, 37.691001892089844]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 7.0, 11.0, 14.0, 33.0, 60.0, 121.0, 235.0, 721.0, 3661.0, 203980.0, 3979171.0, 4916.0, 829.0, 288.0, 99.0, 60.0, 36.0, 17.0, 14.0, 5.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.9375, -33.941162109375, -32.94482421875, -31.948486328125, -30.9521484375, -29.955810546875, -28.95947265625, -27.963134765625, -26.966796875, -25.970458984375, -24.97412109375, -23.977783203125, -22.9814453125, -21.985107421875, -20.98876953125, -19.992431640625, -18.99609375, -17.999755859375, -17.00341796875, -16.007080078125, -15.0107421875, -14.014404296875, -13.01806640625, -12.021728515625, -11.025390625, -10.029052734375, -9.03271484375, -8.036376953125, -7.0400390625, -6.043701171875, -5.04736328125, -4.051025390625, -3.0546875, -2.058349609375, -1.06201171875, -0.065673828125, 0.9306640625, 1.927001953125, 2.92333984375, 3.919677734375, 4.916015625, 5.912353515625, 6.90869140625, 7.905029296875, 8.9013671875, 9.897705078125, 10.89404296875, 11.890380859375, 12.88671875, 13.883056640625, 14.87939453125, 15.875732421875, 16.8720703125, 17.868408203125, 18.86474609375, 19.861083984375, 20.857421875, 21.853759765625, 22.85009765625, 23.846435546875, 24.8427734375, 25.839111328125, 26.83544921875, 27.831787109375, 28.828125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 3.0, 7.0, 8.0, 8.0, 8.0, 13.0, 12.0, 16.0, 24.0, 40.0, 26.0, 28.0, 44.0, 37.0, 52.0, 50.0, 47.0, 48.0, 52.0, 46.0, 47.0, 50.0, 42.0, 41.0, 31.0, 33.0, 36.0, 32.0, 25.0, 25.0, 11.0, 17.0, 13.0, 3.0, 7.0, 2.0, 4.0, 6.0, 4.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6865234375, -1.6273651123046875, -1.568206787109375, -1.5090484619140625, -1.44989013671875, -1.3907318115234375, -1.331573486328125, -1.2724151611328125, -1.2132568359375, -1.1540985107421875, -1.094940185546875, -1.0357818603515625, -0.97662353515625, -0.9174652099609375, -0.858306884765625, -0.7991485595703125, -0.739990234375, -0.6808319091796875, -0.621673583984375, -0.5625152587890625, -0.50335693359375, -0.4441986083984375, -0.385040283203125, -0.3258819580078125, -0.2667236328125, -0.2075653076171875, -0.148406982421875, -0.0892486572265625, -0.03009033203125, 0.0290679931640625, 0.088226318359375, 0.1473846435546875, 0.20654296875, 0.2657012939453125, 0.324859619140625, 0.3840179443359375, 0.44317626953125, 0.5023345947265625, 0.561492919921875, 0.6206512451171875, 0.6798095703125, 0.7389678955078125, 0.798126220703125, 0.8572845458984375, 0.91644287109375, 0.9756011962890625, 1.034759521484375, 1.0939178466796875, 1.153076171875, 1.2122344970703125, 1.271392822265625, 1.3305511474609375, 1.38970947265625, 1.4488677978515625, 1.508026123046875, 1.5671844482421875, 1.6263427734375, 1.6855010986328125, 1.744659423828125, 1.8038177490234375, 1.86297607421875, 1.9221343994140625, 1.981292724609375, 2.0404510498046875, 2.099609375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 2.0, 8.0, 5.0, 7.0, 16.0, 25.0, 35.0, 36.0, 57.0, 97.0, 168.0, 286.0, 501.0, 985.0, 2117.0, 6057.0, 28502.0, 3534160.0, 586681.0, 24729.0, 5567.0, 2014.0, 955.0, 477.0, 299.0, 182.0, 88.0, 68.0, 40.0, 36.0, 23.0, 22.0, 10.0, 3.0, 4.0, 6.0, 6.0, 2.0, 3.0, 4.0, 1.0, 0.0, 3.0, 2.0], "bins": [-13.1875, -12.840087890625, -12.49267578125, -12.145263671875, -11.7978515625, -11.450439453125, -11.10302734375, -10.755615234375, -10.408203125, -10.060791015625, -9.71337890625, -9.365966796875, -9.0185546875, -8.671142578125, -8.32373046875, -7.976318359375, -7.62890625, -7.281494140625, -6.93408203125, -6.586669921875, -6.2392578125, -5.891845703125, -5.54443359375, -5.197021484375, -4.849609375, -4.502197265625, -4.15478515625, -3.807373046875, -3.4599609375, -3.112548828125, -2.76513671875, -2.417724609375, -2.0703125, -1.722900390625, -1.37548828125, -1.028076171875, -0.6806640625, -0.333251953125, 0.01416015625, 0.361572265625, 0.708984375, 1.056396484375, 1.40380859375, 1.751220703125, 2.0986328125, 2.446044921875, 2.79345703125, 3.140869140625, 3.48828125, 3.835693359375, 4.18310546875, 4.530517578125, 4.8779296875, 5.225341796875, 5.57275390625, 5.920166015625, 6.267578125, 6.614990234375, 6.96240234375, 7.309814453125, 7.6572265625, 8.004638671875, 8.35205078125, 8.699462890625, 9.046875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 4.0, 2.0, 1.0, 2.0, 3.0, 6.0, 10.0, 21.0, 26.0, 46.0, 119.0, 544.0, 2972.0, 164.0, 70.0, 19.0, 26.0, 15.0, 8.0, 8.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 5.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2392578125, -1.1806488037109375, -1.122039794921875, -1.0634307861328125, -1.00482177734375, -0.9462127685546875, -0.887603759765625, -0.8289947509765625, -0.7703857421875, -0.7117767333984375, -0.653167724609375, -0.5945587158203125, -0.53594970703125, -0.4773406982421875, -0.418731689453125, -0.3601226806640625, -0.301513671875, -0.2429046630859375, -0.184295654296875, -0.1256866455078125, -0.06707763671875, -0.0084686279296875, 0.050140380859375, 0.1087493896484375, 0.1673583984375, 0.2259674072265625, 0.284576416015625, 0.3431854248046875, 0.40179443359375, 0.4604034423828125, 0.519012451171875, 0.5776214599609375, 0.63623046875, 0.6948394775390625, 0.753448486328125, 0.8120574951171875, 0.87066650390625, 0.9292755126953125, 0.987884521484375, 1.0464935302734375, 1.1051025390625, 1.1637115478515625, 1.222320556640625, 1.2809295654296875, 1.33953857421875, 1.3981475830078125, 1.456756591796875, 1.5153656005859375, 1.573974609375, 1.6325836181640625, 1.691192626953125, 1.7498016357421875, 1.80841064453125, 1.8670196533203125, 1.925628662109375, 1.9842376708984375, 2.0428466796875, 2.1014556884765625, 2.160064697265625, 2.2186737060546875, 2.27728271484375, 2.3358917236328125, 2.394500732421875, 2.4531097412109375, 2.51171875]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 6.0, 10.0, 20.0, 29.0, 102.0, 162.0, 206.0, 168.0, 141.0, 73.0, 37.0, 19.0, 13.0, 6.0, 5.0, 4.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.58432388305664, -8.231667518615723, -7.8790106773376465, -7.5263543128967285, -7.173697471618652, -6.821041107177734, -6.468384742736816, -6.11572790145874, -5.763071060180664, -5.410414695739746, -5.05775785446167, -4.705101490020752, -4.352444648742676, -3.999788284301758, -3.6471316814422607, -3.2944750785827637, -2.9418187141418457, -2.5891621112823486, -2.2365055084228516, -1.883849024772644, -1.531192421913147, -1.17853581905365, -0.8258793354034424, -0.4732227325439453, -0.12056612968444824, 0.23209044337272644, 0.5847470164299011, 0.9374035596847534, 1.2900601625442505, 1.6427167654037476, 1.995373249053955, 2.348029851913452, 2.700686454772949, 3.0533430576324463, 3.4059996604919434, 3.7586560249328613, 4.1113128662109375, 4.4639692306518555, 4.816625595092773, 5.16928243637085, 5.521939277648926, 5.874595642089844, 6.22725248336792, 6.579908847808838, 6.932565689086914, 7.285222053527832, 7.63787841796875, 7.990535259246826, 8.343191146850586, 8.695847511291504, 9.048503875732422, 9.401161193847656, 9.753817558288574, 10.106473922729492, 10.45913028717041, 10.811786651611328, 11.164443969726562, 11.51710033416748, 11.869756698608398, 12.222414016723633, 12.57507038116455, 12.927726745605469, 13.280383110046387, 13.633039474487305, 13.985696792602539]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 8.0, 5.0, 9.0, 14.0, 19.0, 20.0, 22.0, 28.0, 32.0, 36.0, 39.0, 36.0, 37.0, 54.0, 58.0, 54.0, 53.0, 69.0, 54.0, 47.0, 40.0, 42.0, 52.0, 36.0, 29.0, 24.0, 26.0, 15.0, 6.0, 10.0, 7.0, 6.0, 3.0, 2.0, 2.0, 7.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.750594139099121, -3.610170841217041, -3.469747304916382, -3.3293240070343018, -3.1889004707336426, -3.0484771728515625, -2.9080538749694824, -2.7676305770874023, -2.627207040786743, -2.486783742904663, -2.346360206604004, -2.205936908721924, -2.0655136108398438, -1.9250900745391846, -1.7846667766571045, -1.6442433595657349, -1.5038199424743652, -1.3633965253829956, -1.222973108291626, -1.082549810409546, -0.9421263933181763, -0.8017029762268066, -0.6612796187400818, -0.5208562612533569, -0.3804328441619873, -0.24000945687294006, -0.09958606958389282, 0.04083731770515442, 0.18126070499420166, 0.3216841220855713, 0.46210747957229614, 0.602530837059021, 0.7429537773132324, 0.883377194404602, 1.0238006114959717, 1.1642239093780518, 1.3046473264694214, 1.445070743560791, 1.585494041442871, 1.7259174585342407, 1.8663408756256104, 2.0067641735076904, 2.1471877098083496, 2.2876110076904297, 2.4280343055725098, 2.568457841873169, 2.708881139755249, 2.849304676055908, 2.9897279739379883, 3.1301512718200684, 3.2705748081207275, 3.4109981060028076, 3.551421642303467, 3.691844940185547, 3.832268238067627, 3.972691535949707, 4.113115310668945, 4.253538608551025, 4.3939619064331055, 4.534385681152344, 4.674808979034424, 4.815232276916504, 4.955655574798584, 5.096078872680664, 5.236502170562744]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 0.0, 1.0, 6.0, 1.0, 4.0, 6.0, 2.0, 7.0, 13.0, 15.0, 35.0, 33.0, 56.0, 82.0, 156.0, 283.0, 491.0, 1015.0, 2291.0, 5724.0, 16174.0, 48071.0, 144949.0, 326761.0, 307576.0, 128270.0, 42907.0, 14317.0, 5268.0, 2065.0, 912.0, 453.0, 225.0, 133.0, 89.0, 59.0, 32.0, 23.0, 13.0, 10.0, 8.0, 8.0, 6.0, 6.0, 1.0, 0.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.4140625, -6.22509765625, -6.0361328125, -5.84716796875, -5.658203125, -5.46923828125, -5.2802734375, -5.09130859375, -4.90234375, -4.71337890625, -4.5244140625, -4.33544921875, -4.146484375, -3.95751953125, -3.7685546875, -3.57958984375, -3.390625, -3.20166015625, -3.0126953125, -2.82373046875, -2.634765625, -2.44580078125, -2.2568359375, -2.06787109375, -1.87890625, -1.68994140625, -1.5009765625, -1.31201171875, -1.123046875, -0.93408203125, -0.7451171875, -0.55615234375, -0.3671875, -0.17822265625, 0.0107421875, 0.19970703125, 0.388671875, 0.57763671875, 0.7666015625, 0.95556640625, 1.14453125, 1.33349609375, 1.5224609375, 1.71142578125, 1.900390625, 2.08935546875, 2.2783203125, 2.46728515625, 2.65625, 2.84521484375, 3.0341796875, 3.22314453125, 3.412109375, 3.60107421875, 3.7900390625, 3.97900390625, 4.16796875, 4.35693359375, 4.5458984375, 4.73486328125, 4.923828125, 5.11279296875, 5.3017578125, 5.49072265625, 5.6796875]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 2.0, 0.0, 1.0, 5.0, 5.0, 14.0, 15.0, 8.0, 18.0, 14.0, 20.0, 22.0, 29.0, 43.0, 46.0, 43.0, 35.0, 35.0, 55.0, 54.0, 48.0, 42.0, 53.0, 49.0, 46.0, 45.0, 42.0, 33.0, 37.0, 36.0, 21.0, 5.0, 21.0, 14.0, 16.0, 5.0, 8.0, 5.0, 4.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.986328125, -1.923583984375, -1.86083984375, -1.798095703125, -1.7353515625, -1.672607421875, -1.60986328125, -1.547119140625, -1.484375, -1.421630859375, -1.35888671875, -1.296142578125, -1.2333984375, -1.170654296875, -1.10791015625, -1.045166015625, -0.982421875, -0.919677734375, -0.85693359375, -0.794189453125, -0.7314453125, -0.668701171875, -0.60595703125, -0.543212890625, -0.48046875, -0.417724609375, -0.35498046875, -0.292236328125, -0.2294921875, -0.166748046875, -0.10400390625, -0.041259765625, 0.021484375, 0.084228515625, 0.14697265625, 0.209716796875, 0.2724609375, 0.335205078125, 0.39794921875, 0.460693359375, 0.5234375, 0.586181640625, 0.64892578125, 0.711669921875, 0.7744140625, 0.837158203125, 0.89990234375, 0.962646484375, 1.025390625, 1.088134765625, 1.15087890625, 1.213623046875, 1.2763671875, 1.339111328125, 1.40185546875, 1.464599609375, 1.52734375, 1.590087890625, 1.65283203125, 1.715576171875, 1.7783203125, 1.841064453125, 1.90380859375, 1.966552734375, 2.029296875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 6.0, 4.0, 14.0, 8.0, 14.0, 16.0, 34.0, 42.0, 55.0, 55.0, 78.0, 120.0, 176.0, 258.0, 428.0, 774.0, 1516.0, 3786.0, 10828.0, 37556.0, 143977.0, 456819.0, 285354.0, 74250.0, 20668.0, 6592.0, 2473.0, 1018.0, 600.0, 325.0, 202.0, 155.0, 95.0, 56.0, 58.0, 41.0, 23.0, 29.0, 23.0, 7.0, 5.0, 6.0, 4.0, 2.0, 3.0, 3.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-7.34765625, -7.1300048828125, -6.912353515625, -6.6947021484375, -6.47705078125, -6.2593994140625, -6.041748046875, -5.8240966796875, -5.6064453125, -5.3887939453125, -5.171142578125, -4.9534912109375, -4.73583984375, -4.5181884765625, -4.300537109375, -4.0828857421875, -3.865234375, -3.6475830078125, -3.429931640625, -3.2122802734375, -2.99462890625, -2.7769775390625, -2.559326171875, -2.3416748046875, -2.1240234375, -1.9063720703125, -1.688720703125, -1.4710693359375, -1.25341796875, -1.0357666015625, -0.818115234375, -0.6004638671875, -0.3828125, -0.1651611328125, 0.052490234375, 0.2701416015625, 0.48779296875, 0.7054443359375, 0.923095703125, 1.1407470703125, 1.3583984375, 1.5760498046875, 1.793701171875, 2.0113525390625, 2.22900390625, 2.4466552734375, 2.664306640625, 2.8819580078125, 3.099609375, 3.3172607421875, 3.534912109375, 3.7525634765625, 3.97021484375, 4.1878662109375, 4.405517578125, 4.6231689453125, 4.8408203125, 5.0584716796875, 5.276123046875, 5.4937744140625, 5.71142578125, 5.9290771484375, 6.146728515625, 6.3643798828125, 6.58203125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 6.0, 7.0, 8.0, 6.0, 9.0, 17.0, 10.0, 12.0, 20.0, 13.0, 26.0, 32.0, 22.0, 35.0, 31.0, 41.0, 45.0, 51.0, 38.0, 48.0, 36.0, 45.0, 55.0, 45.0, 44.0, 50.0, 32.0, 32.0, 29.0, 38.0, 19.0, 18.0, 12.0, 16.0, 8.0, 12.0, 10.0, 4.0, 6.0, 5.0, 4.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.8046875, -10.48779296875, -10.1708984375, -9.85400390625, -9.537109375, -9.22021484375, -8.9033203125, -8.58642578125, -8.26953125, -7.95263671875, -7.6357421875, -7.31884765625, -7.001953125, -6.68505859375, -6.3681640625, -6.05126953125, -5.734375, -5.41748046875, -5.1005859375, -4.78369140625, -4.466796875, -4.14990234375, -3.8330078125, -3.51611328125, -3.19921875, -2.88232421875, -2.5654296875, -2.24853515625, -1.931640625, -1.61474609375, -1.2978515625, -0.98095703125, -0.6640625, -0.34716796875, -0.0302734375, 0.28662109375, 0.603515625, 0.92041015625, 1.2373046875, 1.55419921875, 1.87109375, 2.18798828125, 2.5048828125, 2.82177734375, 3.138671875, 3.45556640625, 3.7724609375, 4.08935546875, 4.40625, 4.72314453125, 5.0400390625, 5.35693359375, 5.673828125, 5.99072265625, 6.3076171875, 6.62451171875, 6.94140625, 7.25830078125, 7.5751953125, 7.89208984375, 8.208984375, 8.52587890625, 8.8427734375, 9.15966796875, 9.4765625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 5.0, 10.0, 7.0, 10.0, 19.0, 43.0, 59.0, 117.0, 193.0, 449.0, 1061.0, 3125.0, 13067.0, 73894.0, 502704.0, 384655.0, 54675.0, 10038.0, 2687.0, 900.0, 384.0, 211.0, 97.0, 65.0, 32.0, 15.0, 17.0, 5.0, 1.0, 2.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.52734375, -4.38092041015625, -4.2344970703125, -4.08807373046875, -3.941650390625, -3.79522705078125, -3.6488037109375, -3.50238037109375, -3.35595703125, -3.20953369140625, -3.0631103515625, -2.91668701171875, -2.770263671875, -2.62384033203125, -2.4774169921875, -2.33099365234375, -2.1845703125, -2.03814697265625, -1.8917236328125, -1.74530029296875, -1.598876953125, -1.45245361328125, -1.3060302734375, -1.15960693359375, -1.01318359375, -0.86676025390625, -0.7203369140625, -0.57391357421875, -0.427490234375, -0.28106689453125, -0.1346435546875, 0.01177978515625, 0.158203125, 0.30462646484375, 0.4510498046875, 0.59747314453125, 0.743896484375, 0.89031982421875, 1.0367431640625, 1.18316650390625, 1.32958984375, 1.47601318359375, 1.6224365234375, 1.76885986328125, 1.915283203125, 2.06170654296875, 2.2081298828125, 2.35455322265625, 2.5009765625, 2.64739990234375, 2.7938232421875, 2.94024658203125, 3.086669921875, 3.23309326171875, 3.3795166015625, 3.52593994140625, 3.67236328125, 3.81878662109375, 3.9652099609375, 4.11163330078125, 4.258056640625, 4.40447998046875, 4.5509033203125, 4.69732666015625, 4.84375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 0.0, 5.0, 1.0, 3.0, 8.0, 8.0, 9.0, 7.0, 20.0, 23.0, 31.0, 28.0, 40.0, 62.0, 62.0, 61.0, 60.0, 79.0, 73.0, 84.0, 67.0, 57.0, 50.0, 37.0, 21.0, 23.0, 27.0, 19.0, 10.0, 6.0, 7.0, 2.0, 4.0, 2.0, 1.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00039958953857421875, -0.0003860965371131897, -0.00037260353565216064, -0.0003591105341911316, -0.00034561753273010254, -0.0003321245312690735, -0.00031863152980804443, -0.0003051385283470154, -0.00029164552688598633, -0.0002781525254249573, -0.0002646595239639282, -0.00025116652250289917, -0.00023767352104187012, -0.00022418051958084106, -0.000210687518119812, -0.00019719451665878296, -0.0001837015151977539, -0.00017020851373672485, -0.0001567155122756958, -0.00014322251081466675, -0.0001297295093536377, -0.00011623650789260864, -0.00010274350643157959, -8.925050497055054e-05, -7.575750350952148e-05, -6.226450204849243e-05, -4.877150058746338e-05, -3.5278499126434326e-05, -2.1785497665405273e-05, -8.29249620437622e-06, 5.200505256652832e-06, 1.8693506717681885e-05, 3.218650817871094e-05, 4.567950963973999e-05, 5.917251110076904e-05, 7.26655125617981e-05, 8.615851402282715e-05, 9.96515154838562e-05, 0.00011314451694488525, 0.0001266375184059143, 0.00014013051986694336, 0.0001536235213279724, 0.00016711652278900146, 0.00018060952425003052, 0.00019410252571105957, 0.00020759552717208862, 0.00022108852863311768, 0.00023458153009414673, 0.0002480745315551758, 0.00026156753301620483, 0.0002750605344772339, 0.00028855353593826294, 0.000302046537399292, 0.00031553953886032104, 0.0003290325403213501, 0.00034252554178237915, 0.0003560185432434082, 0.00036951154470443726, 0.0003830045461654663, 0.00039649754762649536, 0.0004099905490875244, 0.00042348355054855347, 0.0004369765520095825, 0.00045046955347061157, 0.0004639625549316406]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 0.0, 2.0, 2.0, 3.0, 10.0, 11.0, 15.0, 29.0, 52.0, 58.0, 100.0, 155.0, 257.0, 436.0, 940.0, 2129.0, 5577.0, 18772.0, 87141.0, 438911.0, 391602.0, 76262.0, 16998.0, 5062.0, 2026.0, 863.0, 457.0, 269.0, 138.0, 88.0, 67.0, 45.0, 29.0, 15.0, 8.0, 3.0, 8.0, 3.0, 1.0, 3.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.81640625, -3.68902587890625, -3.5616455078125, -3.43426513671875, -3.306884765625, -3.17950439453125, -3.0521240234375, -2.92474365234375, -2.79736328125, -2.66998291015625, -2.5426025390625, -2.41522216796875, -2.287841796875, -2.16046142578125, -2.0330810546875, -1.90570068359375, -1.7783203125, -1.65093994140625, -1.5235595703125, -1.39617919921875, -1.268798828125, -1.14141845703125, -1.0140380859375, -0.88665771484375, -0.75927734375, -0.63189697265625, -0.5045166015625, -0.37713623046875, -0.249755859375, -0.12237548828125, 0.0050048828125, 0.13238525390625, 0.259765625, 0.38714599609375, 0.5145263671875, 0.64190673828125, 0.769287109375, 0.89666748046875, 1.0240478515625, 1.15142822265625, 1.27880859375, 1.40618896484375, 1.5335693359375, 1.66094970703125, 1.788330078125, 1.91571044921875, 2.0430908203125, 2.17047119140625, 2.2978515625, 2.42523193359375, 2.5526123046875, 2.67999267578125, 2.807373046875, 2.93475341796875, 3.0621337890625, 3.18951416015625, 3.31689453125, 3.44427490234375, 3.5716552734375, 3.69903564453125, 3.826416015625, 3.95379638671875, 4.0811767578125, 4.20855712890625, 4.3359375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 5.0, 7.0, 2.0, 9.0, 11.0, 11.0, 22.0, 20.0, 38.0, 67.0, 68.0, 91.0, 104.0, 89.0, 101.0, 78.0, 72.0, 55.0, 45.0, 25.0, 33.0, 15.0, 14.0, 2.0, 8.0, 5.0, 6.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.328125, -6.14501953125, -5.9619140625, -5.77880859375, -5.595703125, -5.41259765625, -5.2294921875, -5.04638671875, -4.86328125, -4.68017578125, -4.4970703125, -4.31396484375, -4.130859375, -3.94775390625, -3.7646484375, -3.58154296875, -3.3984375, -3.21533203125, -3.0322265625, -2.84912109375, -2.666015625, -2.48291015625, -2.2998046875, -2.11669921875, -1.93359375, -1.75048828125, -1.5673828125, -1.38427734375, -1.201171875, -1.01806640625, -0.8349609375, -0.65185546875, -0.46875, -0.28564453125, -0.1025390625, 0.08056640625, 0.263671875, 0.44677734375, 0.6298828125, 0.81298828125, 0.99609375, 1.17919921875, 1.3623046875, 1.54541015625, 1.728515625, 1.91162109375, 2.0947265625, 2.27783203125, 2.4609375, 2.64404296875, 2.8271484375, 3.01025390625, 3.193359375, 3.37646484375, 3.5595703125, 3.74267578125, 3.92578125, 4.10888671875, 4.2919921875, 4.47509765625, 4.658203125, 4.84130859375, 5.0244140625, 5.20751953125, 5.390625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 4.0, 7.0, 8.0, 20.0, 31.0, 59.0, 102.0, 122.0, 166.0, 141.0, 117.0, 91.0, 61.0, 34.0, 19.0, 9.0, 7.0, 5.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.46234130859375, -81.20864868164062, -78.9549560546875, -76.70126342773438, -74.44757080078125, -72.19387817382812, -69.940185546875, -67.68649291992188, -65.43280029296875, -63.179107666015625, -60.9254150390625, -58.671722412109375, -56.41802978515625, -54.164337158203125, -51.910640716552734, -49.65694808959961, -47.40325164794922, -45.149559020996094, -42.89586639404297, -40.642173767089844, -38.38848114013672, -36.134788513183594, -33.8810920715332, -31.627399444580078, -29.373706817626953, -27.120014190673828, -24.866321563720703, -22.612627029418945, -20.35893440246582, -18.105241775512695, -15.851548194885254, -13.597854614257812, -11.344161987304688, -9.090469360351562, -6.836775779724121, -4.583082675933838, -2.3293895721435547, -0.07569694519042969, 2.1779966354370117, 4.431690216064453, 6.685382843017578, 8.939075469970703, 11.192769050598145, 13.446462631225586, 15.700155258178711, 17.953847885131836, 20.207542419433594, 22.46123504638672, 24.714927673339844, 26.96862030029297, 29.222312927246094, 31.47600746154785, 33.729698181152344, 35.98339080810547, 38.23708724975586, 40.490779876708984, 42.74447250366211, 44.998165130615234, 47.25185775756836, 49.505550384521484, 51.759246826171875, 54.012939453125, 56.266632080078125, 58.52032470703125, 60.774017333984375]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 6.0, 3.0, 5.0, 6.0, 14.0, 12.0, 17.0, 21.0, 19.0, 17.0, 31.0, 29.0, 28.0, 29.0, 40.0, 28.0, 41.0, 45.0, 53.0, 36.0, 44.0, 37.0, 52.0, 46.0, 41.0, 43.0, 35.0, 42.0, 24.0, 24.0, 15.0, 26.0, 13.0, 12.0, 12.0, 11.0, 13.0, 4.0, 3.0, 5.0, 2.0, 3.0, 5.0, 3.0, 1.0, 2.0, 2.0, 2.0], "bins": [-51.33143615722656, -49.90367126464844, -48.47590637207031, -47.04814147949219, -45.62037658691406, -44.19261169433594, -42.76484680175781, -41.33708190917969, -39.90931701660156, -38.48155212402344, -37.05378723144531, -35.62602233886719, -34.19825744628906, -32.77049255371094, -31.342727661132812, -29.914962768554688, -28.487199783325195, -27.05943489074707, -25.631669998168945, -24.20390510559082, -22.776140213012695, -21.34837532043457, -19.920612335205078, -18.492847442626953, -17.065082550048828, -15.637317657470703, -14.209552764892578, -12.781787872314453, -11.354022979736328, -9.926258087158203, -8.498494148254395, -7.0707292556762695, -5.642963409423828, -4.215198516845703, -2.7874338626861572, -1.3596692085266113, 0.06809568405151367, 1.4958605766296387, 2.9236249923706055, 4.3513898849487305, 5.7791547775268555, 7.2069196701049805, 8.634684562683105, 10.062448501586914, 11.490213394165039, 12.917978286743164, 14.345743179321289, 15.773508071899414, 17.20127296447754, 18.629037857055664, 20.05680274963379, 21.484567642211914, 22.91233253479004, 24.340097427368164, 25.767860412597656, 27.19562530517578, 28.623390197753906, 30.05115509033203, 31.478919982910156, 32.90668487548828, 34.334449768066406, 35.76221466064453, 37.189979553222656, 38.61774444580078, 40.045509338378906]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 5.0, 9.0, 12.0, 11.0, 16.0, 25.0, 36.0, 41.0, 74.0, 115.0, 200.0, 333.0, 483.0, 953.0, 1884.0, 4805.0, 18507.0, 527524.0, 3608668.0, 20927.0, 5229.0, 2030.0, 997.0, 541.0, 317.0, 216.0, 105.0, 78.0, 46.0, 24.0, 25.0, 13.0, 8.0, 6.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.609375, -8.30224609375, -7.9951171875, -7.68798828125, -7.380859375, -7.07373046875, -6.7666015625, -6.45947265625, -6.15234375, -5.84521484375, -5.5380859375, -5.23095703125, -4.923828125, -4.61669921875, -4.3095703125, -4.00244140625, -3.6953125, -3.38818359375, -3.0810546875, -2.77392578125, -2.466796875, -2.15966796875, -1.8525390625, -1.54541015625, -1.23828125, -0.93115234375, -0.6240234375, -0.31689453125, -0.009765625, 0.29736328125, 0.6044921875, 0.91162109375, 1.21875, 1.52587890625, 1.8330078125, 2.14013671875, 2.447265625, 2.75439453125, 3.0615234375, 3.36865234375, 3.67578125, 3.98291015625, 4.2900390625, 4.59716796875, 4.904296875, 5.21142578125, 5.5185546875, 5.82568359375, 6.1328125, 6.43994140625, 6.7470703125, 7.05419921875, 7.361328125, 7.66845703125, 7.9755859375, 8.28271484375, 8.58984375, 8.89697265625, 9.2041015625, 9.51123046875, 9.818359375, 10.12548828125, 10.4326171875, 10.73974609375, 11.046875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 3.0, 6.0, 7.0, 5.0, 6.0, 8.0, 20.0, 23.0, 13.0, 18.0, 19.0, 30.0, 30.0, 29.0, 41.0, 46.0, 40.0, 46.0, 64.0, 34.0, 53.0, 49.0, 47.0, 49.0, 51.0, 39.0, 31.0, 30.0, 23.0, 20.0, 24.0, 19.0, 15.0, 13.0, 16.0, 6.0, 10.0, 2.0, 6.0, 5.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.009765625, -1.9471435546875, -1.884521484375, -1.8218994140625, -1.75927734375, -1.6966552734375, -1.634033203125, -1.5714111328125, -1.5087890625, -1.4461669921875, -1.383544921875, -1.3209228515625, -1.25830078125, -1.1956787109375, -1.133056640625, -1.0704345703125, -1.0078125, -0.9451904296875, -0.882568359375, -0.8199462890625, -0.75732421875, -0.6947021484375, -0.632080078125, -0.5694580078125, -0.5068359375, -0.4442138671875, -0.381591796875, -0.3189697265625, -0.25634765625, -0.1937255859375, -0.131103515625, -0.0684814453125, -0.005859375, 0.0567626953125, 0.119384765625, 0.1820068359375, 0.24462890625, 0.3072509765625, 0.369873046875, 0.4324951171875, 0.4951171875, 0.5577392578125, 0.620361328125, 0.6829833984375, 0.74560546875, 0.8082275390625, 0.870849609375, 0.9334716796875, 0.99609375, 1.0587158203125, 1.121337890625, 1.1839599609375, 1.24658203125, 1.3092041015625, 1.371826171875, 1.4344482421875, 1.4970703125, 1.5596923828125, 1.622314453125, 1.6849365234375, 1.74755859375, 1.8101806640625, 1.872802734375, 1.9354248046875, 1.998046875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 4.0, 8.0, 2.0, 3.0, 3.0, 11.0, 9.0, 13.0, 21.0, 27.0, 47.0, 50.0, 60.0, 90.0, 124.0, 160.0, 258.0, 328.0, 500.0, 749.0, 1212.0, 2011.0, 3789.0, 8433.0, 24123.0, 127028.0, 3830960.0, 149077.0, 26473.0, 8833.0, 3991.0, 2119.0, 1278.0, 731.0, 505.0, 352.0, 237.0, 174.0, 133.0, 95.0, 67.0, 49.0, 41.0, 36.0, 23.0, 10.0, 8.0, 12.0, 4.0, 10.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-5.19140625, -5.015625, -4.83984375, -4.6640625, -4.48828125, -4.3125, -4.13671875, -3.9609375, -3.78515625, -3.609375, -3.43359375, -3.2578125, -3.08203125, -2.90625, -2.73046875, -2.5546875, -2.37890625, -2.203125, -2.02734375, -1.8515625, -1.67578125, -1.5, -1.32421875, -1.1484375, -0.97265625, -0.796875, -0.62109375, -0.4453125, -0.26953125, -0.09375, 0.08203125, 0.2578125, 0.43359375, 0.609375, 0.78515625, 0.9609375, 1.13671875, 1.3125, 1.48828125, 1.6640625, 1.83984375, 2.015625, 2.19140625, 2.3671875, 2.54296875, 2.71875, 2.89453125, 3.0703125, 3.24609375, 3.421875, 3.59765625, 3.7734375, 3.94921875, 4.125, 4.30078125, 4.4765625, 4.65234375, 4.828125, 5.00390625, 5.1796875, 5.35546875, 5.53125, 5.70703125, 5.8828125, 6.05859375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 6.0, 2.0, 6.0, 4.0, 12.0, 13.0, 20.0, 37.0, 94.0, 306.0, 3155.0, 230.0, 97.0, 36.0, 23.0, 11.0, 14.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9638671875, -1.8971405029296875, -1.830413818359375, -1.7636871337890625, -1.69696044921875, -1.6302337646484375, -1.563507080078125, -1.4967803955078125, -1.4300537109375, -1.3633270263671875, -1.296600341796875, -1.2298736572265625, -1.16314697265625, -1.0964202880859375, -1.029693603515625, -0.9629669189453125, -0.896240234375, -0.8295135498046875, -0.762786865234375, -0.6960601806640625, -0.62933349609375, -0.5626068115234375, -0.495880126953125, -0.4291534423828125, -0.3624267578125, -0.2957000732421875, -0.228973388671875, -0.1622467041015625, -0.09552001953125, -0.0287933349609375, 0.037933349609375, 0.1046600341796875, 0.17138671875, 0.2381134033203125, 0.304840087890625, 0.3715667724609375, 0.43829345703125, 0.5050201416015625, 0.571746826171875, 0.6384735107421875, 0.7052001953125, 0.7719268798828125, 0.838653564453125, 0.9053802490234375, 0.97210693359375, 1.0388336181640625, 1.105560302734375, 1.1722869873046875, 1.239013671875, 1.3057403564453125, 1.372467041015625, 1.4391937255859375, 1.50592041015625, 1.5726470947265625, 1.639373779296875, 1.7061004638671875, 1.7728271484375, 1.8395538330078125, 1.906280517578125, 1.9730072021484375, 2.03973388671875, 2.1064605712890625, 2.173187255859375, 2.2399139404296875, 2.306640625]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 6.0, 4.0, 6.0, 9.0, 10.0, 24.0, 30.0, 40.0, 45.0, 64.0, 81.0, 101.0, 112.0, 116.0, 98.0, 82.0, 68.0, 25.0, 35.0, 13.0, 13.0, 5.0, 7.0, 1.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.7738471031188965, -5.586650848388672, -5.399454593658447, -5.212258338928223, -5.02506160736084, -4.837865352630615, -4.650669097900391, -4.463472843170166, -4.276276588439941, -4.089080333709717, -3.901884078979492, -3.7146875858306885, -3.527491331100464, -3.3402950763702393, -3.1530985832214355, -2.965902328491211, -2.7787060737609863, -2.5915098190307617, -2.404313564300537, -2.2171170711517334, -2.029920816421509, -1.8427245616912842, -1.65552818775177, -1.4683318138122559, -1.2811355590820312, -1.0939393043518066, -0.9067429304122925, -0.7195466160774231, -0.5323503017425537, -0.3451539874076843, -0.15795767307281494, 0.02923870086669922, 0.21643495559692383, 0.4036312699317932, 0.5908275842666626, 0.778023898601532, 0.9652202129364014, 1.152416467666626, 1.3396128416061401, 1.5268092155456543, 1.714005470275879, 1.9012017250061035, 2.088397979736328, 2.275594472885132, 2.4627907276153564, 2.649986982345581, 2.8371834754943848, 3.0243797302246094, 3.211575984954834, 3.3987722396850586, 3.585968494415283, 3.773164987564087, 3.9603612422943115, 4.147557735443115, 4.33475399017334, 4.5219502449035645, 4.709146499633789, 4.896342754364014, 5.083539009094238, 5.270735263824463, 5.4579315185546875, 5.64512825012207, 5.832324504852295, 6.0195207595825195, 6.206717014312744]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 5.0, 8.0, 8.0, 7.0, 15.0, 14.0, 10.0, 12.0, 23.0, 37.0, 22.0, 35.0, 28.0, 35.0, 28.0, 36.0, 38.0, 43.0, 59.0, 45.0, 53.0, 43.0, 39.0, 34.0, 34.0, 29.0, 34.0, 38.0, 31.0, 19.0, 19.0, 18.0, 17.0, 16.0, 11.0, 15.0, 15.0, 5.0, 9.0, 6.0, 4.0, 2.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-3.4429473876953125, -3.337775945663452, -3.232604503631592, -3.1274330615997314, -3.022261619567871, -2.9170899391174316, -2.8119187355041504, -2.706747055053711, -2.6015756130218506, -2.4964041709899902, -2.39123272895813, -2.2860612869262695, -2.180889844894409, -2.075718402862549, -1.970546841621399, -1.865375280380249, -1.7602039575576782, -1.6550325155258179, -1.5498610734939575, -1.4446895122528076, -1.3395180702209473, -1.234346628189087, -1.1291751861572266, -1.0240037441253662, -0.9188322424888611, -0.8136608004570007, -0.7084892988204956, -0.6033178567886353, -0.4981463849544525, -0.3929749131202698, -0.2878034710884094, -0.1826319694519043, -0.07746052742004395, 0.027710936963558197, 0.13288240134716034, 0.23805385828018188, 0.3432253301143646, 0.44839680194854736, 0.5535682439804077, 0.6587397456169128, 0.7639111876487732, 0.8690826296806335, 0.9742541313171387, 1.079425573348999, 1.1845970153808594, 1.2897684574127197, 1.39493989944458, 1.50011146068573, 1.6052829027175903, 1.7104543447494507, 1.815625786781311, 1.920797348022461, 2.0259687900543213, 2.1311402320861816, 2.236311674118042, 2.3414831161499023, 2.4466545581817627, 2.551826000213623, 2.6569974422454834, 2.7621688842773438, 2.867340326309204, 2.9725117683410645, 3.077683448791504, 3.1828548908233643, 3.2880263328552246]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 0.0, 4.0, 13.0, 14.0, 16.0, 18.0, 32.0, 41.0, 68.0, 133.0, 232.0, 432.0, 922.0, 2220.0, 5901.0, 17478.0, 61141.0, 217873.0, 430403.0, 221831.0, 61832.0, 17772.0, 6041.0, 2224.0, 880.0, 470.0, 242.0, 124.0, 81.0, 47.0, 28.0, 12.0, 13.0, 8.0, 4.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1953125, -5.0130615234375, -4.830810546875, -4.6485595703125, -4.46630859375, -4.2840576171875, -4.101806640625, -3.9195556640625, -3.7373046875, -3.5550537109375, -3.372802734375, -3.1905517578125, -3.00830078125, -2.8260498046875, -2.643798828125, -2.4615478515625, -2.279296875, -2.0970458984375, -1.914794921875, -1.7325439453125, -1.55029296875, -1.3680419921875, -1.185791015625, -1.0035400390625, -0.8212890625, -0.6390380859375, -0.456787109375, -0.2745361328125, -0.09228515625, 0.0899658203125, 0.272216796875, 0.4544677734375, 0.63671875, 0.8189697265625, 1.001220703125, 1.1834716796875, 1.36572265625, 1.5479736328125, 1.730224609375, 1.9124755859375, 2.0947265625, 2.2769775390625, 2.459228515625, 2.6414794921875, 2.82373046875, 3.0059814453125, 3.188232421875, 3.3704833984375, 3.552734375, 3.7349853515625, 3.917236328125, 4.0994873046875, 4.28173828125, 4.4639892578125, 4.646240234375, 4.8284912109375, 5.0107421875, 5.1929931640625, 5.375244140625, 5.5574951171875, 5.73974609375, 5.9219970703125, 6.104248046875, 6.2864990234375, 6.46875]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 6.0, 1.0, 5.0, 11.0, 11.0, 9.0, 16.0, 23.0, 7.0, 21.0, 24.0, 26.0, 31.0, 37.0, 36.0, 39.0, 59.0, 41.0, 47.0, 50.0, 40.0, 41.0, 44.0, 54.0, 38.0, 47.0, 32.0, 28.0, 29.0, 21.0, 18.0, 16.0, 16.0, 19.0, 12.0, 9.0, 8.0, 5.0, 4.0, 5.0, 4.0, 4.0, 1.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9384765625, -1.8778839111328125, -1.817291259765625, -1.7566986083984375, -1.69610595703125, -1.6355133056640625, -1.574920654296875, -1.5143280029296875, -1.4537353515625, -1.3931427001953125, -1.332550048828125, -1.2719573974609375, -1.21136474609375, -1.1507720947265625, -1.090179443359375, -1.0295867919921875, -0.968994140625, -0.9084014892578125, -0.847808837890625, -0.7872161865234375, -0.72662353515625, -0.6660308837890625, -0.605438232421875, -0.5448455810546875, -0.4842529296875, -0.4236602783203125, -0.363067626953125, -0.3024749755859375, -0.24188232421875, -0.1812896728515625, -0.120697021484375, -0.0601043701171875, 0.00048828125, 0.0610809326171875, 0.121673583984375, 0.1822662353515625, 0.24285888671875, 0.3034515380859375, 0.364044189453125, 0.4246368408203125, 0.4852294921875, 0.5458221435546875, 0.606414794921875, 0.6670074462890625, 0.72760009765625, 0.7881927490234375, 0.848785400390625, 0.9093780517578125, 0.969970703125, 1.0305633544921875, 1.091156005859375, 1.1517486572265625, 1.21234130859375, 1.2729339599609375, 1.333526611328125, 1.3941192626953125, 1.4547119140625, 1.5153045654296875, 1.575897216796875, 1.6364898681640625, 1.69708251953125, 1.7576751708984375, 1.818267822265625, 1.8788604736328125, 1.939453125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 4.0, 3.0, 4.0, 2.0, 2.0, 7.0, 12.0, 15.0, 10.0, 29.0, 25.0, 26.0, 46.0, 69.0, 94.0, 139.0, 220.0, 348.0, 557.0, 1055.0, 1873.0, 4289.0, 11851.0, 39909.0, 177040.0, 514017.0, 223432.0, 49405.0, 13992.0, 5072.0, 2226.0, 1074.0, 603.0, 365.0, 213.0, 152.0, 120.0, 64.0, 47.0, 32.0, 27.0, 21.0, 19.0, 18.0, 11.0, 4.0, 3.0, 6.0, 0.0, 7.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-6.11328125, -5.919677734375, -5.72607421875, -5.532470703125, -5.3388671875, -5.145263671875, -4.95166015625, -4.758056640625, -4.564453125, -4.370849609375, -4.17724609375, -3.983642578125, -3.7900390625, -3.596435546875, -3.40283203125, -3.209228515625, -3.015625, -2.822021484375, -2.62841796875, -2.434814453125, -2.2412109375, -2.047607421875, -1.85400390625, -1.660400390625, -1.466796875, -1.273193359375, -1.07958984375, -0.885986328125, -0.6923828125, -0.498779296875, -0.30517578125, -0.111572265625, 0.08203125, 0.275634765625, 0.46923828125, 0.662841796875, 0.8564453125, 1.050048828125, 1.24365234375, 1.437255859375, 1.630859375, 1.824462890625, 2.01806640625, 2.211669921875, 2.4052734375, 2.598876953125, 2.79248046875, 2.986083984375, 3.1796875, 3.373291015625, 3.56689453125, 3.760498046875, 3.9541015625, 4.147705078125, 4.34130859375, 4.534912109375, 4.728515625, 4.922119140625, 5.11572265625, 5.309326171875, 5.5029296875, 5.696533203125, 5.89013671875, 6.083740234375, 6.27734375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 4.0, 1.0, 2.0, 0.0, 1.0, 5.0, 1.0, 1.0, 9.0, 7.0, 6.0, 11.0, 11.0, 10.0, 19.0, 20.0, 20.0, 33.0, 34.0, 35.0, 30.0, 28.0, 40.0, 37.0, 44.0, 37.0, 51.0, 46.0, 39.0, 42.0, 49.0, 36.0, 30.0, 45.0, 33.0, 37.0, 32.0, 27.0, 18.0, 13.0, 9.0, 13.0, 12.0, 10.0, 7.0, 4.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-9.1328125, -8.842041015625, -8.55126953125, -8.260498046875, -7.9697265625, -7.678955078125, -7.38818359375, -7.097412109375, -6.806640625, -6.515869140625, -6.22509765625, -5.934326171875, -5.6435546875, -5.352783203125, -5.06201171875, -4.771240234375, -4.48046875, -4.189697265625, -3.89892578125, -3.608154296875, -3.3173828125, -3.026611328125, -2.73583984375, -2.445068359375, -2.154296875, -1.863525390625, -1.57275390625, -1.281982421875, -0.9912109375, -0.700439453125, -0.40966796875, -0.118896484375, 0.171875, 0.462646484375, 0.75341796875, 1.044189453125, 1.3349609375, 1.625732421875, 1.91650390625, 2.207275390625, 2.498046875, 2.788818359375, 3.07958984375, 3.370361328125, 3.6611328125, 3.951904296875, 4.24267578125, 4.533447265625, 4.82421875, 5.114990234375, 5.40576171875, 5.696533203125, 5.9873046875, 6.278076171875, 6.56884765625, 6.859619140625, 7.150390625, 7.441162109375, 7.73193359375, 8.022705078125, 8.3134765625, 8.604248046875, 8.89501953125, 9.185791015625, 9.4765625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 6.0, 13.0, 22.0, 11.0, 22.0, 43.0, 75.0, 141.0, 297.0, 689.0, 1893.0, 6455.0, 35683.0, 741490.0, 238710.0, 16937.0, 3838.0, 1214.0, 486.0, 216.0, 121.0, 78.0, 44.0, 23.0, 14.0, 10.0, 5.0, 5.0, 2.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.7578125, -7.5213623046875, -7.284912109375, -7.0484619140625, -6.81201171875, -6.5755615234375, -6.339111328125, -6.1026611328125, -5.8662109375, -5.6297607421875, -5.393310546875, -5.1568603515625, -4.92041015625, -4.6839599609375, -4.447509765625, -4.2110595703125, -3.974609375, -3.7381591796875, -3.501708984375, -3.2652587890625, -3.02880859375, -2.7923583984375, -2.555908203125, -2.3194580078125, -2.0830078125, -1.8465576171875, -1.610107421875, -1.3736572265625, -1.13720703125, -0.9007568359375, -0.664306640625, -0.4278564453125, -0.19140625, 0.0450439453125, 0.281494140625, 0.5179443359375, 0.75439453125, 0.9908447265625, 1.227294921875, 1.4637451171875, 1.7001953125, 1.9366455078125, 2.173095703125, 2.4095458984375, 2.64599609375, 2.8824462890625, 3.118896484375, 3.3553466796875, 3.591796875, 3.8282470703125, 4.064697265625, 4.3011474609375, 4.53759765625, 4.7740478515625, 5.010498046875, 5.2469482421875, 5.4833984375, 5.7198486328125, 5.956298828125, 6.1927490234375, 6.42919921875, 6.6656494140625, 6.902099609375, 7.1385498046875, 7.375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 1.0, 2.0, 2.0, 7.0, 10.0, 9.0, 21.0, 28.0, 36.0, 75.0, 136.0, 193.0, 179.0, 124.0, 74.0, 35.0, 22.0, 11.0, 10.0, 6.0, 4.0, 1.0, 1.0, 4.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0009584426879882812, -0.0009292364120483398, -0.0009000301361083984, -0.000870823860168457, -0.0008416175842285156, -0.0008124113082885742, -0.0007832050323486328, -0.0007539987564086914, -0.00072479248046875, -0.0006955862045288086, -0.0006663799285888672, -0.0006371736526489258, -0.0006079673767089844, -0.000578761100769043, -0.0005495548248291016, -0.0005203485488891602, -0.0004911422729492188, -0.00046193599700927734, -0.00043272972106933594, -0.00040352344512939453, -0.0003743171691894531, -0.0003451108932495117, -0.0003159046173095703, -0.0002866983413696289, -0.0002574920654296875, -0.0002282857894897461, -0.0001990795135498047, -0.00016987323760986328, -0.00014066696166992188, -0.00011146068572998047, -8.225440979003906e-05, -5.3048133850097656e-05, -2.384185791015625e-05, 5.364418029785156e-06, 3.457069396972656e-05, 6.377696990966797e-05, 9.298324584960938e-05, 0.00012218952178955078, 0.0001513957977294922, 0.0001806020736694336, 0.000209808349609375, 0.0002390146255493164, 0.0002682209014892578, 0.0002974271774291992, 0.0003266334533691406, 0.00035583972930908203, 0.00038504600524902344, 0.00041425228118896484, 0.00044345855712890625, 0.00047266483306884766, 0.0005018711090087891, 0.0005310773849487305, 0.0005602836608886719, 0.0005894899368286133, 0.0006186962127685547, 0.0006479024887084961, 0.0006771087646484375, 0.0007063150405883789, 0.0007355213165283203, 0.0007647275924682617, 0.0007939338684082031, 0.0008231401443481445, 0.0008523464202880859, 0.0008815526962280273, 0.0009107589721679688]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 13.0, 13.0, 25.0, 45.0, 115.0, 263.0, 887.0, 6173.0, 210433.0, 815232.0, 13177.0, 1513.0, 354.0, 153.0, 72.0, 43.0, 23.0, 8.0, 9.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.6796875, -12.2972412109375, -11.914794921875, -11.5323486328125, -11.14990234375, -10.7674560546875, -10.385009765625, -10.0025634765625, -9.6201171875, -9.2376708984375, -8.855224609375, -8.4727783203125, -8.09033203125, -7.7078857421875, -7.325439453125, -6.9429931640625, -6.560546875, -6.1781005859375, -5.795654296875, -5.4132080078125, -5.03076171875, -4.6483154296875, -4.265869140625, -3.8834228515625, -3.5009765625, -3.1185302734375, -2.736083984375, -2.3536376953125, -1.97119140625, -1.5887451171875, -1.206298828125, -0.8238525390625, -0.44140625, -0.0589599609375, 0.323486328125, 0.7059326171875, 1.08837890625, 1.4708251953125, 1.853271484375, 2.2357177734375, 2.6181640625, 3.0006103515625, 3.383056640625, 3.7655029296875, 4.14794921875, 4.5303955078125, 4.912841796875, 5.2952880859375, 5.677734375, 6.0601806640625, 6.442626953125, 6.8250732421875, 7.20751953125, 7.5899658203125, 7.972412109375, 8.3548583984375, 8.7373046875, 9.1197509765625, 9.502197265625, 9.8846435546875, 10.26708984375, 10.6495361328125, 11.031982421875, 11.4144287109375, 11.796875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 4.0, 7.0, 4.0, 10.0, 16.0, 20.0, 30.0, 36.0, 56.0, 65.0, 71.0, 108.0, 100.0, 91.0, 85.0, 75.0, 50.0, 35.0, 32.0, 28.0, 12.0, 10.0, 15.0, 10.0, 7.0, 6.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.947265625, -3.804351806640625, -3.66143798828125, -3.518524169921875, -3.3756103515625, -3.232696533203125, -3.08978271484375, -2.946868896484375, -2.803955078125, -2.661041259765625, -2.51812744140625, -2.375213623046875, -2.2322998046875, -2.089385986328125, -1.94647216796875, -1.803558349609375, -1.66064453125, -1.517730712890625, -1.37481689453125, -1.231903076171875, -1.0889892578125, -0.946075439453125, -0.80316162109375, -0.660247802734375, -0.517333984375, -0.374420166015625, -0.23150634765625, -0.088592529296875, 0.0543212890625, 0.197235107421875, 0.34014892578125, 0.483062744140625, 0.6259765625, 0.768890380859375, 0.91180419921875, 1.054718017578125, 1.1976318359375, 1.340545654296875, 1.48345947265625, 1.626373291015625, 1.769287109375, 1.912200927734375, 2.05511474609375, 2.198028564453125, 2.3409423828125, 2.483856201171875, 2.62677001953125, 2.769683837890625, 2.91259765625, 3.055511474609375, 3.19842529296875, 3.341339111328125, 3.4842529296875, 3.627166748046875, 3.77008056640625, 3.912994384765625, 4.055908203125, 4.198822021484375, 4.34173583984375, 4.484649658203125, 4.6275634765625, 4.770477294921875, 4.91339111328125, 5.056304931640625, 5.19921875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 14.0, 27.0, 57.0, 117.0, 183.0, 189.0, 173.0, 111.0, 70.0, 26.0, 14.0, 6.0, 3.0, 2.0, 0.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-98.72518920898438, -95.59812927246094, -92.4710693359375, -89.34400939941406, -86.21694946289062, -83.08988189697266, -79.96282196044922, -76.83576202392578, -73.70870208740234, -70.5816421508789, -67.45458221435547, -64.32752227783203, -61.20045852661133, -58.07339859008789, -54.94633483886719, -51.81927490234375, -48.69221496582031, -45.565155029296875, -42.43809509277344, -39.311031341552734, -36.1839714050293, -33.05691146850586, -29.92984962463379, -26.80278778076172, -23.67572784423828, -20.548667907714844, -17.421606063842773, -14.29454517364502, -11.167484283447266, -8.040423393249512, -4.913362503051758, -1.7863006591796875, 1.3407516479492188, 4.467812538146973, 7.594873428344727, 10.72193431854248, 13.848995208740234, 16.976055145263672, 20.103116989135742, 23.230178833007812, 26.35723876953125, 29.484298706054688, 32.611358642578125, 35.73842239379883, 38.865482330322266, 41.9925422668457, 45.119606018066406, 48.246665954589844, 51.37372589111328, 54.50078582763672, 57.627845764160156, 60.75490951538086, 63.8819694519043, 67.009033203125, 70.13609313964844, 73.26315307617188, 76.39021301269531, 79.51727294921875, 82.64433288574219, 85.77139282226562, 88.89845275878906, 92.02552032470703, 95.15258026123047, 98.2796401977539, 101.40670013427734]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 3.0, 2.0, 3.0, 6.0, 4.0, 8.0, 6.0, 8.0, 8.0, 15.0, 15.0, 17.0, 16.0, 24.0, 27.0, 28.0, 29.0, 38.0, 30.0, 36.0, 47.0, 54.0, 47.0, 50.0, 52.0, 41.0, 47.0, 36.0, 48.0, 36.0, 35.0, 31.0, 27.0, 20.0, 20.0, 18.0, 15.0, 14.0, 12.0, 8.0, 8.0, 4.0, 1.0, 7.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-46.74864959716797, -45.36009216308594, -43.97153091430664, -42.58297348022461, -41.19441223144531, -39.80585479736328, -38.41729736328125, -37.02873611450195, -35.64017868041992, -34.25162124633789, -32.863059997558594, -31.474502563476562, -30.0859432220459, -28.697383880615234, -27.30882453918457, -25.920265197753906, -24.531705856323242, -23.143146514892578, -21.754587173461914, -20.36602783203125, -18.97747039794922, -17.588911056518555, -16.20035171508789, -14.811793327331543, -13.423233985900879, -12.034674644470215, -10.646116256713867, -9.257556915283203, -7.868998050689697, -6.480439186096191, -5.091879844665527, -3.7033214569091797, -2.3147621154785156, -0.9262031316757202, 0.4623558521270752, 1.8509149551391602, 3.239473819732666, 4.628032684326172, 6.016592025756836, 7.405150413513184, 8.793709754943848, 10.182269096374512, 11.57082748413086, 12.959386825561523, 14.347946166992188, 15.736504554748535, 17.125064849853516, 18.513622283935547, 19.90218162536621, 21.290740966796875, 22.67930030822754, 24.067859649658203, 25.456417083740234, 26.8449764251709, 28.233535766601562, 29.622093200683594, 31.01065444946289, 32.39921188354492, 33.78777313232422, 35.17633056640625, 36.56489181518555, 37.95344924926758, 39.342010498046875, 40.730567932128906, 42.11912536621094]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 8.0, 5.0, 8.0, 15.0, 10.0, 17.0, 31.0, 32.0, 60.0, 102.0, 144.0, 202.0, 413.0, 671.0, 1410.0, 3134.0, 9521.0, 76718.0, 4058191.0, 32537.0, 6267.0, 2255.0, 1018.0, 607.0, 370.0, 195.0, 103.0, 79.0, 55.0, 34.0, 13.0, 13.0, 12.0, 9.0, 7.0, 5.0, 2.0, 6.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.359375, -8.0535888671875, -7.747802734375, -7.4420166015625, -7.13623046875, -6.8304443359375, -6.524658203125, -6.2188720703125, -5.9130859375, -5.6072998046875, -5.301513671875, -4.9957275390625, -4.68994140625, -4.3841552734375, -4.078369140625, -3.7725830078125, -3.466796875, -3.1610107421875, -2.855224609375, -2.5494384765625, -2.24365234375, -1.9378662109375, -1.632080078125, -1.3262939453125, -1.0205078125, -0.7147216796875, -0.408935546875, -0.1031494140625, 0.20263671875, 0.5084228515625, 0.814208984375, 1.1199951171875, 1.42578125, 1.7315673828125, 2.037353515625, 2.3431396484375, 2.64892578125, 2.9547119140625, 3.260498046875, 3.5662841796875, 3.8720703125, 4.1778564453125, 4.483642578125, 4.7894287109375, 5.09521484375, 5.4010009765625, 5.706787109375, 6.0125732421875, 6.318359375, 6.6241455078125, 6.929931640625, 7.2357177734375, 7.54150390625, 7.8472900390625, 8.153076171875, 8.4588623046875, 8.7646484375, 9.0704345703125, 9.376220703125, 9.6820068359375, 9.98779296875, 10.2935791015625, 10.599365234375, 10.9051513671875, 11.2109375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 6.0, 4.0, 8.0, 5.0, 6.0, 7.0, 9.0, 12.0, 18.0, 21.0, 21.0, 33.0, 41.0, 26.0, 52.0, 52.0, 45.0, 59.0, 52.0, 58.0, 52.0, 48.0, 54.0, 48.0, 44.0, 27.0, 39.0, 31.0, 34.0, 19.0, 19.0, 13.0, 11.0, 7.0, 8.0, 6.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.279296875, -2.20892333984375, -2.1385498046875, -2.06817626953125, -1.997802734375, -1.92742919921875, -1.8570556640625, -1.78668212890625, -1.71630859375, -1.64593505859375, -1.5755615234375, -1.50518798828125, -1.434814453125, -1.36444091796875, -1.2940673828125, -1.22369384765625, -1.1533203125, -1.08294677734375, -1.0125732421875, -0.94219970703125, -0.871826171875, -0.80145263671875, -0.7310791015625, -0.66070556640625, -0.59033203125, -0.51995849609375, -0.4495849609375, -0.37921142578125, -0.308837890625, -0.23846435546875, -0.1680908203125, -0.09771728515625, -0.02734375, 0.04302978515625, 0.1134033203125, 0.18377685546875, 0.254150390625, 0.32452392578125, 0.3948974609375, 0.46527099609375, 0.53564453125, 0.60601806640625, 0.6763916015625, 0.74676513671875, 0.817138671875, 0.88751220703125, 0.9578857421875, 1.02825927734375, 1.0986328125, 1.16900634765625, 1.2393798828125, 1.30975341796875, 1.380126953125, 1.45050048828125, 1.5208740234375, 1.59124755859375, 1.66162109375, 1.73199462890625, 1.8023681640625, 1.87274169921875, 1.943115234375, 2.01348876953125, 2.0838623046875, 2.15423583984375, 2.224609375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 4.0, 7.0, 13.0, 13.0, 8.0, 29.0, 34.0, 37.0, 64.0, 77.0, 97.0, 165.0, 205.0, 268.0, 369.0, 569.0, 970.0, 1674.0, 3415.0, 8000.0, 24551.0, 154927.0, 3916195.0, 56730.0, 14418.0, 5391.0, 2458.0, 1308.0, 709.0, 426.0, 314.0, 243.0, 186.0, 125.0, 78.0, 60.0, 50.0, 40.0, 22.0, 14.0, 4.0, 11.0, 7.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.9375, -5.7642822265625, -5.591064453125, -5.4178466796875, -5.24462890625, -5.0714111328125, -4.898193359375, -4.7249755859375, -4.5517578125, -4.3785400390625, -4.205322265625, -4.0321044921875, -3.85888671875, -3.6856689453125, -3.512451171875, -3.3392333984375, -3.166015625, -2.9927978515625, -2.819580078125, -2.6463623046875, -2.47314453125, -2.2999267578125, -2.126708984375, -1.9534912109375, -1.7802734375, -1.6070556640625, -1.433837890625, -1.2606201171875, -1.08740234375, -0.9141845703125, -0.740966796875, -0.5677490234375, -0.39453125, -0.2213134765625, -0.048095703125, 0.1251220703125, 0.29833984375, 0.4715576171875, 0.644775390625, 0.8179931640625, 0.9912109375, 1.1644287109375, 1.337646484375, 1.5108642578125, 1.68408203125, 1.8572998046875, 2.030517578125, 2.2037353515625, 2.376953125, 2.5501708984375, 2.723388671875, 2.8966064453125, 3.06982421875, 3.2430419921875, 3.416259765625, 3.5894775390625, 3.7626953125, 3.9359130859375, 4.109130859375, 4.2823486328125, 4.45556640625, 4.6287841796875, 4.802001953125, 4.9752197265625, 5.1484375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 6.0, 3.0, 7.0, 8.0, 14.0, 26.0, 47.0, 126.0, 3442.0, 242.0, 62.0, 31.0, 24.0, 6.0, 13.0, 5.0, 7.0, 1.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.69921875, -2.638824462890625, -2.57843017578125, -2.518035888671875, -2.4576416015625, -2.397247314453125, -2.33685302734375, -2.276458740234375, -2.216064453125, -2.155670166015625, -2.09527587890625, -2.034881591796875, -1.9744873046875, -1.914093017578125, -1.85369873046875, -1.793304443359375, -1.73291015625, -1.672515869140625, -1.61212158203125, -1.551727294921875, -1.4913330078125, -1.430938720703125, -1.37054443359375, -1.310150146484375, -1.249755859375, -1.189361572265625, -1.12896728515625, -1.068572998046875, -1.0081787109375, -0.947784423828125, -0.88739013671875, -0.826995849609375, -0.7666015625, -0.706207275390625, -0.64581298828125, -0.585418701171875, -0.5250244140625, -0.464630126953125, -0.40423583984375, -0.343841552734375, -0.283447265625, -0.223052978515625, -0.16265869140625, -0.102264404296875, -0.0418701171875, 0.018524169921875, 0.07891845703125, 0.139312744140625, 0.19970703125, 0.260101318359375, 0.32049560546875, 0.380889892578125, 0.4412841796875, 0.501678466796875, 0.56207275390625, 0.622467041015625, 0.682861328125, 0.743255615234375, 0.80364990234375, 0.864044189453125, 0.9244384765625, 0.984832763671875, 1.04522705078125, 1.105621337890625, 1.166015625]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 7.0, 18.0, 37.0, 88.0, 197.0, 206.0, 213.0, 137.0, 51.0, 28.0, 10.0, 3.0, 4.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.398922443389893, -6.090103626251221, -5.781284332275391, -5.472465515136719, -5.163646221160889, -4.854827404022217, -4.546008110046387, -4.237189292907715, -3.928370237350464, -3.619551181793213, -3.310732126235962, -3.001913070678711, -2.693094253540039, -2.384274959564209, -2.075456142425537, -1.7666370868682861, -1.4578180313110352, -1.1489989757537842, -0.840179979801178, -0.5313609838485718, -0.2225419282913208, 0.08627712726593018, 0.3950960636138916, 0.7039151191711426, 1.0127341747283936, 1.3215532302856445, 1.6303722858428955, 1.939191222190857, 2.2480101585388184, 2.5568294525146484, 2.8656482696533203, 3.1744673252105713, 3.4832868576049805, 3.7921059131622314, 4.100924968719482, 4.409743785858154, 4.718563079833984, 5.027381896972656, 5.336200714111328, 5.645020008087158, 5.953839302062988, 6.26265811920166, 6.57147741317749, 6.880296230316162, 7.189115524291992, 7.497934341430664, 7.806753158569336, 8.115571975708008, 8.42439079284668, 8.733209609985352, 9.042028427124023, 9.350848197937012, 9.659667015075684, 9.968485832214355, 10.277304649353027, 10.586124420166016, 10.894943237304688, 11.20376205444336, 11.512580871582031, 11.82140064239502, 12.130219459533691, 12.439038276672363, 12.747857093811035, 13.056676864624023, 13.365495681762695]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 6.0, 4.0, 9.0, 2.0, 6.0, 15.0, 12.0, 20.0, 19.0, 22.0, 39.0, 46.0, 40.0, 46.0, 47.0, 41.0, 59.0, 50.0, 65.0, 54.0, 48.0, 57.0, 39.0, 46.0, 44.0, 33.0, 30.0, 21.0, 18.0, 18.0, 16.0, 8.0, 9.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 1.0], "bins": [-4.374730110168457, -4.2638421058654785, -4.152954578399658, -4.04206657409668, -3.9311790466308594, -3.82029128074646, -3.7094035148620605, -3.598515510559082, -3.4876279830932617, -3.3767402172088623, -3.265852451324463, -3.1549646854400635, -3.044076919555664, -2.9331891536712646, -2.8223013877868652, -2.7114133834838867, -2.6005256175994873, -2.489637851715088, -2.3787500858306885, -2.267862319946289, -2.1569745540618896, -2.0460867881774902, -1.9351989030838013, -1.8243111371994019, -1.7134233713150024, -1.602535605430603, -1.4916478395462036, -1.3807599544525146, -1.2698721885681152, -1.1589844226837158, -1.0480966567993164, -0.937208890914917, -0.8263213634490967, -0.7154335975646973, -0.6045458316802979, -0.49365800619125366, -0.38277024030685425, -0.27188247442245483, -0.16099464893341064, -0.05010688304901123, 0.060780882835388184, 0.1716686636209488, 0.2825564444065094, 0.3934442400932312, 0.5043320059776306, 0.61521977186203, 0.7261075973510742, 0.8369953632354736, 0.947883129119873, 1.0587708950042725, 1.1696586608886719, 1.2805464267730713, 1.3914341926574707, 1.5023219585418701, 1.613209843635559, 1.7240976095199585, 1.834985375404358, 1.9458731412887573, 2.0567610263824463, 2.1676487922668457, 2.278536558151245, 2.3894243240356445, 2.500312089920044, 2.6111998558044434, 2.7220876216888428]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 6.0, 3.0, 13.0, 7.0, 9.0, 8.0, 17.0, 27.0, 53.0, 73.0, 146.0, 273.0, 727.0, 2782.0, 11697.0, 67891.0, 424152.0, 449256.0, 74490.0, 12579.0, 2927.0, 782.0, 298.0, 119.0, 67.0, 51.0, 32.0, 20.0, 11.0, 7.0, 11.0, 6.0, 6.0, 5.0, 5.0, 5.0, 0.0, 1.0, 1.0], "bins": [-11.046875, -10.78399658203125, -10.5211181640625, -10.25823974609375, -9.995361328125, -9.73248291015625, -9.4696044921875, -9.20672607421875, -8.94384765625, -8.68096923828125, -8.4180908203125, -8.15521240234375, -7.892333984375, -7.62945556640625, -7.3665771484375, -7.10369873046875, -6.8408203125, -6.57794189453125, -6.3150634765625, -6.05218505859375, -5.789306640625, -5.52642822265625, -5.2635498046875, -5.00067138671875, -4.73779296875, -4.47491455078125, -4.2120361328125, -3.94915771484375, -3.686279296875, -3.42340087890625, -3.1605224609375, -2.89764404296875, -2.634765625, -2.37188720703125, -2.1090087890625, -1.84613037109375, -1.583251953125, -1.32037353515625, -1.0574951171875, -0.79461669921875, -0.53173828125, -0.26885986328125, -0.0059814453125, 0.25689697265625, 0.519775390625, 0.78265380859375, 1.0455322265625, 1.30841064453125, 1.5712890625, 1.83416748046875, 2.0970458984375, 2.35992431640625, 2.622802734375, 2.88568115234375, 3.1485595703125, 3.41143798828125, 3.67431640625, 3.93719482421875, 4.2000732421875, 4.46295166015625, 4.725830078125, 4.98870849609375, 5.2515869140625, 5.51446533203125, 5.77734375]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 3.0, 4.0, 9.0, 5.0, 9.0, 10.0, 11.0, 17.0, 16.0, 18.0, 31.0, 31.0, 33.0, 48.0, 46.0, 38.0, 39.0, 52.0, 68.0, 57.0, 54.0, 45.0, 56.0, 50.0, 33.0, 32.0, 38.0, 31.0, 26.0, 24.0, 9.0, 16.0, 15.0, 8.0, 4.0, 6.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.18359375, -2.1131591796875, -2.042724609375, -1.9722900390625, -1.90185546875, -1.8314208984375, -1.760986328125, -1.6905517578125, -1.6201171875, -1.5496826171875, -1.479248046875, -1.4088134765625, -1.33837890625, -1.2679443359375, -1.197509765625, -1.1270751953125, -1.056640625, -0.9862060546875, -0.915771484375, -0.8453369140625, -0.77490234375, -0.7044677734375, -0.634033203125, -0.5635986328125, -0.4931640625, -0.4227294921875, -0.352294921875, -0.2818603515625, -0.21142578125, -0.1409912109375, -0.070556640625, -0.0001220703125, 0.0703125, 0.1407470703125, 0.211181640625, 0.2816162109375, 0.35205078125, 0.4224853515625, 0.492919921875, 0.5633544921875, 0.6337890625, 0.7042236328125, 0.774658203125, 0.8450927734375, 0.91552734375, 0.9859619140625, 1.056396484375, 1.1268310546875, 1.197265625, 1.2677001953125, 1.338134765625, 1.4085693359375, 1.47900390625, 1.5494384765625, 1.619873046875, 1.6903076171875, 1.7607421875, 1.8311767578125, 1.901611328125, 1.9720458984375, 2.04248046875, 2.1129150390625, 2.183349609375, 2.2537841796875, 2.32421875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 8.0, 4.0, 8.0, 8.0, 10.0, 17.0, 22.0, 24.0, 48.0, 79.0, 109.0, 183.0, 311.0, 522.0, 1118.0, 2704.0, 8581.0, 38114.0, 258461.0, 605815.0, 105166.0, 18639.0, 4912.0, 1796.0, 822.0, 382.0, 249.0, 160.0, 91.0, 63.0, 33.0, 31.0, 17.0, 12.0, 9.0, 12.0, 7.0, 4.0, 4.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.6484375, -8.4100341796875, -8.171630859375, -7.9332275390625, -7.69482421875, -7.4564208984375, -7.218017578125, -6.9796142578125, -6.7412109375, -6.5028076171875, -6.264404296875, -6.0260009765625, -5.78759765625, -5.5491943359375, -5.310791015625, -5.0723876953125, -4.833984375, -4.5955810546875, -4.357177734375, -4.1187744140625, -3.88037109375, -3.6419677734375, -3.403564453125, -3.1651611328125, -2.9267578125, -2.6883544921875, -2.449951171875, -2.2115478515625, -1.97314453125, -1.7347412109375, -1.496337890625, -1.2579345703125, -1.01953125, -0.7811279296875, -0.542724609375, -0.3043212890625, -0.06591796875, 0.1724853515625, 0.410888671875, 0.6492919921875, 0.8876953125, 1.1260986328125, 1.364501953125, 1.6029052734375, 1.84130859375, 2.0797119140625, 2.318115234375, 2.5565185546875, 2.794921875, 3.0333251953125, 3.271728515625, 3.5101318359375, 3.74853515625, 3.9869384765625, 4.225341796875, 4.4637451171875, 4.7021484375, 4.9405517578125, 5.178955078125, 5.4173583984375, 5.65576171875, 5.8941650390625, 6.132568359375, 6.3709716796875, 6.609375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 3.0, 4.0, 4.0, 8.0, 8.0, 6.0, 10.0, 14.0, 17.0, 21.0, 30.0, 30.0, 27.0, 26.0, 34.0, 50.0, 35.0, 63.0, 54.0, 60.0, 54.0, 40.0, 47.0, 60.0, 41.0, 31.0, 32.0, 29.0, 30.0, 21.0, 25.0, 10.0, 18.0, 11.0, 11.0, 6.0, 11.0, 5.0, 6.0, 9.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-11.578125, -11.247314453125, -10.91650390625, -10.585693359375, -10.2548828125, -9.924072265625, -9.59326171875, -9.262451171875, -8.931640625, -8.600830078125, -8.27001953125, -7.939208984375, -7.6083984375, -7.277587890625, -6.94677734375, -6.615966796875, -6.28515625, -5.954345703125, -5.62353515625, -5.292724609375, -4.9619140625, -4.631103515625, -4.30029296875, -3.969482421875, -3.638671875, -3.307861328125, -2.97705078125, -2.646240234375, -2.3154296875, -1.984619140625, -1.65380859375, -1.322998046875, -0.9921875, -0.661376953125, -0.33056640625, 0.000244140625, 0.3310546875, 0.661865234375, 0.99267578125, 1.323486328125, 1.654296875, 1.985107421875, 2.31591796875, 2.646728515625, 2.9775390625, 3.308349609375, 3.63916015625, 3.969970703125, 4.30078125, 4.631591796875, 4.96240234375, 5.293212890625, 5.6240234375, 5.954833984375, 6.28564453125, 6.616455078125, 6.947265625, 7.278076171875, 7.60888671875, 7.939697265625, 8.2705078125, 8.601318359375, 8.93212890625, 9.262939453125, 9.59375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 9.0, 5.0, 12.0, 14.0, 16.0, 26.0, 48.0, 72.0, 158.0, 309.0, 668.0, 1711.0, 5676.0, 35289.0, 794394.0, 191532.0, 13426.0, 3217.0, 1077.0, 393.0, 230.0, 115.0, 66.0, 30.0, 23.0, 13.0, 7.0, 3.0, 7.0, 4.0, 6.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-9.34375, -9.11456298828125, -8.8853759765625, -8.65618896484375, -8.427001953125, -8.19781494140625, -7.9686279296875, -7.73944091796875, -7.51025390625, -7.28106689453125, -7.0518798828125, -6.82269287109375, -6.593505859375, -6.36431884765625, -6.1351318359375, -5.90594482421875, -5.6767578125, -5.44757080078125, -5.2183837890625, -4.98919677734375, -4.760009765625, -4.53082275390625, -4.3016357421875, -4.07244873046875, -3.84326171875, -3.61407470703125, -3.3848876953125, -3.15570068359375, -2.926513671875, -2.69732666015625, -2.4681396484375, -2.23895263671875, -2.009765625, -1.78057861328125, -1.5513916015625, -1.32220458984375, -1.093017578125, -0.86383056640625, -0.6346435546875, -0.40545654296875, -0.17626953125, 0.05291748046875, 0.2821044921875, 0.51129150390625, 0.740478515625, 0.96966552734375, 1.1988525390625, 1.42803955078125, 1.6572265625, 1.88641357421875, 2.1156005859375, 2.34478759765625, 2.573974609375, 2.80316162109375, 3.0323486328125, 3.26153564453125, 3.49072265625, 3.71990966796875, 3.9490966796875, 4.17828369140625, 4.407470703125, 4.63665771484375, 4.8658447265625, 5.09503173828125, 5.32421875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 6.0, 3.0, 5.0, 6.0, 10.0, 15.0, 23.0, 31.0, 40.0, 65.0, 112.0, 137.0, 139.0, 118.0, 92.0, 63.0, 27.0, 29.0, 27.0, 21.0, 8.0, 8.0, 6.0, 7.0, 5.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.000926971435546875, -0.0009051263332366943, -0.0008832812309265137, -0.000861436128616333, -0.0008395910263061523, -0.0008177459239959717, -0.000795900821685791, -0.0007740557193756104, -0.0007522106170654297, -0.000730365514755249, -0.0007085204124450684, -0.0006866753101348877, -0.000664830207824707, -0.0006429851055145264, -0.0006211400032043457, -0.000599294900894165, -0.0005774497985839844, -0.0005556046962738037, -0.000533759593963623, -0.0005119144916534424, -0.0004900693893432617, -0.00046822428703308105, -0.0004463791847229004, -0.0004245340824127197, -0.00040268898010253906, -0.0003808438777923584, -0.00035899877548217773, -0.00033715367317199707, -0.0003153085708618164, -0.00029346346855163574, -0.0002716183662414551, -0.0002497732639312744, -0.00022792816162109375, -0.00020608305931091309, -0.00018423795700073242, -0.00016239285469055176, -0.0001405477523803711, -0.00011870265007019043, -9.685754776000977e-05, -7.50124454498291e-05, -5.316734313964844e-05, -3.1322240829467773e-05, -9.47713851928711e-06, 1.2367963790893555e-05, 3.421306610107422e-05, 5.605816841125488e-05, 7.790327072143555e-05, 9.974837303161621e-05, 0.00012159347534179688, 0.00014343857765197754, 0.0001652836799621582, 0.00018712878227233887, 0.00020897388458251953, 0.0002308189868927002, 0.00025266408920288086, 0.0002745091915130615, 0.0002963542938232422, 0.00031819939613342285, 0.0003400444984436035, 0.0003618896007537842, 0.00038373470306396484, 0.0004055798053741455, 0.00042742490768432617, 0.00044927000999450684, 0.0004711151123046875]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 6.0, 1.0, 5.0, 6.0, 7.0, 9.0, 24.0, 31.0, 37.0, 60.0, 108.0, 178.0, 321.0, 648.0, 1428.0, 3868.0, 14929.0, 151112.0, 805321.0, 56734.0, 8751.0, 2655.0, 1122.0, 517.0, 283.0, 152.0, 76.0, 51.0, 29.0, 27.0, 20.0, 11.0, 6.0, 4.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.38671875, -6.1761474609375, -5.965576171875, -5.7550048828125, -5.54443359375, -5.3338623046875, -5.123291015625, -4.9127197265625, -4.7021484375, -4.4915771484375, -4.281005859375, -4.0704345703125, -3.85986328125, -3.6492919921875, -3.438720703125, -3.2281494140625, -3.017578125, -2.8070068359375, -2.596435546875, -2.3858642578125, -2.17529296875, -1.9647216796875, -1.754150390625, -1.5435791015625, -1.3330078125, -1.1224365234375, -0.911865234375, -0.7012939453125, -0.49072265625, -0.2801513671875, -0.069580078125, 0.1409912109375, 0.3515625, 0.5621337890625, 0.772705078125, 0.9832763671875, 1.19384765625, 1.4044189453125, 1.614990234375, 1.8255615234375, 2.0361328125, 2.2467041015625, 2.457275390625, 2.6678466796875, 2.87841796875, 3.0889892578125, 3.299560546875, 3.5101318359375, 3.720703125, 3.9312744140625, 4.141845703125, 4.3524169921875, 4.56298828125, 4.7735595703125, 4.984130859375, 5.1947021484375, 5.4052734375, 5.6158447265625, 5.826416015625, 6.0369873046875, 6.24755859375, 6.4581298828125, 6.668701171875, 6.8792724609375, 7.08984375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 5.0, 3.0, 3.0, 3.0, 2.0, 7.0, 20.0, 11.0, 24.0, 49.0, 58.0, 110.0, 140.0, 141.0, 120.0, 96.0, 72.0, 50.0, 33.0, 17.0, 10.0, 9.0, 6.0, 8.0, 4.0, 2.0, 1.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.203125, -8.00579833984375, -7.8084716796875, -7.61114501953125, -7.413818359375, -7.21649169921875, -7.0191650390625, -6.82183837890625, -6.62451171875, -6.42718505859375, -6.2298583984375, -6.03253173828125, -5.835205078125, -5.63787841796875, -5.4405517578125, -5.24322509765625, -5.0458984375, -4.84857177734375, -4.6512451171875, -4.45391845703125, -4.256591796875, -4.05926513671875, -3.8619384765625, -3.66461181640625, -3.46728515625, -3.26995849609375, -3.0726318359375, -2.87530517578125, -2.677978515625, -2.48065185546875, -2.2833251953125, -2.08599853515625, -1.888671875, -1.69134521484375, -1.4940185546875, -1.29669189453125, -1.099365234375, -0.90203857421875, -0.7047119140625, -0.50738525390625, -0.31005859375, -0.11273193359375, 0.0845947265625, 0.28192138671875, 0.479248046875, 0.67657470703125, 0.8739013671875, 1.07122802734375, 1.2685546875, 1.46588134765625, 1.6632080078125, 1.86053466796875, 2.057861328125, 2.25518798828125, 2.4525146484375, 2.64984130859375, 2.84716796875, 3.04449462890625, 3.2418212890625, 3.43914794921875, 3.636474609375, 3.83380126953125, 4.0311279296875, 4.22845458984375, 4.42578125]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 23.0, 60.0, 113.0, 207.0, 237.0, 198.0, 83.0, 40.0, 20.0, 5.0, 6.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-90.1890869140625, -86.89444732666016, -83.59981536865234, -80.30517578125, -77.01053619384766, -73.71589660644531, -70.4212646484375, -67.12662506103516, -63.83198547363281, -60.537349700927734, -57.24271011352539, -53.94807434082031, -50.65343475341797, -47.35879898071289, -44.06416320800781, -40.76952362060547, -37.47488784790039, -34.18025207519531, -30.88561248779297, -27.59097671508789, -24.296337127685547, -21.00170135498047, -17.707063674926758, -14.412425994873047, -11.117788314819336, -7.823150634765625, -4.528513431549072, -1.2338762283325195, 2.0607614517211914, 5.355398178100586, 8.650035858154297, 11.944673538208008, 15.239311218261719, 18.53394889831543, 21.82858657836914, 25.12322235107422, 28.417861938476562, 31.71249771118164, 35.00713348388672, 38.30177307128906, 41.596412658691406, 44.891048431396484, 48.18568801879883, 51.480323791503906, 54.77496337890625, 58.06959915161133, 61.364234924316406, 64.65887451171875, 67.95350646972656, 71.2481460571289, 74.54277801513672, 77.83741760253906, 81.1320571899414, 84.42669677734375, 87.72132873535156, 91.0159683227539, 94.31060791015625, 97.6052474975586, 100.8998794555664, 104.19451904296875, 107.4891586303711, 110.78379821777344, 114.07843017578125, 117.3730697631836, 120.66770935058594]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 5.0, 4.0, 7.0, 9.0, 10.0, 18.0, 19.0, 21.0, 24.0, 30.0, 41.0, 33.0, 34.0, 35.0, 54.0, 47.0, 59.0, 65.0, 53.0, 64.0, 60.0, 53.0, 43.0, 37.0, 42.0, 32.0, 23.0, 18.0, 16.0, 12.0, 7.0, 10.0, 3.0, 4.0, 4.0, 4.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.30281066894531, -43.70671081542969, -42.11061096191406, -40.51451110839844, -38.91841125488281, -37.32231140136719, -35.72621154785156, -34.13011169433594, -32.53401184082031, -30.937911987304688, -29.341812133789062, -27.745712280273438, -26.149612426757812, -24.553512573242188, -22.957414627075195, -21.36131477355957, -19.765216827392578, -18.169116973876953, -16.573017120361328, -14.97691822052002, -13.380818367004395, -11.78471851348877, -10.188619613647461, -8.592519760131836, -6.996419906616211, -5.400320053100586, -3.804220676422119, -2.2081212997436523, -0.6120214462280273, 0.9840784072875977, 2.5801773071289062, 4.176277160644531, 5.772377014160156, 7.368476867675781, 8.964576721191406, 10.560675621032715, 12.15677547454834, 13.752875328063965, 15.348974227905273, 16.9450740814209, 18.541173934936523, 20.13727378845215, 21.733373641967773, 23.329471588134766, 24.92557144165039, 26.521671295166016, 28.11777114868164, 29.713871002197266, 31.30997085571289, 32.906070709228516, 34.50217056274414, 36.098270416259766, 37.69437026977539, 39.290470123291016, 40.886566162109375, 42.482666015625, 44.078765869140625, 45.67486572265625, 47.270965576171875, 48.8670654296875, 50.463165283203125, 52.05926513671875, 53.655364990234375, 55.25146484375, 56.847564697265625]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 7.0, 5.0, 6.0, 20.0, 17.0, 26.0, 44.0, 68.0, 127.0, 220.0, 390.0, 783.0, 1787.0, 5102.0, 18970.0, 219701.0, 3895588.0, 38510.0, 8051.0, 2661.0, 1045.0, 510.0, 282.0, 133.0, 85.0, 50.0, 24.0, 27.0, 10.0, 8.0, 8.0, 4.0, 5.0, 2.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.41796875, -6.12884521484375, -5.8397216796875, -5.55059814453125, -5.261474609375, -4.97235107421875, -4.6832275390625, -4.39410400390625, -4.10498046875, -3.81585693359375, -3.5267333984375, -3.23760986328125, -2.948486328125, -2.65936279296875, -2.3702392578125, -2.08111572265625, -1.7919921875, -1.50286865234375, -1.2137451171875, -0.92462158203125, -0.635498046875, -0.34637451171875, -0.0572509765625, 0.23187255859375, 0.52099609375, 0.81011962890625, 1.0992431640625, 1.38836669921875, 1.677490234375, 1.96661376953125, 2.2557373046875, 2.54486083984375, 2.833984375, 3.12310791015625, 3.4122314453125, 3.70135498046875, 3.990478515625, 4.27960205078125, 4.5687255859375, 4.85784912109375, 5.14697265625, 5.43609619140625, 5.7252197265625, 6.01434326171875, 6.303466796875, 6.59259033203125, 6.8817138671875, 7.17083740234375, 7.4599609375, 7.74908447265625, 8.0382080078125, 8.32733154296875, 8.616455078125, 8.90557861328125, 9.1947021484375, 9.48382568359375, 9.77294921875, 10.06207275390625, 10.3511962890625, 10.64031982421875, 10.929443359375, 11.21856689453125, 11.5076904296875, 11.79681396484375, 12.0859375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 6.0, 19.0, 15.0, 20.0, 30.0, 43.0, 65.0, 76.0, 87.0, 99.0, 100.0, 95.0, 88.0, 69.0, 69.0, 38.0, 28.0, 24.0, 9.0, 11.0, 10.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7421875, -2.624267578125, -2.50634765625, -2.388427734375, -2.2705078125, -2.152587890625, -2.03466796875, -1.916748046875, -1.798828125, -1.680908203125, -1.56298828125, -1.445068359375, -1.3271484375, -1.209228515625, -1.09130859375, -0.973388671875, -0.85546875, -0.737548828125, -0.61962890625, -0.501708984375, -0.3837890625, -0.265869140625, -0.14794921875, -0.030029296875, 0.087890625, 0.205810546875, 0.32373046875, 0.441650390625, 0.5595703125, 0.677490234375, 0.79541015625, 0.913330078125, 1.03125, 1.149169921875, 1.26708984375, 1.385009765625, 1.5029296875, 1.620849609375, 1.73876953125, 1.856689453125, 1.974609375, 2.092529296875, 2.21044921875, 2.328369140625, 2.4462890625, 2.564208984375, 2.68212890625, 2.800048828125, 2.91796875, 3.035888671875, 3.15380859375, 3.271728515625, 3.3896484375, 3.507568359375, 3.62548828125, 3.743408203125, 3.861328125, 3.979248046875, 4.09716796875, 4.215087890625, 4.3330078125, 4.450927734375, 4.56884765625, 4.686767578125, 4.8046875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 11.0, 9.0, 10.0, 26.0, 31.0, 34.0, 44.0, 81.0, 86.0, 119.0, 152.0, 212.0, 357.0, 776.0, 2906.0, 37632.0, 4125531.0, 22220.0, 2266.0, 643.0, 313.0, 232.0, 158.0, 122.0, 71.0, 70.0, 55.0, 31.0, 24.0, 12.0, 15.0, 9.0, 4.0, 5.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0], "bins": [-23.8125, -23.17626953125, -22.5400390625, -21.90380859375, -21.267578125, -20.63134765625, -19.9951171875, -19.35888671875, -18.72265625, -18.08642578125, -17.4501953125, -16.81396484375, -16.177734375, -15.54150390625, -14.9052734375, -14.26904296875, -13.6328125, -12.99658203125, -12.3603515625, -11.72412109375, -11.087890625, -10.45166015625, -9.8154296875, -9.17919921875, -8.54296875, -7.90673828125, -7.2705078125, -6.63427734375, -5.998046875, -5.36181640625, -4.7255859375, -4.08935546875, -3.453125, -2.81689453125, -2.1806640625, -1.54443359375, -0.908203125, -0.27197265625, 0.3642578125, 1.00048828125, 1.63671875, 2.27294921875, 2.9091796875, 3.54541015625, 4.181640625, 4.81787109375, 5.4541015625, 6.09033203125, 6.7265625, 7.36279296875, 7.9990234375, 8.63525390625, 9.271484375, 9.90771484375, 10.5439453125, 11.18017578125, 11.81640625, 12.45263671875, 13.0888671875, 13.72509765625, 14.361328125, 14.99755859375, 15.6337890625, 16.27001953125, 16.90625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 5.0, 12.0, 29.0, 45.0, 251.0, 3417.0, 230.0, 58.0, 14.0, 7.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.125, -9.89727783203125, -9.6695556640625, -9.44183349609375, -9.214111328125, -8.98638916015625, -8.7586669921875, -8.53094482421875, -8.30322265625, -8.07550048828125, -7.8477783203125, -7.62005615234375, -7.392333984375, -7.16461181640625, -6.9368896484375, -6.70916748046875, -6.4814453125, -6.25372314453125, -6.0260009765625, -5.79827880859375, -5.570556640625, -5.34283447265625, -5.1151123046875, -4.88739013671875, -4.65966796875, -4.43194580078125, -4.2042236328125, -3.97650146484375, -3.748779296875, -3.52105712890625, -3.2933349609375, -3.06561279296875, -2.837890625, -2.61016845703125, -2.3824462890625, -2.15472412109375, -1.927001953125, -1.69927978515625, -1.4715576171875, -1.24383544921875, -1.01611328125, -0.78839111328125, -0.5606689453125, -0.33294677734375, -0.105224609375, 0.12249755859375, 0.3502197265625, 0.57794189453125, 0.8056640625, 1.03338623046875, 1.2611083984375, 1.48883056640625, 1.716552734375, 1.94427490234375, 2.1719970703125, 2.39971923828125, 2.62744140625, 2.85516357421875, 3.0828857421875, 3.31060791015625, 3.538330078125, 3.76605224609375, 3.9937744140625, 4.22149658203125, 4.44921875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 4.0, 2.0, 3.0, 4.0, 16.0, 19.0, 19.0, 38.0, 79.0, 124.0, 164.0, 166.0, 127.0, 96.0, 53.0, 38.0, 18.0, 18.0, 7.0, 1.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.192977905273438, -17.525440216064453, -16.857900619506836, -16.19036293029785, -15.52282428741455, -14.85528564453125, -14.187747955322266, -13.520209312438965, -12.852670669555664, -12.185132026672363, -11.517593383789062, -10.850055694580078, -10.182517051696777, -9.514978408813477, -8.847440719604492, -8.179902076721191, -7.512363433837891, -6.84482479095459, -6.177286624908447, -5.509748458862305, -4.842209815979004, -4.174671173095703, -3.5071330070495605, -2.839594841003418, -2.172056198120117, -1.5045177936553955, -0.8369793891906738, -0.16944098472595215, 0.49809741973876953, 1.1656358242034912, 1.833174228668213, 2.5007123947143555, 3.168252944946289, 3.8357913494110107, 4.503329753875732, 5.170867919921875, 5.838406562805176, 6.505945205688477, 7.173483371734619, 7.841021537780762, 8.508560180664062, 9.176098823547363, 9.843637466430664, 10.511175155639648, 11.17871379852295, 11.84625244140625, 12.513790130615234, 13.181328773498535, 13.848867416381836, 14.516406059265137, 15.183944702148438, 15.851482391357422, 16.519020080566406, 17.186559677124023, 17.854097366333008, 18.521636962890625, 19.18917465209961, 19.856712341308594, 20.52425193786621, 21.191789627075195, 21.859329223632812, 22.526866912841797, 23.19440460205078, 23.861942291259766, 24.529481887817383]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 6.0, 7.0, 11.0, 8.0, 18.0, 34.0, 43.0, 43.0, 60.0, 60.0, 86.0, 86.0, 103.0, 86.0, 86.0, 74.0, 62.0, 34.0, 34.0, 18.0, 18.0, 13.0, 7.0, 5.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.035686492919922, -17.46177864074707, -16.88787078857422, -16.313962936401367, -15.740055084228516, -15.166147232055664, -14.592239379882812, -14.018331527709961, -13.44442367553711, -12.870515823364258, -12.296607971191406, -11.722700119018555, -11.148792266845703, -10.574884414672852, -10.0009765625, -9.427068710327148, -8.85315990447998, -8.279252052307129, -7.705344200134277, -7.131436347961426, -6.557528495788574, -5.983620643615723, -5.409712314605713, -4.835804462432861, -4.26189661026001, -3.687988758087158, -3.1140809059143066, -2.540172815322876, -1.9662649631500244, -1.3923571109771729, -0.8184490203857422, -0.24454116821289062, 0.32936668395996094, 0.9032745957374573, 1.4771825075149536, 2.0510904788970947, 2.6249983310699463, 3.198906183242798, 3.7728142738342285, 4.34672212600708, 4.920629978179932, 5.494537830352783, 6.068445682525635, 6.6423540115356445, 7.216261863708496, 7.790169715881348, 8.3640775680542, 8.93798542022705, 9.511893272399902, 10.085801124572754, 10.659708976745605, 11.233616828918457, 11.807524681091309, 12.38143253326416, 12.955341339111328, 13.52924919128418, 14.103157043457031, 14.677064895629883, 15.250972747802734, 15.824880599975586, 16.398788452148438, 16.97269630432129, 17.54660415649414, 18.120512008666992, 18.694419860839844]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 4.0, 9.0, 15.0, 15.0, 27.0, 53.0, 86.0, 145.0, 280.0, 672.0, 2069.0, 8937.0, 60470.0, 519197.0, 403187.0, 43530.0, 7006.0, 1730.0, 575.0, 228.0, 114.0, 91.0, 37.0, 32.0, 18.0, 12.0, 9.0, 3.0, 9.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.71875, -11.4013671875, -11.083984375, -10.7666015625, -10.44921875, -10.1318359375, -9.814453125, -9.4970703125, -9.1796875, -8.8623046875, -8.544921875, -8.2275390625, -7.91015625, -7.5927734375, -7.275390625, -6.9580078125, -6.640625, -6.3232421875, -6.005859375, -5.6884765625, -5.37109375, -5.0537109375, -4.736328125, -4.4189453125, -4.1015625, -3.7841796875, -3.466796875, -3.1494140625, -2.83203125, -2.5146484375, -2.197265625, -1.8798828125, -1.5625, -1.2451171875, -0.927734375, -0.6103515625, -0.29296875, 0.0244140625, 0.341796875, 0.6591796875, 0.9765625, 1.2939453125, 1.611328125, 1.9287109375, 2.24609375, 2.5634765625, 2.880859375, 3.1982421875, 3.515625, 3.8330078125, 4.150390625, 4.4677734375, 4.78515625, 5.1025390625, 5.419921875, 5.7373046875, 6.0546875, 6.3720703125, 6.689453125, 7.0068359375, 7.32421875, 7.6416015625, 7.958984375, 8.2763671875, 8.59375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 7.0, 6.0, 9.0, 15.0, 23.0, 33.0, 36.0, 54.0, 72.0, 80.0, 102.0, 98.0, 93.0, 93.0, 74.0, 62.0, 49.0, 33.0, 21.0, 20.0, 7.0, 9.0, 9.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.40625, -2.27703857421875, -2.1478271484375, -2.01861572265625, -1.889404296875, -1.76019287109375, -1.6309814453125, -1.50177001953125, -1.37255859375, -1.24334716796875, -1.1141357421875, -0.98492431640625, -0.855712890625, -0.72650146484375, -0.5972900390625, -0.46807861328125, -0.3388671875, -0.20965576171875, -0.0804443359375, 0.04876708984375, 0.177978515625, 0.30718994140625, 0.4364013671875, 0.56561279296875, 0.69482421875, 0.82403564453125, 0.9532470703125, 1.08245849609375, 1.211669921875, 1.34088134765625, 1.4700927734375, 1.59930419921875, 1.728515625, 1.85772705078125, 1.9869384765625, 2.11614990234375, 2.245361328125, 2.37457275390625, 2.5037841796875, 2.63299560546875, 2.76220703125, 2.89141845703125, 3.0206298828125, 3.14984130859375, 3.279052734375, 3.40826416015625, 3.5374755859375, 3.66668701171875, 3.7958984375, 3.92510986328125, 4.0543212890625, 4.18353271484375, 4.312744140625, 4.44195556640625, 4.5711669921875, 4.70037841796875, 4.82958984375, 4.95880126953125, 5.0880126953125, 5.21722412109375, 5.346435546875, 5.47564697265625, 5.6048583984375, 5.73406982421875, 5.86328125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 6.0, 8.0, 8.0, 24.0, 60.0, 108.0, 234.0, 460.0, 1295.0, 8018.0, 613235.0, 416576.0, 6455.0, 1183.0, 450.0, 203.0, 98.0, 57.0, 26.0, 14.0, 14.0, 3.0, 7.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.546875, -22.853515625, -22.16015625, -21.466796875, -20.7734375, -20.080078125, -19.38671875, -18.693359375, -18.0, -17.306640625, -16.61328125, -15.919921875, -15.2265625, -14.533203125, -13.83984375, -13.146484375, -12.453125, -11.759765625, -11.06640625, -10.373046875, -9.6796875, -8.986328125, -8.29296875, -7.599609375, -6.90625, -6.212890625, -5.51953125, -4.826171875, -4.1328125, -3.439453125, -2.74609375, -2.052734375, -1.359375, -0.666015625, 0.02734375, 0.720703125, 1.4140625, 2.107421875, 2.80078125, 3.494140625, 4.1875, 4.880859375, 5.57421875, 6.267578125, 6.9609375, 7.654296875, 8.34765625, 9.041015625, 9.734375, 10.427734375, 11.12109375, 11.814453125, 12.5078125, 13.201171875, 13.89453125, 14.587890625, 15.28125, 15.974609375, 16.66796875, 17.361328125, 18.0546875, 18.748046875, 19.44140625, 20.134765625, 20.828125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 9.0, 7.0, 22.0, 25.0, 39.0, 61.0, 66.0, 71.0, 87.0, 109.0, 105.0, 97.0, 93.0, 72.0, 47.0, 40.0, 25.0, 14.0, 8.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.734375, -14.114013671875, -13.49365234375, -12.873291015625, -12.2529296875, -11.632568359375, -11.01220703125, -10.391845703125, -9.771484375, -9.151123046875, -8.53076171875, -7.910400390625, -7.2900390625, -6.669677734375, -6.04931640625, -5.428955078125, -4.80859375, -4.188232421875, -3.56787109375, -2.947509765625, -2.3271484375, -1.706787109375, -1.08642578125, -0.466064453125, 0.154296875, 0.774658203125, 1.39501953125, 2.015380859375, 2.6357421875, 3.256103515625, 3.87646484375, 4.496826171875, 5.1171875, 5.737548828125, 6.35791015625, 6.978271484375, 7.5986328125, 8.218994140625, 8.83935546875, 9.459716796875, 10.080078125, 10.700439453125, 11.32080078125, 11.941162109375, 12.5615234375, 13.181884765625, 13.80224609375, 14.422607421875, 15.04296875, 15.663330078125, 16.28369140625, 16.904052734375, 17.5244140625, 18.144775390625, 18.76513671875, 19.385498046875, 20.005859375, 20.626220703125, 21.24658203125, 21.866943359375, 22.4873046875, 23.107666015625, 23.72802734375, 24.348388671875, 24.96875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 3.0, 4.0, 5.0, 7.0, 8.0, 8.0, 17.0, 29.0, 48.0, 94.0, 172.0, 413.0, 1214.0, 4884.0, 33037.0, 755428.0, 233820.0, 15006.0, 2858.0, 838.0, 309.0, 140.0, 73.0, 44.0, 23.0, 19.0, 12.0, 13.0, 4.0, 5.0, 5.0, 1.0, 0.0, 4.0, 1.0, 1.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.46875, -6.282958984375, -6.09716796875, -5.911376953125, -5.7255859375, -5.539794921875, -5.35400390625, -5.168212890625, -4.982421875, -4.796630859375, -4.61083984375, -4.425048828125, -4.2392578125, -4.053466796875, -3.86767578125, -3.681884765625, -3.49609375, -3.310302734375, -3.12451171875, -2.938720703125, -2.7529296875, -2.567138671875, -2.38134765625, -2.195556640625, -2.009765625, -1.823974609375, -1.63818359375, -1.452392578125, -1.2666015625, -1.080810546875, -0.89501953125, -0.709228515625, -0.5234375, -0.337646484375, -0.15185546875, 0.033935546875, 0.2197265625, 0.405517578125, 0.59130859375, 0.777099609375, 0.962890625, 1.148681640625, 1.33447265625, 1.520263671875, 1.7060546875, 1.891845703125, 2.07763671875, 2.263427734375, 2.44921875, 2.635009765625, 2.82080078125, 3.006591796875, 3.1923828125, 3.378173828125, 3.56396484375, 3.749755859375, 3.935546875, 4.121337890625, 4.30712890625, 4.492919921875, 4.6787109375, 4.864501953125, 5.05029296875, 5.236083984375, 5.421875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 5.0, 3.0, 13.0, 14.0, 27.0, 66.0, 100.0, 239.0, 234.0, 138.0, 80.0, 25.0, 17.0, 12.0, 9.0, 8.0, 7.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007257461547851562, -0.0006896406412124634, -0.0006535351276397705, -0.0006174296140670776, -0.0005813241004943848, -0.0005452185869216919, -0.000509113073348999, -0.00047300755977630615, -0.0004369020462036133, -0.0004007965326309204, -0.00036469101905822754, -0.00032858550548553467, -0.0002924799919128418, -0.0002563744783401489, -0.00022026896476745605, -0.00018416345119476318, -0.0001480579376220703, -0.00011195242404937744, -7.584691047668457e-05, -3.97413969039917e-05, -3.635883331298828e-06, 3.246963024139404e-05, 6.857514381408691e-05, 0.00010468065738677979, 0.00014078617095947266, 0.00017689168453216553, 0.0002129971981048584, 0.00024910271167755127, 0.00028520822525024414, 0.000321313738822937, 0.0003574192523956299, 0.00039352476596832275, 0.0004296302795410156, 0.0004657357931137085, 0.0005018413066864014, 0.0005379468202590942, 0.0005740523338317871, 0.00061015784740448, 0.0006462633609771729, 0.0006823688745498657, 0.0007184743881225586, 0.0007545799016952515, 0.0007906854152679443, 0.0008267909288406372, 0.0008628964424133301, 0.000899001955986023, 0.0009351074695587158, 0.0009712129831314087, 0.0010073184967041016, 0.0010434240102767944, 0.0010795295238494873, 0.0011156350374221802, 0.001151740550994873, 0.001187846064567566, 0.0012239515781402588, 0.0012600570917129517, 0.0012961626052856445, 0.0013322681188583374, 0.0013683736324310303, 0.0014044791460037231, 0.001440584659576416, 0.0014766901731491089, 0.0015127956867218018, 0.0015489012002944946, 0.0015850067138671875]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 9.0, 14.0, 30.0, 82.0, 167.0, 703.0, 7084.0, 974809.0, 63462.0, 1654.0, 349.0, 110.0, 43.0, 18.0, 9.0, 4.0, 3.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.703125, -17.24609375, -16.7890625, -16.33203125, -15.875, -15.41796875, -14.9609375, -14.50390625, -14.046875, -13.58984375, -13.1328125, -12.67578125, -12.21875, -11.76171875, -11.3046875, -10.84765625, -10.390625, -9.93359375, -9.4765625, -9.01953125, -8.5625, -8.10546875, -7.6484375, -7.19140625, -6.734375, -6.27734375, -5.8203125, -5.36328125, -4.90625, -4.44921875, -3.9921875, -3.53515625, -3.078125, -2.62109375, -2.1640625, -1.70703125, -1.25, -0.79296875, -0.3359375, 0.12109375, 0.578125, 1.03515625, 1.4921875, 1.94921875, 2.40625, 2.86328125, 3.3203125, 3.77734375, 4.234375, 4.69140625, 5.1484375, 5.60546875, 6.0625, 6.51953125, 6.9765625, 7.43359375, 7.890625, 8.34765625, 8.8046875, 9.26171875, 9.71875, 10.17578125, 10.6328125, 11.08984375, 11.546875]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 5.0, 7.0, 9.0, 4.0, 7.0, 22.0, 19.0, 33.0, 30.0, 33.0, 62.0, 75.0, 94.0, 119.0, 111.0, 78.0, 67.0, 70.0, 39.0, 28.0, 22.0, 16.0, 14.0, 10.0, 8.0, 1.0, 6.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.9296875, -3.80615234375, -3.6826171875, -3.55908203125, -3.435546875, -3.31201171875, -3.1884765625, -3.06494140625, -2.94140625, -2.81787109375, -2.6943359375, -2.57080078125, -2.447265625, -2.32373046875, -2.2001953125, -2.07666015625, -1.953125, -1.82958984375, -1.7060546875, -1.58251953125, -1.458984375, -1.33544921875, -1.2119140625, -1.08837890625, -0.96484375, -0.84130859375, -0.7177734375, -0.59423828125, -0.470703125, -0.34716796875, -0.2236328125, -0.10009765625, 0.0234375, 0.14697265625, 0.2705078125, 0.39404296875, 0.517578125, 0.64111328125, 0.7646484375, 0.88818359375, 1.01171875, 1.13525390625, 1.2587890625, 1.38232421875, 1.505859375, 1.62939453125, 1.7529296875, 1.87646484375, 2.0, 2.12353515625, 2.2470703125, 2.37060546875, 2.494140625, 2.61767578125, 2.7412109375, 2.86474609375, 2.98828125, 3.11181640625, 3.2353515625, 3.35888671875, 3.482421875, 3.60595703125, 3.7294921875, 3.85302734375, 3.9765625]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 10.0, 6.0, 8.0, 14.0, 20.0, 30.0, 37.0, 58.0, 80.0, 111.0, 112.0, 125.0, 96.0, 85.0, 45.0, 44.0, 37.0, 23.0, 22.0, 12.0, 6.0, 9.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-66.50216674804688, -64.74848175048828, -62.99480056762695, -61.241119384765625, -59.4874382019043, -57.73375701904297, -55.980072021484375, -54.22639083862305, -52.47270965576172, -50.71902847290039, -48.9653434753418, -47.21166229248047, -45.45798110961914, -43.70429992675781, -41.95061492919922, -40.19693374633789, -38.4432487487793, -36.68956756591797, -34.935882568359375, -33.18220138549805, -31.42852020263672, -29.674837112426758, -27.921154022216797, -26.16747283935547, -24.413789749145508, -22.660106658935547, -20.90642547607422, -19.152742385864258, -17.399059295654297, -15.645378112792969, -13.891695022583008, -12.138012886047363, -10.384326934814453, -8.630644798278809, -6.876962184906006, -5.123279571533203, -3.3695974349975586, -1.615915298461914, 0.13776779174804688, 1.8914499282836914, 3.645132064819336, 5.3988142013549805, 7.152496814727783, 8.906179428100586, 10.65986156463623, 12.413543701171875, 14.167226791381836, 15.92090892791748, 17.674591064453125, 19.428274154663086, 21.181955337524414, 22.935638427734375, 24.689319610595703, 26.443002700805664, 28.196685791015625, 29.950366973876953, 31.704050064086914, 33.457733154296875, 35.2114143371582, 36.96509552001953, 38.718780517578125, 40.47246170043945, 42.22614288330078, 43.979827880859375, 45.7335090637207]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 4.0, 2.0, 13.0, 8.0, 8.0, 13.0, 15.0, 20.0, 24.0, 45.0, 42.0, 38.0, 60.0, 64.0, 53.0, 67.0, 67.0, 60.0, 67.0, 45.0, 52.0, 47.0, 39.0, 32.0, 34.0, 18.0, 16.0, 8.0, 13.0, 10.0, 8.0, 4.0, 4.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.56510925292969, -72.67548370361328, -70.78585815429688, -68.89623260498047, -67.00660705566406, -65.11698150634766, -63.22735595703125, -61.337730407714844, -59.44810485839844, -57.55847930908203, -55.668853759765625, -53.77922821044922, -51.88960266113281, -49.999977111816406, -48.1103515625, -46.220726013183594, -44.33110046386719, -42.44147491455078, -40.551849365234375, -38.66222381591797, -36.77259826660156, -34.882972717285156, -32.99334716796875, -31.103721618652344, -29.214096069335938, -27.32447052001953, -25.434844970703125, -23.54521942138672, -21.655593872070312, -19.765968322753906, -17.8763427734375, -15.986717224121094, -14.097087860107422, -12.207462310791016, -10.31783676147461, -8.428211212158203, -6.538585662841797, -4.648960113525391, -2.7593345642089844, -0.8697090148925781, 1.0199165344238281, 2.9095420837402344, 4.799167633056641, 6.688793182373047, 8.578418731689453, 10.46804428100586, 12.357669830322266, 14.247295379638672, 16.136920928955078, 18.026546478271484, 19.91617202758789, 21.805797576904297, 23.695423126220703, 25.58504867553711, 27.474674224853516, 29.364299774169922, 31.253925323486328, 33.143550872802734, 35.03317642211914, 36.92280197143555, 38.81242752075195, 40.70205307006836, 42.591678619384766, 44.48130416870117, 46.37092971801758]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 5.0, 3.0, 8.0, 14.0, 13.0, 21.0, 24.0, 21.0, 41.0, 43.0, 75.0, 82.0, 145.0, 242.0, 382.0, 699.0, 1262.0, 2597.0, 5568.0, 14678.0, 47462.0, 419112.0, 3508614.0, 144650.0, 30310.0, 10211.0, 4098.0, 1797.0, 858.0, 463.0, 271.0, 155.0, 115.0, 79.0, 41.0, 24.0, 24.0, 28.0, 13.0, 10.0, 6.0, 5.0, 5.0, 4.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.73046875, -6.53985595703125, -6.3492431640625, -6.15863037109375, -5.968017578125, -5.77740478515625, -5.5867919921875, -5.39617919921875, -5.20556640625, -5.01495361328125, -4.8243408203125, -4.63372802734375, -4.443115234375, -4.25250244140625, -4.0618896484375, -3.87127685546875, -3.6806640625, -3.49005126953125, -3.2994384765625, -3.10882568359375, -2.918212890625, -2.72760009765625, -2.5369873046875, -2.34637451171875, -2.15576171875, -1.96514892578125, -1.7745361328125, -1.58392333984375, -1.393310546875, -1.20269775390625, -1.0120849609375, -0.82147216796875, -0.630859375, -0.44024658203125, -0.2496337890625, -0.05902099609375, 0.131591796875, 0.32220458984375, 0.5128173828125, 0.70343017578125, 0.89404296875, 1.08465576171875, 1.2752685546875, 1.46588134765625, 1.656494140625, 1.84710693359375, 2.0377197265625, 2.22833251953125, 2.4189453125, 2.60955810546875, 2.8001708984375, 2.99078369140625, 3.181396484375, 3.37200927734375, 3.5626220703125, 3.75323486328125, 3.94384765625, 4.13446044921875, 4.3250732421875, 4.51568603515625, 4.706298828125, 4.89691162109375, 5.0875244140625, 5.27813720703125, 5.46875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 4.0, 3.0, 5.0, 9.0, 12.0, 15.0, 19.0, 32.0, 22.0, 40.0, 58.0, 65.0, 67.0, 74.0, 69.0, 92.0, 69.0, 69.0, 62.0, 43.0, 50.0, 37.0, 32.0, 24.0, 9.0, 7.0, 10.0, 6.0, 1.0, 6.0, 1.0, 1.0], "bins": [-4.4921875, -4.396270751953125, -4.30035400390625, -4.204437255859375, -4.1085205078125, -4.012603759765625, -3.91668701171875, -3.820770263671875, -3.724853515625, -3.628936767578125, -3.53302001953125, -3.437103271484375, -3.3411865234375, -3.245269775390625, -3.14935302734375, -3.053436279296875, -2.95751953125, -2.861602783203125, -2.76568603515625, -2.669769287109375, -2.5738525390625, -2.477935791015625, -2.38201904296875, -2.286102294921875, -2.190185546875, -2.094268798828125, -1.99835205078125, -1.902435302734375, -1.8065185546875, -1.710601806640625, -1.61468505859375, -1.518768310546875, -1.4228515625, -1.326934814453125, -1.23101806640625, -1.135101318359375, -1.0391845703125, -0.943267822265625, -0.84735107421875, -0.751434326171875, -0.655517578125, -0.559600830078125, -0.46368408203125, -0.367767333984375, -0.2718505859375, -0.175933837890625, -0.08001708984375, 0.015899658203125, 0.11181640625, 0.207733154296875, 0.30364990234375, 0.399566650390625, 0.4954833984375, 0.591400146484375, 0.68731689453125, 0.783233642578125, 0.879150390625, 0.975067138671875, 1.07098388671875, 1.166900634765625, 1.2628173828125, 1.358734130859375, 1.45465087890625, 1.550567626953125, 1.646484375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 5.0, 4.0, 10.0, 8.0, 11.0, 7.0, 12.0, 11.0, 39.0, 55.0, 130.0, 291.0, 851.0, 2942.0, 12775.0, 87964.0, 3803087.0, 253675.0, 24767.0, 5246.0, 1454.0, 510.0, 198.0, 95.0, 43.0, 30.0, 16.0, 17.0, 6.0, 7.0, 2.0, 2.0, 1.0, 5.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-12.8046875, -12.46484375, -12.125, -11.78515625, -11.4453125, -11.10546875, -10.765625, -10.42578125, -10.0859375, -9.74609375, -9.40625, -9.06640625, -8.7265625, -8.38671875, -8.046875, -7.70703125, -7.3671875, -7.02734375, -6.6875, -6.34765625, -6.0078125, -5.66796875, -5.328125, -4.98828125, -4.6484375, -4.30859375, -3.96875, -3.62890625, -3.2890625, -2.94921875, -2.609375, -2.26953125, -1.9296875, -1.58984375, -1.25, -0.91015625, -0.5703125, -0.23046875, 0.109375, 0.44921875, 0.7890625, 1.12890625, 1.46875, 1.80859375, 2.1484375, 2.48828125, 2.828125, 3.16796875, 3.5078125, 3.84765625, 4.1875, 4.52734375, 4.8671875, 5.20703125, 5.546875, 5.88671875, 6.2265625, 6.56640625, 6.90625, 7.24609375, 7.5859375, 7.92578125, 8.265625, 8.60546875, 8.9453125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 4.0, 2.0, 5.0, 4.0, 11.0, 13.0, 14.0, 27.0, 40.0, 57.0, 105.0, 168.0, 432.0, 1236.0, 1140.0, 368.0, 143.0, 78.0, 52.0, 31.0, 39.0, 21.0, 17.0, 8.0, 11.0, 9.0, 2.0, 9.0, 8.0, 6.0, 2.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.8515625, -6.630126953125, -6.40869140625, -6.187255859375, -5.9658203125, -5.744384765625, -5.52294921875, -5.301513671875, -5.080078125, -4.858642578125, -4.63720703125, -4.415771484375, -4.1943359375, -3.972900390625, -3.75146484375, -3.530029296875, -3.30859375, -3.087158203125, -2.86572265625, -2.644287109375, -2.4228515625, -2.201416015625, -1.97998046875, -1.758544921875, -1.537109375, -1.315673828125, -1.09423828125, -0.872802734375, -0.6513671875, -0.429931640625, -0.20849609375, 0.012939453125, 0.234375, 0.455810546875, 0.67724609375, 0.898681640625, 1.1201171875, 1.341552734375, 1.56298828125, 1.784423828125, 2.005859375, 2.227294921875, 2.44873046875, 2.670166015625, 2.8916015625, 3.113037109375, 3.33447265625, 3.555908203125, 3.77734375, 3.998779296875, 4.22021484375, 4.441650390625, 4.6630859375, 4.884521484375, 5.10595703125, 5.327392578125, 5.548828125, 5.770263671875, 5.99169921875, 6.213134765625, 6.4345703125, 6.656005859375, 6.87744140625, 7.098876953125, 7.3203125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 5.0, 9.0, 29.0, 62.0, 110.0, 145.0, 173.0, 186.0, 129.0, 67.0, 35.0, 16.0, 9.0, 12.0, 6.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-46.24144744873047, -44.1060791015625, -41.97071075439453, -39.8353385925293, -37.69997024536133, -35.56460189819336, -33.429229736328125, -31.293861389160156, -29.158493041992188, -27.02312469482422, -24.887754440307617, -22.752384185791016, -20.617015838623047, -18.481647491455078, -16.346277236938477, -14.210907936096191, -12.075538635253906, -9.940169334411621, -7.804800033569336, -5.669430732727051, -3.5340614318847656, -1.3986921310424805, 0.7366771697998047, 2.87204647064209, 5.007415771484375, 7.14278507232666, 9.278154373168945, 11.41352367401123, 13.548892974853516, 15.6842622756958, 17.819631576538086, 19.955001831054688, 22.090362548828125, 24.225730895996094, 26.361101150512695, 28.496471405029297, 30.631839752197266, 32.767208099365234, 34.90258026123047, 37.03794860839844, 39.173316955566406, 41.308685302734375, 43.444053649902344, 45.57942581176758, 47.71479415893555, 49.850162506103516, 51.98553466796875, 54.12090301513672, 56.25627136230469, 58.391639709472656, 60.527008056640625, 62.66238021850586, 64.79774475097656, 66.93312072753906, 69.06848907470703, 71.203857421875, 73.33922576904297, 75.47459411621094, 77.6099624633789, 79.74533081054688, 81.88070678710938, 84.01607513427734, 86.15144348144531, 88.28681182861328, 90.42218017578125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 6.0, 4.0, 9.0, 16.0, 9.0, 24.0, 28.0, 28.0, 37.0, 36.0, 49.0, 53.0, 49.0, 60.0, 65.0, 57.0, 65.0, 50.0, 55.0, 41.0, 39.0, 36.0, 38.0, 27.0, 36.0, 23.0, 17.0, 14.0, 9.0, 9.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-39.139930725097656, -38.08419418334961, -37.0284538269043, -35.97271728515625, -34.91697692871094, -33.86124038696289, -32.80550003051758, -31.74976348876953, -30.69402503967285, -29.638286590576172, -28.582548141479492, -27.526809692382812, -26.471073150634766, -25.415332794189453, -24.359596252441406, -23.303857803344727, -22.248119354248047, -21.192380905151367, -20.136642456054688, -19.080904006958008, -18.025165557861328, -16.96942901611328, -15.913690567016602, -14.857952117919922, -13.802213668823242, -12.746475219726562, -11.690736770629883, -10.63499927520752, -9.57926082611084, -8.52352237701416, -7.467784404754639, -6.412046432495117, -5.3563079833984375, -4.300569534301758, -3.2448315620422363, -2.1890933513641357, -1.1333551406860352, -0.07761669158935547, 0.978121280670166, 2.0338592529296875, 3.089597702026367, 4.145336151123047, 5.201074123382568, 6.25681209564209, 7.3125505447387695, 8.36828899383545, 9.424026489257812, 10.479764938354492, 11.535503387451172, 12.591241836547852, 13.646980285644531, 14.702717781066895, 15.758456230163574, 16.814193725585938, 17.869932174682617, 18.925670623779297, 19.981409072875977, 21.037147521972656, 22.092885971069336, 23.148624420166016, 24.204360961914062, 25.260101318359375, 26.315837860107422, 27.3715763092041, 28.42731475830078]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 4.0, 6.0, 8.0, 12.0, 15.0, 32.0, 38.0, 66.0, 91.0, 145.0, 236.0, 409.0, 660.0, 1190.0, 2232.0, 4453.0, 9456.0, 21823.0, 53785.0, 144648.0, 346079.0, 282744.0, 107232.0, 40951.0, 16973.0, 7385.0, 3670.0, 1737.0, 1012.0, 537.0, 338.0, 180.0, 127.0, 86.0, 52.0, 39.0, 29.0, 25.0, 11.0, 11.0, 12.0, 3.0, 4.0, 1.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.578125, -4.43438720703125, -4.2906494140625, -4.14691162109375, -4.003173828125, -3.85943603515625, -3.7156982421875, -3.57196044921875, -3.42822265625, -3.28448486328125, -3.1407470703125, -2.99700927734375, -2.853271484375, -2.70953369140625, -2.5657958984375, -2.42205810546875, -2.2783203125, -2.13458251953125, -1.9908447265625, -1.84710693359375, -1.703369140625, -1.55963134765625, -1.4158935546875, -1.27215576171875, -1.12841796875, -0.98468017578125, -0.8409423828125, -0.69720458984375, -0.553466796875, -0.40972900390625, -0.2659912109375, -0.12225341796875, 0.021484375, 0.16522216796875, 0.3089599609375, 0.45269775390625, 0.596435546875, 0.74017333984375, 0.8839111328125, 1.02764892578125, 1.17138671875, 1.31512451171875, 1.4588623046875, 1.60260009765625, 1.746337890625, 1.89007568359375, 2.0338134765625, 2.17755126953125, 2.3212890625, 2.46502685546875, 2.6087646484375, 2.75250244140625, 2.896240234375, 3.03997802734375, 3.1837158203125, 3.32745361328125, 3.47119140625, 3.61492919921875, 3.7586669921875, 3.90240478515625, 4.046142578125, 4.18988037109375, 4.3336181640625, 4.47735595703125, 4.62109375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 0.0, 6.0, 3.0, 4.0, 7.0, 8.0, 9.0, 7.0, 9.0, 17.0, 17.0, 22.0, 27.0, 34.0, 25.0, 29.0, 33.0, 36.0, 33.0, 38.0, 44.0, 53.0, 45.0, 41.0, 62.0, 37.0, 43.0, 38.0, 33.0, 37.0, 28.0, 30.0, 24.0, 22.0, 14.0, 12.0, 14.0, 11.0, 11.0, 9.0, 8.0, 4.0, 6.0, 5.0, 2.0, 2.0, 3.0, 4.0], "bins": [-2.158203125, -2.1021575927734375, -2.046112060546875, -1.9900665283203125, -1.93402099609375, -1.8779754638671875, -1.821929931640625, -1.7658843994140625, -1.7098388671875, -1.6537933349609375, -1.597747802734375, -1.5417022705078125, -1.48565673828125, -1.4296112060546875, -1.373565673828125, -1.3175201416015625, -1.261474609375, -1.2054290771484375, -1.149383544921875, -1.0933380126953125, -1.03729248046875, -0.9812469482421875, -0.925201416015625, -0.8691558837890625, -0.8131103515625, -0.7570648193359375, -0.701019287109375, -0.6449737548828125, -0.58892822265625, -0.5328826904296875, -0.476837158203125, -0.4207916259765625, -0.36474609375, -0.3087005615234375, -0.252655029296875, -0.1966094970703125, -0.14056396484375, -0.0845184326171875, -0.028472900390625, 0.0275726318359375, 0.0836181640625, 0.1396636962890625, 0.195709228515625, 0.2517547607421875, 0.30780029296875, 0.3638458251953125, 0.419891357421875, 0.4759368896484375, 0.531982421875, 0.5880279541015625, 0.644073486328125, 0.7001190185546875, 0.75616455078125, 0.8122100830078125, 0.868255615234375, 0.9243011474609375, 0.9803466796875, 1.0363922119140625, 1.092437744140625, 1.1484832763671875, 1.20452880859375, 1.2605743408203125, 1.316619873046875, 1.3726654052734375, 1.4287109375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [6.0, 1.0, 4.0, 3.0, 3.0, 3.0, 10.0, 10.0, 15.0, 22.0, 42.0, 58.0, 74.0, 85.0, 154.0, 210.0, 383.0, 696.0, 1267.0, 2471.0, 6562.0, 27409.0, 200906.0, 680866.0, 101464.0, 16618.0, 4822.0, 1883.0, 1030.0, 544.0, 327.0, 184.0, 138.0, 87.0, 61.0, 41.0, 27.0, 23.0, 19.0, 11.0, 12.0, 7.0, 2.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.109375, -5.84765625, -5.5859375, -5.32421875, -5.0625, -4.80078125, -4.5390625, -4.27734375, -4.015625, -3.75390625, -3.4921875, -3.23046875, -2.96875, -2.70703125, -2.4453125, -2.18359375, -1.921875, -1.66015625, -1.3984375, -1.13671875, -0.875, -0.61328125, -0.3515625, -0.08984375, 0.171875, 0.43359375, 0.6953125, 0.95703125, 1.21875, 1.48046875, 1.7421875, 2.00390625, 2.265625, 2.52734375, 2.7890625, 3.05078125, 3.3125, 3.57421875, 3.8359375, 4.09765625, 4.359375, 4.62109375, 4.8828125, 5.14453125, 5.40625, 5.66796875, 5.9296875, 6.19140625, 6.453125, 6.71484375, 6.9765625, 7.23828125, 7.5, 7.76171875, 8.0234375, 8.28515625, 8.546875, 8.80859375, 9.0703125, 9.33203125, 9.59375, 9.85546875, 10.1171875, 10.37890625, 10.640625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 5.0, 8.0, 4.0, 9.0, 19.0, 21.0, 18.0, 24.0, 30.0, 23.0, 35.0, 41.0, 47.0, 53.0, 48.0, 54.0, 55.0, 50.0, 46.0, 64.0, 45.0, 48.0, 51.0, 34.0, 32.0, 31.0, 20.0, 20.0, 14.0, 17.0, 6.0, 8.0, 4.0, 7.0, 6.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.265625, -9.9539794921875, -9.642333984375, -9.3306884765625, -9.01904296875, -8.7073974609375, -8.395751953125, -8.0841064453125, -7.7724609375, -7.4608154296875, -7.149169921875, -6.8375244140625, -6.52587890625, -6.2142333984375, -5.902587890625, -5.5909423828125, -5.279296875, -4.9676513671875, -4.656005859375, -4.3443603515625, -4.03271484375, -3.7210693359375, -3.409423828125, -3.0977783203125, -2.7861328125, -2.4744873046875, -2.162841796875, -1.8511962890625, -1.53955078125, -1.2279052734375, -0.916259765625, -0.6046142578125, -0.29296875, 0.0186767578125, 0.330322265625, 0.6419677734375, 0.95361328125, 1.2652587890625, 1.576904296875, 1.8885498046875, 2.2001953125, 2.5118408203125, 2.823486328125, 3.1351318359375, 3.44677734375, 3.7584228515625, 4.070068359375, 4.3817138671875, 4.693359375, 5.0050048828125, 5.316650390625, 5.6282958984375, 5.93994140625, 6.2515869140625, 6.563232421875, 6.8748779296875, 7.1865234375, 7.4981689453125, 7.809814453125, 8.1214599609375, 8.43310546875, 8.7447509765625, 9.056396484375, 9.3680419921875, 9.6796875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 2.0, 6.0, 8.0, 6.0, 12.0, 28.0, 41.0, 42.0, 65.0, 79.0, 164.0, 330.0, 674.0, 1647.0, 5383.0, 28860.0, 448127.0, 524328.0, 30016.0, 5592.0, 1685.0, 633.0, 321.0, 189.0, 103.0, 67.0, 39.0, 28.0, 21.0, 10.0, 14.0, 11.0, 12.0, 3.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.5546875, -4.37957763671875, -4.2044677734375, -4.02935791015625, -3.854248046875, -3.67913818359375, -3.5040283203125, -3.32891845703125, -3.15380859375, -2.97869873046875, -2.8035888671875, -2.62847900390625, -2.453369140625, -2.27825927734375, -2.1031494140625, -1.92803955078125, -1.7529296875, -1.57781982421875, -1.4027099609375, -1.22760009765625, -1.052490234375, -0.87738037109375, -0.7022705078125, -0.52716064453125, -0.35205078125, -0.17694091796875, -0.0018310546875, 0.17327880859375, 0.348388671875, 0.52349853515625, 0.6986083984375, 0.87371826171875, 1.048828125, 1.22393798828125, 1.3990478515625, 1.57415771484375, 1.749267578125, 1.92437744140625, 2.0994873046875, 2.27459716796875, 2.44970703125, 2.62481689453125, 2.7999267578125, 2.97503662109375, 3.150146484375, 3.32525634765625, 3.5003662109375, 3.67547607421875, 3.8505859375, 4.02569580078125, 4.2008056640625, 4.37591552734375, 4.551025390625, 4.72613525390625, 4.9012451171875, 5.07635498046875, 5.25146484375, 5.42657470703125, 5.6016845703125, 5.77679443359375, 5.951904296875, 6.12701416015625, 6.3021240234375, 6.47723388671875, 6.65234375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 7.0, 6.0, 11.0, 7.0, 12.0, 18.0, 20.0, 26.0, 31.0, 59.0, 60.0, 114.0, 156.0, 134.0, 89.0, 82.0, 39.0, 25.0, 23.0, 22.0, 12.0, 13.0, 15.0, 12.0, 5.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006170272827148438, -0.000593230128288269, -0.0005694329738616943, -0.0005456358194351196, -0.0005218386650085449, -0.0004980415105819702, -0.0004742443561553955, -0.0004504472017288208, -0.0004266500473022461, -0.0004028528928756714, -0.0003790557384490967, -0.00035525858402252197, -0.00033146142959594727, -0.00030766427516937256, -0.00028386712074279785, -0.00026006996631622314, -0.00023627281188964844, -0.00021247565746307373, -0.00018867850303649902, -0.00016488134860992432, -0.0001410841941833496, -0.0001172870397567749, -9.34898853302002e-05, -6.969273090362549e-05, -4.589557647705078e-05, -2.2098422050476074e-05, 1.6987323760986328e-06, 2.549588680267334e-05, 4.929304122924805e-05, 7.309019565582275e-05, 9.688735008239746e-05, 0.00012068450450897217, 0.00014448165893554688, 0.00016827881336212158, 0.0001920759677886963, 0.000215873122215271, 0.0002396702766418457, 0.0002634674310684204, 0.0002872645854949951, 0.0003110617399215698, 0.00033485889434814453, 0.00035865604877471924, 0.00038245320320129395, 0.00040625035762786865, 0.00043004751205444336, 0.00045384466648101807, 0.0004776418209075928, 0.0005014389753341675, 0.0005252361297607422, 0.0005490332841873169, 0.0005728304386138916, 0.0005966275930404663, 0.000620424747467041, 0.0006442219018936157, 0.0006680190563201904, 0.0006918162107467651, 0.0007156133651733398, 0.0007394105195999146, 0.0007632076740264893, 0.000787004828453064, 0.0008108019828796387, 0.0008345991373062134, 0.0008583962917327881, 0.0008821934461593628, 0.0009059906005859375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 5.0, 6.0, 16.0, 15.0, 22.0, 49.0, 63.0, 116.0, 260.0, 617.0, 1783.0, 8686.0, 127313.0, 867136.0, 36091.0, 4304.0, 1189.0, 447.0, 204.0, 93.0, 54.0, 29.0, 14.0, 13.0, 5.0, 9.0, 9.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.9453125, -9.6856689453125, -9.426025390625, -9.1663818359375, -8.90673828125, -8.6470947265625, -8.387451171875, -8.1278076171875, -7.8681640625, -7.6085205078125, -7.348876953125, -7.0892333984375, -6.82958984375, -6.5699462890625, -6.310302734375, -6.0506591796875, -5.791015625, -5.5313720703125, -5.271728515625, -5.0120849609375, -4.75244140625, -4.4927978515625, -4.233154296875, -3.9735107421875, -3.7138671875, -3.4542236328125, -3.194580078125, -2.9349365234375, -2.67529296875, -2.4156494140625, -2.156005859375, -1.8963623046875, -1.63671875, -1.3770751953125, -1.117431640625, -0.8577880859375, -0.59814453125, -0.3385009765625, -0.078857421875, 0.1807861328125, 0.4404296875, 0.7000732421875, 0.959716796875, 1.2193603515625, 1.47900390625, 1.7386474609375, 1.998291015625, 2.2579345703125, 2.517578125, 2.7772216796875, 3.036865234375, 3.2965087890625, 3.55615234375, 3.8157958984375, 4.075439453125, 4.3350830078125, 4.5947265625, 4.8543701171875, 5.114013671875, 5.3736572265625, 5.63330078125, 5.8929443359375, 6.152587890625, 6.4122314453125, 6.671875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 5.0, 11.0, 20.0, 24.0, 39.0, 42.0, 82.0, 145.0, 146.0, 143.0, 107.0, 91.0, 46.0, 35.0, 25.0, 15.0, 14.0, 3.0, 7.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.3359375, -9.132293701171875, -8.92864990234375, -8.725006103515625, -8.5213623046875, -8.317718505859375, -8.11407470703125, -7.910430908203125, -7.706787109375, -7.503143310546875, -7.29949951171875, -7.095855712890625, -6.8922119140625, -6.688568115234375, -6.48492431640625, -6.281280517578125, -6.07763671875, -5.873992919921875, -5.67034912109375, -5.466705322265625, -5.2630615234375, -5.059417724609375, -4.85577392578125, -4.652130126953125, -4.448486328125, -4.244842529296875, -4.04119873046875, -3.837554931640625, -3.6339111328125, -3.430267333984375, -3.22662353515625, -3.022979736328125, -2.8193359375, -2.615692138671875, -2.41204833984375, -2.208404541015625, -2.0047607421875, -1.801116943359375, -1.59747314453125, -1.393829345703125, -1.190185546875, -0.986541748046875, -0.78289794921875, -0.579254150390625, -0.3756103515625, -0.171966552734375, 0.03167724609375, 0.235321044921875, 0.43896484375, 0.642608642578125, 0.84625244140625, 1.049896240234375, 1.2535400390625, 1.457183837890625, 1.66082763671875, 1.864471435546875, 2.068115234375, 2.271759033203125, 2.47540283203125, 2.679046630859375, 2.8826904296875, 3.086334228515625, 3.28997802734375, 3.493621826171875, 3.697265625]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 5.0, 8.0, 21.0, 48.0, 102.0, 189.0, 193.0, 179.0, 129.0, 49.0, 33.0, 19.0, 7.0, 5.0, 3.0, 3.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-102.30469512939453, -99.72172546386719, -97.13876342773438, -94.55579376220703, -91.97282409667969, -89.38986206054688, -86.80689239501953, -84.22392272949219, -81.64096069335938, -79.05799102783203, -76.47502899169922, -73.89205932617188, -71.30908966064453, -68.72611999511719, -66.14315795898438, -63.56018829345703, -60.97721862792969, -58.39425277709961, -55.811283111572266, -53.22831726074219, -50.645347595214844, -48.062381744384766, -45.47941589355469, -42.896446228027344, -40.313480377197266, -37.73051452636719, -35.147544860839844, -32.564579010009766, -29.981611251831055, -27.398643493652344, -24.815677642822266, -22.232709884643555, -19.649738311767578, -17.066770553588867, -14.483803749084473, -11.900836944580078, -9.317869186401367, -6.734901428222656, -4.151934623718262, -1.5689678192138672, 1.0139999389648438, 3.5969672203063965, 6.179934501647949, 8.762901306152344, 11.345869064331055, 13.928836822509766, 16.511802673339844, 19.094770431518555, 21.677738189697266, 24.260705947875977, 26.843673706054688, 29.426639556884766, 32.009605407714844, 34.59257507324219, 37.175540924072266, 39.758506774902344, 42.34147644042969, 44.924442291259766, 47.50741195678711, 50.09037780761719, 52.67334747314453, 55.25631332397461, 57.83927917480469, 60.42224884033203, 63.00521469116211]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 0.0, 7.0, 8.0, 10.0, 15.0, 9.0, 23.0, 24.0, 29.0, 28.0, 31.0, 36.0, 50.0, 49.0, 71.0, 53.0, 56.0, 65.0, 62.0, 58.0, 48.0, 52.0, 40.0, 26.0, 30.0, 25.0, 22.0, 16.0, 14.0, 14.0, 8.0, 9.0, 6.0, 4.0, 4.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.708566665649414, -28.415071487426758, -27.1215763092041, -25.828079223632812, -24.534584045410156, -23.2410888671875, -21.947593688964844, -20.654098510742188, -19.36060333251953, -18.067108154296875, -16.77361297607422, -15.480116844177246, -14.186620712280273, -12.893125534057617, -11.599630355834961, -10.306134223937988, -9.012638092041016, -7.719142436981201, -6.425646781921387, -5.1321516036987305, -3.838655948638916, -2.5451602935791016, -1.2516651153564453, 0.041831016540527344, 1.3353261947631836, 2.628821849822998, 3.9223172664642334, 5.215812683105469, 6.509308338165283, 7.802803993225098, 9.096299171447754, 10.389795303344727, 11.68328857421875, 12.976783752441406, 14.270279884338379, 15.563775062561035, 16.857271194458008, 18.150766372680664, 19.44426155090332, 20.73775863647461, 22.031253814697266, 23.324748992919922, 24.618244171142578, 25.911739349365234, 27.205236434936523, 28.49873161315918, 29.792226791381836, 31.085723876953125, 32.37921905517578, 33.67271423339844, 34.966209411621094, 36.25970458984375, 37.553199768066406, 38.84669494628906, 40.14019012451172, 41.43368911743164, 42.72718048095703, 44.02067565917969, 45.314170837402344, 46.607666015625, 47.901161193847656, 49.19465637207031, 50.48815155029297, 51.78165054321289, 53.07514572143555]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 2.0, 10.0, 22.0, 20.0, 46.0, 60.0, 120.0, 196.0, 363.0, 676.0, 1450.0, 3396.0, 9102.0, 30827.0, 171669.0, 3257097.0, 637446.0, 57883.0, 14644.0, 5117.0, 2132.0, 900.0, 458.0, 261.0, 139.0, 81.0, 49.0, 25.0, 27.0, 22.0, 11.0, 8.0, 9.0, 5.0, 7.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.49609375, -4.314208984375, -4.13232421875, -3.950439453125, -3.7685546875, -3.586669921875, -3.40478515625, -3.222900390625, -3.041015625, -2.859130859375, -2.67724609375, -2.495361328125, -2.3134765625, -2.131591796875, -1.94970703125, -1.767822265625, -1.5859375, -1.404052734375, -1.22216796875, -1.040283203125, -0.8583984375, -0.676513671875, -0.49462890625, -0.312744140625, -0.130859375, 0.051025390625, 0.23291015625, 0.414794921875, 0.5966796875, 0.778564453125, 0.96044921875, 1.142333984375, 1.32421875, 1.506103515625, 1.68798828125, 1.869873046875, 2.0517578125, 2.233642578125, 2.41552734375, 2.597412109375, 2.779296875, 2.961181640625, 3.14306640625, 3.324951171875, 3.5068359375, 3.688720703125, 3.87060546875, 4.052490234375, 4.234375, 4.416259765625, 4.59814453125, 4.780029296875, 4.9619140625, 5.143798828125, 5.32568359375, 5.507568359375, 5.689453125, 5.871337890625, 6.05322265625, 6.235107421875, 6.4169921875, 6.598876953125, 6.78076171875, 6.962646484375, 7.14453125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 8.0, 9.0, 19.0, 20.0, 28.0, 37.0, 34.0, 47.0, 72.0, 83.0, 73.0, 75.0, 70.0, 78.0, 76.0, 64.0, 65.0, 39.0, 27.0, 23.0, 19.0, 15.0, 4.0, 11.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.015625, -1.9190673828125, -1.822509765625, -1.7259521484375, -1.62939453125, -1.5328369140625, -1.436279296875, -1.3397216796875, -1.2431640625, -1.1466064453125, -1.050048828125, -0.9534912109375, -0.85693359375, -0.7603759765625, -0.663818359375, -0.5672607421875, -0.470703125, -0.3741455078125, -0.277587890625, -0.1810302734375, -0.08447265625, 0.0120849609375, 0.108642578125, 0.2052001953125, 0.3017578125, 0.3983154296875, 0.494873046875, 0.5914306640625, 0.68798828125, 0.7845458984375, 0.881103515625, 0.9776611328125, 1.07421875, 1.1707763671875, 1.267333984375, 1.3638916015625, 1.46044921875, 1.5570068359375, 1.653564453125, 1.7501220703125, 1.8466796875, 1.9432373046875, 2.039794921875, 2.1363525390625, 2.23291015625, 2.3294677734375, 2.426025390625, 2.5225830078125, 2.619140625, 2.7156982421875, 2.812255859375, 2.9088134765625, 3.00537109375, 3.1019287109375, 3.198486328125, 3.2950439453125, 3.3916015625, 3.4881591796875, 3.584716796875, 3.6812744140625, 3.77783203125, 3.8743896484375, 3.970947265625, 4.0675048828125, 4.1640625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 0.0, 3.0, 0.0, 3.0, 5.0, 6.0, 8.0, 15.0, 25.0, 30.0, 46.0, 53.0, 109.0, 193.0, 435.0, 1061.0, 3132.0, 10429.0, 45248.0, 427371.0, 3439635.0, 221753.0, 32377.0, 8192.0, 2541.0, 909.0, 343.0, 172.0, 80.0, 43.0, 26.0, 16.0, 13.0, 6.0, 3.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.75, -4.546875, -4.34375, -4.140625, -3.9375, -3.734375, -3.53125, -3.328125, -3.125, -2.921875, -2.71875, -2.515625, -2.3125, -2.109375, -1.90625, -1.703125, -1.5, -1.296875, -1.09375, -0.890625, -0.6875, -0.484375, -0.28125, -0.078125, 0.125, 0.328125, 0.53125, 0.734375, 0.9375, 1.140625, 1.34375, 1.546875, 1.75, 1.953125, 2.15625, 2.359375, 2.5625, 2.765625, 2.96875, 3.171875, 3.375, 3.578125, 3.78125, 3.984375, 4.1875, 4.390625, 4.59375, 4.796875, 5.0, 5.203125, 5.40625, 5.609375, 5.8125, 6.015625, 6.21875, 6.421875, 6.625, 6.828125, 7.03125, 7.234375, 7.4375, 7.640625, 7.84375, 8.046875, 8.25]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 5.0, 5.0, 4.0, 11.0, 15.0, 26.0, 27.0, 45.0, 78.0, 116.0, 253.0, 470.0, 861.0, 947.0, 529.0, 250.0, 150.0, 82.0, 68.0, 43.0, 18.0, 17.0, 16.0, 16.0, 5.0, 2.0, 5.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-7.2734375, -7.09185791015625, -6.9102783203125, -6.72869873046875, -6.547119140625, -6.36553955078125, -6.1839599609375, -6.00238037109375, -5.82080078125, -5.63922119140625, -5.4576416015625, -5.27606201171875, -5.094482421875, -4.91290283203125, -4.7313232421875, -4.54974365234375, -4.3681640625, -4.18658447265625, -4.0050048828125, -3.82342529296875, -3.641845703125, -3.46026611328125, -3.2786865234375, -3.09710693359375, -2.91552734375, -2.73394775390625, -2.5523681640625, -2.37078857421875, -2.189208984375, -2.00762939453125, -1.8260498046875, -1.64447021484375, -1.462890625, -1.28131103515625, -1.0997314453125, -0.91815185546875, -0.736572265625, -0.55499267578125, -0.3734130859375, -0.19183349609375, -0.01025390625, 0.17132568359375, 0.3529052734375, 0.53448486328125, 0.716064453125, 0.89764404296875, 1.0792236328125, 1.26080322265625, 1.4423828125, 1.62396240234375, 1.8055419921875, 1.98712158203125, 2.168701171875, 2.35028076171875, 2.5318603515625, 2.71343994140625, 2.89501953125, 3.07659912109375, 3.2581787109375, 3.43975830078125, 3.621337890625, 3.80291748046875, 3.9844970703125, 4.16607666015625, 4.34765625]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 8.0, 7.0, 8.0, 14.0, 26.0, 33.0, 71.0, 140.0, 165.0, 179.0, 134.0, 74.0, 60.0, 35.0, 11.0, 4.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-40.72447204589844, -39.21959686279297, -37.7147216796875, -36.20984649658203, -34.70497131347656, -33.20009231567383, -31.69521713256836, -30.19034194946289, -28.685466766357422, -27.180591583251953, -25.675716400146484, -24.170839309692383, -22.665964126586914, -21.161088943481445, -19.656211853027344, -18.151336669921875, -16.646461486816406, -15.141586303710938, -13.636710166931152, -12.131834030151367, -10.626958847045898, -9.12208366394043, -7.6172075271606445, -6.112331390380859, -4.607456207275391, -3.1025805473327637, -1.5977048873901367, -0.09282922744750977, 1.4120464324951172, 2.916922092437744, 4.421797752380371, 5.926673889160156, 7.431552886962891, 8.93642807006836, 10.441304206848145, 11.94618034362793, 13.451055526733398, 14.955930709838867, 16.46080780029297, 17.965682983398438, 19.470558166503906, 20.975433349609375, 22.480308532714844, 23.985185623168945, 25.490060806274414, 26.994935989379883, 28.499813079833984, 30.004688262939453, 31.509563446044922, 33.01443862915039, 34.51931381225586, 36.02418899536133, 37.52906799316406, 39.03394317626953, 40.538818359375, 42.04369354248047, 43.54856872558594, 45.053443908691406, 46.558319091796875, 48.063194274902344, 49.56806945800781, 51.07294845581055, 52.577823638916016, 54.082698822021484, 55.58757400512695]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 5.0, 7.0, 6.0, 7.0, 15.0, 12.0, 29.0, 30.0, 33.0, 34.0, 43.0, 60.0, 65.0, 70.0, 70.0, 73.0, 73.0, 48.0, 65.0, 54.0, 28.0, 32.0, 36.0, 28.0, 27.0, 21.0, 10.0, 12.0, 7.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.603004455566406, -24.620500564575195, -23.637996673583984, -22.655494689941406, -21.672990798950195, -20.690486907958984, -19.707984924316406, -18.725481033325195, -17.742977142333984, -16.760473251342773, -15.777970314025879, -14.795467376708984, -13.812963485717773, -12.830459594726562, -11.847956657409668, -10.865453720092773, -9.882949829101562, -8.900445938110352, -7.917943000793457, -6.935439586639404, -5.952936172485352, -4.970432758331299, -3.987929344177246, -3.0054259300231934, -2.0229225158691406, -1.040419101715088, -0.057915687561035156, 0.9245877265930176, 1.9070911407470703, 2.889594554901123, 3.872097969055176, 4.8546013832092285, 5.837104797363281, 6.819608211517334, 7.802111625671387, 8.784614562988281, 9.767118453979492, 10.749622344970703, 11.732125282287598, 12.714628219604492, 13.697132110595703, 14.679636001586914, 15.662138938903809, 16.644641876220703, 17.627145767211914, 18.609649658203125, 19.592151641845703, 20.574655532836914, 21.557159423828125, 22.539663314819336, 23.522167205810547, 24.504669189453125, 25.487173080444336, 26.469676971435547, 27.452178955078125, 28.434682846069336, 29.417186737060547, 30.399690628051758, 31.38219451904297, 32.36469650268555, 33.347198486328125, 34.32970428466797, 35.31220626831055, 36.29471206665039, 37.27721405029297]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 9.0, 2.0, 7.0, 8.0, 6.0, 14.0, 18.0, 42.0, 60.0, 54.0, 115.0, 213.0, 324.0, 586.0, 1184.0, 2354.0, 5058.0, 11503.0, 28741.0, 78879.0, 245963.0, 414748.0, 166344.0, 55116.0, 20799.0, 8583.0, 3773.0, 1882.0, 947.0, 504.0, 274.0, 161.0, 92.0, 57.0, 42.0, 29.0, 18.0, 13.0, 11.0, 5.0, 7.0, 7.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-5.15234375, -5.00225830078125, -4.8521728515625, -4.70208740234375, -4.552001953125, -4.40191650390625, -4.2518310546875, -4.10174560546875, -3.95166015625, -3.80157470703125, -3.6514892578125, -3.50140380859375, -3.351318359375, -3.20123291015625, -3.0511474609375, -2.90106201171875, -2.7509765625, -2.60089111328125, -2.4508056640625, -2.30072021484375, -2.150634765625, -2.00054931640625, -1.8504638671875, -1.70037841796875, -1.55029296875, -1.40020751953125, -1.2501220703125, -1.10003662109375, -0.949951171875, -0.79986572265625, -0.6497802734375, -0.49969482421875, -0.349609375, -0.19952392578125, -0.0494384765625, 0.10064697265625, 0.250732421875, 0.40081787109375, 0.5509033203125, 0.70098876953125, 0.85107421875, 1.00115966796875, 1.1512451171875, 1.30133056640625, 1.451416015625, 1.60150146484375, 1.7515869140625, 1.90167236328125, 2.0517578125, 2.20184326171875, 2.3519287109375, 2.50201416015625, 2.652099609375, 2.80218505859375, 2.9522705078125, 3.10235595703125, 3.25244140625, 3.40252685546875, 3.5526123046875, 3.70269775390625, 3.852783203125, 4.00286865234375, 4.1529541015625, 4.30303955078125, 4.453125]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 4.0, 2.0, 5.0, 7.0, 6.0, 10.0, 8.0, 11.0, 8.0, 18.0, 15.0, 12.0, 18.0, 14.0, 30.0, 32.0, 20.0, 35.0, 30.0, 34.0, 43.0, 36.0, 45.0, 50.0, 46.0, 35.0, 46.0, 46.0, 44.0, 25.0, 28.0, 30.0, 28.0, 30.0, 30.0, 24.0, 19.0, 15.0, 17.0, 12.0, 10.0, 9.0, 6.0, 4.0, 7.0, 2.0, 2.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.59765625, -1.5445098876953125, -1.491363525390625, -1.4382171630859375, -1.38507080078125, -1.3319244384765625, -1.278778076171875, -1.2256317138671875, -1.1724853515625, -1.1193389892578125, -1.066192626953125, -1.0130462646484375, -0.95989990234375, -0.9067535400390625, -0.853607177734375, -0.8004608154296875, -0.747314453125, -0.6941680908203125, -0.641021728515625, -0.5878753662109375, -0.53472900390625, -0.4815826416015625, -0.428436279296875, -0.3752899169921875, -0.3221435546875, -0.2689971923828125, -0.215850830078125, -0.1627044677734375, -0.10955810546875, -0.0564117431640625, -0.003265380859375, 0.0498809814453125, 0.10302734375, 0.1561737060546875, 0.209320068359375, 0.2624664306640625, 0.31561279296875, 0.3687591552734375, 0.421905517578125, 0.4750518798828125, 0.5281982421875, 0.5813446044921875, 0.634490966796875, 0.6876373291015625, 0.74078369140625, 0.7939300537109375, 0.847076416015625, 0.9002227783203125, 0.953369140625, 1.0065155029296875, 1.059661865234375, 1.1128082275390625, 1.16595458984375, 1.2191009521484375, 1.272247314453125, 1.3253936767578125, 1.3785400390625, 1.4316864013671875, 1.484832763671875, 1.5379791259765625, 1.59112548828125, 1.6442718505859375, 1.697418212890625, 1.7505645751953125, 1.8037109375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 1.0, 1.0, 0.0, 3.0, 10.0, 6.0, 9.0, 17.0, 33.0, 33.0, 69.0, 88.0, 159.0, 279.0, 492.0, 1117.0, 2418.0, 8286.0, 40973.0, 363278.0, 561729.0, 54051.0, 10128.0, 2970.0, 1121.0, 532.0, 287.0, 166.0, 109.0, 58.0, 37.0, 32.0, 25.0, 7.0, 5.0, 9.0, 6.0, 8.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.43359375, -7.14849853515625, -6.8634033203125, -6.57830810546875, -6.293212890625, -6.00811767578125, -5.7230224609375, -5.43792724609375, -5.15283203125, -4.86773681640625, -4.5826416015625, -4.29754638671875, -4.012451171875, -3.72735595703125, -3.4422607421875, -3.15716552734375, -2.8720703125, -2.58697509765625, -2.3018798828125, -2.01678466796875, -1.731689453125, -1.44659423828125, -1.1614990234375, -0.87640380859375, -0.59130859375, -0.30621337890625, -0.0211181640625, 0.26397705078125, 0.549072265625, 0.83416748046875, 1.1192626953125, 1.40435791015625, 1.689453125, 1.97454833984375, 2.2596435546875, 2.54473876953125, 2.829833984375, 3.11492919921875, 3.4000244140625, 3.68511962890625, 3.97021484375, 4.25531005859375, 4.5404052734375, 4.82550048828125, 5.110595703125, 5.39569091796875, 5.6807861328125, 5.96588134765625, 6.2509765625, 6.53607177734375, 6.8211669921875, 7.10626220703125, 7.391357421875, 7.67645263671875, 7.9615478515625, 8.24664306640625, 8.53173828125, 8.81683349609375, 9.1019287109375, 9.38702392578125, 9.672119140625, 9.95721435546875, 10.2423095703125, 10.52740478515625, 10.8125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 4.0, 13.0, 13.0, 16.0, 16.0, 17.0, 19.0, 41.0, 32.0, 36.0, 44.0, 58.0, 48.0, 44.0, 67.0, 65.0, 77.0, 62.0, 53.0, 51.0, 46.0, 36.0, 34.0, 23.0, 13.0, 20.0, 9.0, 12.0, 9.0, 3.0, 9.0, 3.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 3.0], "bins": [-10.9921875, -10.7069091796875, -10.421630859375, -10.1363525390625, -9.85107421875, -9.5657958984375, -9.280517578125, -8.9952392578125, -8.7099609375, -8.4246826171875, -8.139404296875, -7.8541259765625, -7.56884765625, -7.2835693359375, -6.998291015625, -6.7130126953125, -6.427734375, -6.1424560546875, -5.857177734375, -5.5718994140625, -5.28662109375, -5.0013427734375, -4.716064453125, -4.4307861328125, -4.1455078125, -3.8602294921875, -3.574951171875, -3.2896728515625, -3.00439453125, -2.7191162109375, -2.433837890625, -2.1485595703125, -1.86328125, -1.5780029296875, -1.292724609375, -1.0074462890625, -0.72216796875, -0.4368896484375, -0.151611328125, 0.1336669921875, 0.4189453125, 0.7042236328125, 0.989501953125, 1.2747802734375, 1.56005859375, 1.8453369140625, 2.130615234375, 2.4158935546875, 2.701171875, 2.9864501953125, 3.271728515625, 3.5570068359375, 3.84228515625, 4.1275634765625, 4.412841796875, 4.6981201171875, 4.9833984375, 5.2686767578125, 5.553955078125, 5.8392333984375, 6.12451171875, 6.4097900390625, 6.695068359375, 6.9803466796875, 7.265625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 6.0, 11.0, 12.0, 20.0, 31.0, 74.0, 212.0, 1091.0, 28310.0, 1006673.0, 11080.0, 716.0, 172.0, 67.0, 25.0, 23.0, 9.0, 6.0, 3.0, 7.0, 2.0, 3.0, 5.0, 1.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.8671875, -10.49755859375, -10.1279296875, -9.75830078125, -9.388671875, -9.01904296875, -8.6494140625, -8.27978515625, -7.91015625, -7.54052734375, -7.1708984375, -6.80126953125, -6.431640625, -6.06201171875, -5.6923828125, -5.32275390625, -4.953125, -4.58349609375, -4.2138671875, -3.84423828125, -3.474609375, -3.10498046875, -2.7353515625, -2.36572265625, -1.99609375, -1.62646484375, -1.2568359375, -0.88720703125, -0.517578125, -0.14794921875, 0.2216796875, 0.59130859375, 0.9609375, 1.33056640625, 1.7001953125, 2.06982421875, 2.439453125, 2.80908203125, 3.1787109375, 3.54833984375, 3.91796875, 4.28759765625, 4.6572265625, 5.02685546875, 5.396484375, 5.76611328125, 6.1357421875, 6.50537109375, 6.875, 7.24462890625, 7.6142578125, 7.98388671875, 8.353515625, 8.72314453125, 9.0927734375, 9.46240234375, 9.83203125, 10.20166015625, 10.5712890625, 10.94091796875, 11.310546875, 11.68017578125, 12.0498046875, 12.41943359375, 12.7890625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 2.0, 4.0, 1.0, 9.0, 9.0, 5.0, 20.0, 13.0, 23.0, 30.0, 48.0, 61.0, 88.0, 114.0, 159.0, 124.0, 81.0, 70.0, 23.0, 30.0, 18.0, 8.0, 12.0, 12.0, 2.0, 11.0, 7.0, 7.0, 2.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00083160400390625, -0.0008105486631393433, -0.0007894933223724365, -0.0007684379816055298, -0.000747382640838623, -0.0007263273000717163, -0.0007052719593048096, -0.0006842166185379028, -0.0006631612777709961, -0.0006421059370040894, -0.0006210505962371826, -0.0005999952554702759, -0.0005789399147033691, -0.0005578845739364624, -0.0005368292331695557, -0.0005157738924026489, -0.0004947185516357422, -0.00047366321086883545, -0.0004526078701019287, -0.00043155252933502197, -0.00041049718856811523, -0.0003894418478012085, -0.00036838650703430176, -0.000347331166267395, -0.0003262758255004883, -0.00030522048473358154, -0.0002841651439666748, -0.00026310980319976807, -0.00024205446243286133, -0.0002209991216659546, -0.00019994378089904785, -0.0001788884401321411, -0.00015783309936523438, -0.00013677775859832764, -0.0001157224178314209, -9.466707706451416e-05, -7.361173629760742e-05, -5.2556395530700684e-05, -3.1501054763793945e-05, -1.0445713996887207e-05, 1.0609626770019531e-05, 3.166496753692627e-05, 5.272030830383301e-05, 7.377564907073975e-05, 9.483098983764648e-05, 0.00011588633060455322, 0.00013694167137145996, 0.0001579970121383667, 0.00017905235290527344, 0.00020010769367218018, 0.00022116303443908691, 0.00024221837520599365, 0.0002632737159729004, 0.00028432905673980713, 0.00030538439750671387, 0.0003264397382736206, 0.00034749507904052734, 0.0003685504198074341, 0.0003896057605743408, 0.00041066110134124756, 0.0004317164421081543, 0.00045277178287506104, 0.0004738271236419678, 0.0004948824644088745, 0.0005159378051757812]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 0.0, 3.0, 3.0, 3.0, 6.0, 9.0, 11.0, 10.0, 18.0, 25.0, 39.0, 59.0, 108.0, 158.0, 268.0, 535.0, 1034.0, 2368.0, 6882.0, 29384.0, 224384.0, 675421.0, 85748.0, 14667.0, 4187.0, 1554.0, 688.0, 372.0, 224.0, 133.0, 73.0, 57.0, 33.0, 25.0, 18.0, 14.0, 10.0, 7.0, 5.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.9140625, -2.81103515625, -2.7080078125, -2.60498046875, -2.501953125, -2.39892578125, -2.2958984375, -2.19287109375, -2.08984375, -1.98681640625, -1.8837890625, -1.78076171875, -1.677734375, -1.57470703125, -1.4716796875, -1.36865234375, -1.265625, -1.16259765625, -1.0595703125, -0.95654296875, -0.853515625, -0.75048828125, -0.6474609375, -0.54443359375, -0.44140625, -0.33837890625, -0.2353515625, -0.13232421875, -0.029296875, 0.07373046875, 0.1767578125, 0.27978515625, 0.3828125, 0.48583984375, 0.5888671875, 0.69189453125, 0.794921875, 0.89794921875, 1.0009765625, 1.10400390625, 1.20703125, 1.31005859375, 1.4130859375, 1.51611328125, 1.619140625, 1.72216796875, 1.8251953125, 1.92822265625, 2.03125, 2.13427734375, 2.2373046875, 2.34033203125, 2.443359375, 2.54638671875, 2.6494140625, 2.75244140625, 2.85546875, 2.95849609375, 3.0615234375, 3.16455078125, 3.267578125, 3.37060546875, 3.4736328125, 3.57666015625, 3.6796875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 4.0, 4.0, 3.0, 4.0, 10.0, 8.0, 13.0, 16.0, 18.0, 30.0, 37.0, 74.0, 55.0, 97.0, 117.0, 112.0, 96.0, 76.0, 63.0, 49.0, 30.0, 25.0, 14.0, 10.0, 10.0, 9.0, 9.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.958984375, -2.858001708984375, -2.75701904296875, -2.656036376953125, -2.5550537109375, -2.454071044921875, -2.35308837890625, -2.252105712890625, -2.151123046875, -2.050140380859375, -1.94915771484375, -1.848175048828125, -1.7471923828125, -1.646209716796875, -1.54522705078125, -1.444244384765625, -1.34326171875, -1.242279052734375, -1.14129638671875, -1.040313720703125, -0.9393310546875, -0.838348388671875, -0.73736572265625, -0.636383056640625, -0.535400390625, -0.434417724609375, -0.33343505859375, -0.232452392578125, -0.1314697265625, -0.030487060546875, 0.07049560546875, 0.171478271484375, 0.2724609375, 0.373443603515625, 0.47442626953125, 0.575408935546875, 0.6763916015625, 0.777374267578125, 0.87835693359375, 0.979339599609375, 1.080322265625, 1.181304931640625, 1.28228759765625, 1.383270263671875, 1.4842529296875, 1.585235595703125, 1.68621826171875, 1.787200927734375, 1.88818359375, 1.989166259765625, 2.09014892578125, 2.191131591796875, 2.2921142578125, 2.393096923828125, 2.49407958984375, 2.595062255859375, 2.696044921875, 2.797027587890625, 2.89801025390625, 2.998992919921875, 3.0999755859375, 3.200958251953125, 3.30194091796875, 3.402923583984375, 3.50390625]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 7.0, 10.0, 24.0, 28.0, 51.0, 99.0, 107.0, 179.0, 171.0, 117.0, 88.0, 47.0, 27.0, 14.0, 13.0, 4.0, 2.0, 4.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.706787109375, -41.12086486816406, -39.534942626953125, -37.94902420043945, -36.363101959228516, -34.77717971801758, -33.19125747680664, -31.605337142944336, -30.01941680908203, -28.433494567871094, -26.84757423400879, -25.26165199279785, -23.675731658935547, -22.08980941772461, -20.503887176513672, -18.917966842651367, -17.33204460144043, -15.746123313903809, -14.160202026367188, -12.57427978515625, -10.988359451293945, -9.402437210083008, -7.816515922546387, -6.230594635009766, -4.6446733474731445, -3.0587520599365234, -1.4728305339813232, 0.11309099197387695, 1.699012279510498, 3.284933567047119, 4.870855331420898, 6.4567766189575195, 8.04269790649414, 9.628619194030762, 11.214540481567383, 12.80046272277832, 14.386383056640625, 15.972305297851562, 17.5582275390625, 19.144147872924805, 20.73006820678711, 22.315990447998047, 23.90191078186035, 25.48783302307129, 27.073753356933594, 28.65967559814453, 30.24559783935547, 31.831518173217773, 33.417442321777344, 35.00336456298828, 36.58928680419922, 38.17520523071289, 39.76112747192383, 41.347049713134766, 42.9329719543457, 44.518890380859375, 46.10481262207031, 47.69073486328125, 49.27665710449219, 50.86257553100586, 52.4484977722168, 54.034420013427734, 55.62034225463867, 57.206260681152344, 58.79218292236328]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 4.0, 5.0, 6.0, 9.0, 14.0, 10.0, 14.0, 17.0, 17.0, 18.0, 18.0, 33.0, 27.0, 33.0, 29.0, 36.0, 48.0, 46.0, 54.0, 49.0, 61.0, 50.0, 42.0, 55.0, 42.0, 44.0, 24.0, 29.0, 26.0, 26.0, 18.0, 19.0, 16.0, 14.0, 5.0, 9.0, 5.0, 8.0, 6.0, 7.0, 2.0, 3.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.030855178833008, -29.050264358520508, -28.069673538208008, -27.089082717895508, -26.108489990234375, -25.127899169921875, -24.147308349609375, -23.166717529296875, -22.186126708984375, -21.205535888671875, -20.224945068359375, -19.244354248046875, -18.263763427734375, -17.283172607421875, -16.302579879760742, -15.321989059448242, -14.341398239135742, -13.360807418823242, -12.380216598510742, -11.399624824523926, -10.419034004211426, -9.438443183898926, -8.45785140991211, -7.477260589599609, -6.496669769287109, -5.516078948974609, -4.535487651824951, -3.554896593093872, -2.574305534362793, -1.593714714050293, -0.6131234169006348, 0.36746788024902344, 1.3480606079101562, 2.3286516666412354, 3.3092427253723145, 4.289834022521973, 5.270424842834473, 6.251015663146973, 7.231606960296631, 8.212198257446289, 9.192789077758789, 10.173379898071289, 11.153970718383789, 12.134562492370605, 13.115153312683105, 14.095744132995605, 15.076335906982422, 16.056926727294922, 17.037517547607422, 18.018108367919922, 18.998699188232422, 19.979290008544922, 20.959880828857422, 21.940471649169922, 22.921064376831055, 23.901655197143555, 24.882246017456055, 25.862836837768555, 26.843427658081055, 27.824018478393555, 28.804611206054688, 29.785202026367188, 30.765792846679688, 31.746383666992188, 32.72697448730469]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 4.0, 6.0, 7.0, 13.0, 17.0, 28.0, 36.0, 57.0, 88.0, 137.0, 237.0, 404.0, 692.0, 1280.0, 2700.0, 6283.0, 15990.0, 50483.0, 242386.0, 2254493.0, 1404831.0, 155094.0, 36779.0, 12376.0, 4893.0, 2253.0, 1124.0, 655.0, 354.0, 196.0, 112.0, 91.0, 53.0, 34.0, 23.0, 26.0, 15.0, 11.0, 8.0, 2.0, 1.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.361328125, -3.252471923828125, -3.14361572265625, -3.034759521484375, -2.9259033203125, -2.817047119140625, -2.70819091796875, -2.599334716796875, -2.490478515625, -2.381622314453125, -2.27276611328125, -2.163909912109375, -2.0550537109375, -1.946197509765625, -1.83734130859375, -1.728485107421875, -1.61962890625, -1.510772705078125, -1.40191650390625, -1.293060302734375, -1.1842041015625, -1.075347900390625, -0.96649169921875, -0.857635498046875, -0.748779296875, -0.639923095703125, -0.53106689453125, -0.422210693359375, -0.3133544921875, -0.204498291015625, -0.09564208984375, 0.013214111328125, 0.1220703125, 0.230926513671875, 0.33978271484375, 0.448638916015625, 0.5574951171875, 0.666351318359375, 0.77520751953125, 0.884063720703125, 0.992919921875, 1.101776123046875, 1.21063232421875, 1.319488525390625, 1.4283447265625, 1.537200927734375, 1.64605712890625, 1.754913330078125, 1.86376953125, 1.972625732421875, 2.08148193359375, 2.190338134765625, 2.2991943359375, 2.408050537109375, 2.51690673828125, 2.625762939453125, 2.734619140625, 2.843475341796875, 2.95233154296875, 3.061187744140625, 3.1700439453125, 3.278900146484375, 3.38775634765625, 3.496612548828125, 3.60546875]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 5.0, 6.0, 6.0, 5.0, 12.0, 11.0, 23.0, 13.0, 25.0, 30.0, 29.0, 32.0, 41.0, 51.0, 56.0, 60.0, 56.0, 57.0, 66.0, 70.0, 51.0, 44.0, 48.0, 34.0, 33.0, 42.0, 16.0, 20.0, 20.0, 14.0, 8.0, 8.0, 5.0, 5.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.234375, -2.167816162109375, -2.10125732421875, -2.034698486328125, -1.9681396484375, -1.901580810546875, -1.83502197265625, -1.768463134765625, -1.701904296875, -1.635345458984375, -1.56878662109375, -1.502227783203125, -1.4356689453125, -1.369110107421875, -1.30255126953125, -1.235992431640625, -1.16943359375, -1.102874755859375, -1.03631591796875, -0.969757080078125, -0.9031982421875, -0.836639404296875, -0.77008056640625, -0.703521728515625, -0.636962890625, -0.570404052734375, -0.50384521484375, -0.437286376953125, -0.3707275390625, -0.304168701171875, -0.23760986328125, -0.171051025390625, -0.1044921875, -0.037933349609375, 0.02862548828125, 0.095184326171875, 0.1617431640625, 0.228302001953125, 0.29486083984375, 0.361419677734375, 0.427978515625, 0.494537353515625, 0.56109619140625, 0.627655029296875, 0.6942138671875, 0.760772705078125, 0.82733154296875, 0.893890380859375, 0.96044921875, 1.027008056640625, 1.09356689453125, 1.160125732421875, 1.2266845703125, 1.293243408203125, 1.35980224609375, 1.426361083984375, 1.492919921875, 1.559478759765625, 1.62603759765625, 1.692596435546875, 1.7591552734375, 1.825714111328125, 1.89227294921875, 1.958831787109375, 2.025390625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [4.0, 2.0, 0.0, 1.0, 1.0, 7.0, 3.0, 4.0, 8.0, 13.0, 15.0, 18.0, 39.0, 42.0, 72.0, 117.0, 205.0, 333.0, 590.0, 1274.0, 2626.0, 6723.0, 20603.0, 78736.0, 502461.0, 3039244.0, 440751.0, 72244.0, 18518.0, 5728.0, 2117.0, 896.0, 403.0, 190.0, 116.0, 66.0, 47.0, 35.0, 17.0, 14.0, 6.0, 1.0, 1.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.474609375, -3.338226318359375, -3.20184326171875, -3.065460205078125, -2.9290771484375, -2.792694091796875, -2.65631103515625, -2.519927978515625, -2.383544921875, -2.247161865234375, -2.11077880859375, -1.974395751953125, -1.8380126953125, -1.701629638671875, -1.56524658203125, -1.428863525390625, -1.29248046875, -1.156097412109375, -1.01971435546875, -0.883331298828125, -0.7469482421875, -0.610565185546875, -0.47418212890625, -0.337799072265625, -0.201416015625, -0.065032958984375, 0.07135009765625, 0.207733154296875, 0.3441162109375, 0.480499267578125, 0.61688232421875, 0.753265380859375, 0.8896484375, 1.026031494140625, 1.16241455078125, 1.298797607421875, 1.4351806640625, 1.571563720703125, 1.70794677734375, 1.844329833984375, 1.980712890625, 2.117095947265625, 2.25347900390625, 2.389862060546875, 2.5262451171875, 2.662628173828125, 2.79901123046875, 2.935394287109375, 3.07177734375, 3.208160400390625, 3.34454345703125, 3.480926513671875, 3.6173095703125, 3.753692626953125, 3.89007568359375, 4.026458740234375, 4.162841796875, 4.299224853515625, 4.43560791015625, 4.571990966796875, 4.7083740234375, 4.844757080078125, 4.98114013671875, 5.117523193359375, 5.25390625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 5.0, 5.0, 4.0, 10.0, 7.0, 6.0, 4.0, 18.0, 22.0, 19.0, 26.0, 37.0, 54.0, 61.0, 110.0, 114.0, 198.0, 317.0, 444.0, 568.0, 610.0, 442.0, 299.0, 192.0, 127.0, 89.0, 71.0, 50.0, 48.0, 32.0, 24.0, 15.0, 7.0, 12.0, 8.0, 6.0, 5.0, 1.0, 6.0, 3.0, 3.0, 0.0, 2.0], "bins": [-5.26171875, -5.133636474609375, -5.00555419921875, -4.877471923828125, -4.7493896484375, -4.621307373046875, -4.49322509765625, -4.365142822265625, -4.237060546875, -4.108978271484375, -3.98089599609375, -3.852813720703125, -3.7247314453125, -3.596649169921875, -3.46856689453125, -3.340484619140625, -3.21240234375, -3.084320068359375, -2.95623779296875, -2.828155517578125, -2.7000732421875, -2.571990966796875, -2.44390869140625, -2.315826416015625, -2.187744140625, -2.059661865234375, -1.93157958984375, -1.803497314453125, -1.6754150390625, -1.547332763671875, -1.41925048828125, -1.291168212890625, -1.1630859375, -1.035003662109375, -0.90692138671875, -0.778839111328125, -0.6507568359375, -0.522674560546875, -0.39459228515625, -0.266510009765625, -0.138427734375, -0.010345458984375, 0.11773681640625, 0.245819091796875, 0.3739013671875, 0.501983642578125, 0.63006591796875, 0.758148193359375, 0.88623046875, 1.014312744140625, 1.14239501953125, 1.270477294921875, 1.3985595703125, 1.526641845703125, 1.65472412109375, 1.782806396484375, 1.910888671875, 2.038970947265625, 2.16705322265625, 2.295135498046875, 2.4232177734375, 2.551300048828125, 2.67938232421875, 2.807464599609375, 2.935546875]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 5.0, 3.0, 6.0, 10.0, 50.0, 167.0, 374.0, 261.0, 89.0, 29.0, 8.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-177.92782592773438, -174.41653442382812, -170.9052276611328, -167.39393615722656, -163.88262939453125, -160.371337890625, -156.86004638671875, -153.34873962402344, -149.8374481201172, -146.32615661621094, -142.81484985351562, -139.30355834960938, -135.79225158691406, -132.2809600830078, -128.7696533203125, -125.25836181640625, -121.74706268310547, -118.23576354980469, -114.7244644165039, -111.21316528320312, -107.70187377929688, -104.1905746459961, -100.67927551269531, -97.16797637939453, -93.65667724609375, -90.14537811279297, -86.63407897949219, -83.12278747558594, -79.61148834228516, -76.10018920898438, -72.5888900756836, -69.07759094238281, -65.56629943847656, -62.05500030517578, -58.543704986572266, -55.032405853271484, -51.52111053466797, -48.00981140136719, -44.498512268066406, -40.987213134765625, -37.47591781616211, -33.96461868286133, -30.453323364257812, -26.94202423095703, -23.430727005004883, -19.919429779052734, -16.408130645751953, -12.896833419799805, -9.385536193847656, -5.87423849105835, -2.362940788269043, 1.1483573913574219, 4.65965461730957, 8.170951843261719, 11.6822509765625, 15.193548202514648, 18.704845428466797, 22.216142654418945, 25.727439880371094, 29.238739013671875, 32.750038146972656, 36.26133346557617, 39.77263259887695, 43.28392791748047, 46.79522705078125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 9.0, 4.0, 9.0, 14.0, 17.0, 18.0, 27.0, 31.0, 29.0, 41.0, 43.0, 54.0, 51.0, 46.0, 49.0, 40.0, 52.0, 50.0, 55.0, 54.0, 43.0, 35.0, 31.0, 31.0, 34.0, 21.0, 28.0, 13.0, 18.0, 7.0, 10.0, 8.0, 3.0, 10.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.25941276550293, -21.451753616333008, -20.644094467163086, -19.836435317993164, -19.028776168823242, -18.22111701965332, -17.41345977783203, -16.60580062866211, -15.798140525817871, -14.99048137664795, -14.182822227478027, -13.375164031982422, -12.5675048828125, -11.759845733642578, -10.952186584472656, -10.144527435302734, -9.336868286132812, -8.52920913696289, -7.721549987792969, -6.913891315460205, -6.106232166290283, -5.298573017120361, -4.490914344787598, -3.683255195617676, -2.875596046447754, -2.067936897277832, -1.2602779865264893, -0.4526190757751465, 0.3550400733947754, 1.1626992225646973, 1.970357894897461, 2.778017044067383, 3.5856781005859375, 4.393337249755859, 5.200996398925781, 6.008655071258545, 6.816314220428467, 7.623973369598389, 8.431632041931152, 9.239291191101074, 10.046950340270996, 10.854609489440918, 11.66226863861084, 12.469926834106445, 13.277585983276367, 14.085245132446289, 14.892904281616211, 15.700563430786133, 16.508222579956055, 17.315881729125977, 18.1235408782959, 18.93120002746582, 19.738859176635742, 20.546518325805664, 21.354175567626953, 22.161834716796875, 22.969493865966797, 23.77715301513672, 24.58481216430664, 25.392471313476562, 26.200130462646484, 27.007789611816406, 27.815448760986328, 28.62310791015625, 29.430767059326172]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 9.0, 9.0, 8.0, 21.0, 19.0, 27.0, 44.0, 94.0, 122.0, 191.0, 389.0, 705.0, 1401.0, 3314.0, 8473.0, 23713.0, 70627.0, 208732.0, 396476.0, 218769.0, 74381.0, 25212.0, 9065.0, 3556.0, 1522.0, 763.0, 359.0, 193.0, 132.0, 87.0, 55.0, 30.0, 19.0, 13.0, 11.0, 5.0, 4.0, 4.0, 6.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.0390625, -4.897216796875, -4.75537109375, -4.613525390625, -4.4716796875, -4.329833984375, -4.18798828125, -4.046142578125, -3.904296875, -3.762451171875, -3.62060546875, -3.478759765625, -3.3369140625, -3.195068359375, -3.05322265625, -2.911376953125, -2.76953125, -2.627685546875, -2.48583984375, -2.343994140625, -2.2021484375, -2.060302734375, -1.91845703125, -1.776611328125, -1.634765625, -1.492919921875, -1.35107421875, -1.209228515625, -1.0673828125, -0.925537109375, -0.78369140625, -0.641845703125, -0.5, -0.358154296875, -0.21630859375, -0.074462890625, 0.0673828125, 0.209228515625, 0.35107421875, 0.492919921875, 0.634765625, 0.776611328125, 0.91845703125, 1.060302734375, 1.2021484375, 1.343994140625, 1.48583984375, 1.627685546875, 1.76953125, 1.911376953125, 2.05322265625, 2.195068359375, 2.3369140625, 2.478759765625, 2.62060546875, 2.762451171875, 2.904296875, 3.046142578125, 3.18798828125, 3.329833984375, 3.4716796875, 3.613525390625, 3.75537109375, 3.897216796875, 4.0390625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 6.0, 5.0, 12.0, 4.0, 11.0, 15.0, 18.0, 15.0, 30.0, 18.0, 34.0, 33.0, 40.0, 40.0, 33.0, 32.0, 45.0, 37.0, 50.0, 55.0, 50.0, 52.0, 33.0, 40.0, 40.0, 41.0, 41.0, 47.0, 27.0, 18.0, 17.0, 13.0, 12.0, 10.0, 6.0, 11.0, 6.0, 4.0, 5.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7431640625, -1.6873016357421875, -1.631439208984375, -1.5755767822265625, -1.51971435546875, -1.4638519287109375, -1.407989501953125, -1.3521270751953125, -1.2962646484375, -1.2404022216796875, -1.184539794921875, -1.1286773681640625, -1.07281494140625, -1.0169525146484375, -0.961090087890625, -0.9052276611328125, -0.849365234375, -0.7935028076171875, -0.737640380859375, -0.6817779541015625, -0.62591552734375, -0.5700531005859375, -0.514190673828125, -0.4583282470703125, -0.4024658203125, -0.3466033935546875, -0.290740966796875, -0.2348785400390625, -0.17901611328125, -0.1231536865234375, -0.067291259765625, -0.0114288330078125, 0.04443359375, 0.1002960205078125, 0.156158447265625, 0.2120208740234375, 0.26788330078125, 0.3237457275390625, 0.379608154296875, 0.4354705810546875, 0.4913330078125, 0.5471954345703125, 0.603057861328125, 0.6589202880859375, 0.71478271484375, 0.7706451416015625, 0.826507568359375, 0.8823699951171875, 0.938232421875, 0.9940948486328125, 1.049957275390625, 1.1058197021484375, 1.16168212890625, 1.2175445556640625, 1.273406982421875, 1.3292694091796875, 1.3851318359375, 1.4409942626953125, 1.496856689453125, 1.5527191162109375, 1.60858154296875, 1.6644439697265625, 1.720306396484375, 1.7761688232421875, 1.83203125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 7.0, 7.0, 7.0, 7.0, 10.0, 18.0, 15.0, 23.0, 45.0, 64.0, 90.0, 108.0, 206.0, 329.0, 485.0, 805.0, 1452.0, 2951.0, 9162.0, 55325.0, 630254.0, 302648.0, 32356.0, 6580.0, 2423.0, 1186.0, 712.0, 458.0, 260.0, 184.0, 118.0, 87.0, 45.0, 48.0, 27.0, 13.0, 10.0, 6.0, 7.0, 4.0, 1.0, 3.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-8.5625, -8.302001953125, -8.04150390625, -7.781005859375, -7.5205078125, -7.260009765625, -6.99951171875, -6.739013671875, -6.478515625, -6.218017578125, -5.95751953125, -5.697021484375, -5.4365234375, -5.176025390625, -4.91552734375, -4.655029296875, -4.39453125, -4.134033203125, -3.87353515625, -3.613037109375, -3.3525390625, -3.092041015625, -2.83154296875, -2.571044921875, -2.310546875, -2.050048828125, -1.78955078125, -1.529052734375, -1.2685546875, -1.008056640625, -0.74755859375, -0.487060546875, -0.2265625, 0.033935546875, 0.29443359375, 0.554931640625, 0.8154296875, 1.075927734375, 1.33642578125, 1.596923828125, 1.857421875, 2.117919921875, 2.37841796875, 2.638916015625, 2.8994140625, 3.159912109375, 3.42041015625, 3.680908203125, 3.94140625, 4.201904296875, 4.46240234375, 4.722900390625, 4.9833984375, 5.243896484375, 5.50439453125, 5.764892578125, 6.025390625, 6.285888671875, 6.54638671875, 6.806884765625, 7.0673828125, 7.327880859375, 7.58837890625, 7.848876953125, 8.109375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 4.0, 2.0, 7.0, 11.0, 17.0, 8.0, 20.0, 21.0, 20.0, 32.0, 19.0, 32.0, 28.0, 33.0, 41.0, 40.0, 44.0, 40.0, 57.0, 69.0, 52.0, 37.0, 46.0, 46.0, 51.0, 37.0, 34.0, 25.0, 13.0, 29.0, 14.0, 14.0, 16.0, 7.0, 8.0, 4.0, 8.0, 3.0, 3.0, 1.0, 2.0, 4.0, 0.0, 4.0, 2.0, 1.0, 1.0, 1.0], "bins": [-8.25, -8.01751708984375, -7.7850341796875, -7.55255126953125, -7.320068359375, -7.08758544921875, -6.8551025390625, -6.62261962890625, -6.39013671875, -6.15765380859375, -5.9251708984375, -5.69268798828125, -5.460205078125, -5.22772216796875, -4.9952392578125, -4.76275634765625, -4.5302734375, -4.29779052734375, -4.0653076171875, -3.83282470703125, -3.600341796875, -3.36785888671875, -3.1353759765625, -2.90289306640625, -2.67041015625, -2.43792724609375, -2.2054443359375, -1.97296142578125, -1.740478515625, -1.50799560546875, -1.2755126953125, -1.04302978515625, -0.810546875, -0.57806396484375, -0.3455810546875, -0.11309814453125, 0.119384765625, 0.35186767578125, 0.5843505859375, 0.81683349609375, 1.04931640625, 1.28179931640625, 1.5142822265625, 1.74676513671875, 1.979248046875, 2.21173095703125, 2.4442138671875, 2.67669677734375, 2.9091796875, 3.14166259765625, 3.3741455078125, 3.60662841796875, 3.839111328125, 4.07159423828125, 4.3040771484375, 4.53656005859375, 4.76904296875, 5.00152587890625, 5.2340087890625, 5.46649169921875, 5.698974609375, 5.93145751953125, 6.1639404296875, 6.39642333984375, 6.62890625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 11.0, 19.0, 24.0, 53.0, 126.0, 309.0, 1259.0, 15143.0, 883827.0, 142847.0, 3922.0, 598.0, 205.0, 91.0, 43.0, 34.0, 14.0, 12.0, 8.0, 3.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.953125, -7.753173828125, -7.55322265625, -7.353271484375, -7.1533203125, -6.953369140625, -6.75341796875, -6.553466796875, -6.353515625, -6.153564453125, -5.95361328125, -5.753662109375, -5.5537109375, -5.353759765625, -5.15380859375, -4.953857421875, -4.75390625, -4.553955078125, -4.35400390625, -4.154052734375, -3.9541015625, -3.754150390625, -3.55419921875, -3.354248046875, -3.154296875, -2.954345703125, -2.75439453125, -2.554443359375, -2.3544921875, -2.154541015625, -1.95458984375, -1.754638671875, -1.5546875, -1.354736328125, -1.15478515625, -0.954833984375, -0.7548828125, -0.554931640625, -0.35498046875, -0.155029296875, 0.044921875, 0.244873046875, 0.44482421875, 0.644775390625, 0.8447265625, 1.044677734375, 1.24462890625, 1.444580078125, 1.64453125, 1.844482421875, 2.04443359375, 2.244384765625, 2.4443359375, 2.644287109375, 2.84423828125, 3.044189453125, 3.244140625, 3.444091796875, 3.64404296875, 3.843994140625, 4.0439453125, 4.243896484375, 4.44384765625, 4.643798828125, 4.84375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 5.0, 7.0, 8.0, 13.0, 8.0, 10.0, 18.0, 18.0, 17.0, 14.0, 24.0, 21.0, 31.0, 45.0, 56.0, 70.0, 109.0, 113.0, 78.0, 73.0, 49.0, 29.0, 31.0, 24.0, 31.0, 23.0, 12.0, 17.0, 9.0, 9.0, 3.0, 2.0, 5.0, 5.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004487037658691406, -0.0004339292645454407, -0.0004191547632217407, -0.00040438026189804077, -0.0003896057605743408, -0.00037483125925064087, -0.0003600567579269409, -0.00034528225660324097, -0.000330507755279541, -0.00031573325395584106, -0.0003009587526321411, -0.00028618425130844116, -0.0002714097499847412, -0.00025663524866104126, -0.0002418607473373413, -0.00022708624601364136, -0.0002123117446899414, -0.00019753724336624146, -0.0001827627420425415, -0.00016798824071884155, -0.0001532137393951416, -0.00013843923807144165, -0.0001236647367477417, -0.00010889023542404175, -9.41157341003418e-05, -7.934123277664185e-05, -6.45667314529419e-05, -4.979223012924194e-05, -3.501772880554199e-05, -2.024322748184204e-05, -5.46872615814209e-06, 9.305775165557861e-06, 2.4080276489257812e-05, 3.8854777812957764e-05, 5.3629279136657715e-05, 6.840378046035767e-05, 8.317828178405762e-05, 9.795278310775757e-05, 0.00011272728443145752, 0.00012750178575515747, 0.00014227628707885742, 0.00015705078840255737, 0.00017182528972625732, 0.00018659979104995728, 0.00020137429237365723, 0.00021614879369735718, 0.00023092329502105713, 0.0002456977963447571, 0.00026047229766845703, 0.000275246798992157, 0.00029002130031585693, 0.0003047958016395569, 0.00031957030296325684, 0.0003343448042869568, 0.00034911930561065674, 0.0003638938069343567, 0.00037866830825805664, 0.0003934428095817566, 0.00040821731090545654, 0.0004229918122291565, 0.00043776631355285645, 0.0004525408148765564, 0.00046731531620025635, 0.0004820898175239563, 0.0004968643188476562]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 4.0, 0.0, 6.0, 3.0, 7.0, 10.0, 21.0, 14.0, 18.0, 40.0, 59.0, 87.0, 192.0, 309.0, 562.0, 1163.0, 3266.0, 12716.0, 90927.0, 787760.0, 128915.0, 16084.0, 3671.0, 1357.0, 582.0, 326.0, 171.0, 105.0, 69.0, 36.0, 32.0, 17.0, 11.0, 10.0, 7.0, 1.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.482421875, -2.377105712890625, -2.27178955078125, -2.166473388671875, -2.0611572265625, -1.955841064453125, -1.85052490234375, -1.745208740234375, -1.639892578125, -1.534576416015625, -1.42926025390625, -1.323944091796875, -1.2186279296875, -1.113311767578125, -1.00799560546875, -0.902679443359375, -0.79736328125, -0.692047119140625, -0.58673095703125, -0.481414794921875, -0.3760986328125, -0.270782470703125, -0.16546630859375, -0.060150146484375, 0.045166015625, 0.150482177734375, 0.25579833984375, 0.361114501953125, 0.4664306640625, 0.571746826171875, 0.67706298828125, 0.782379150390625, 0.8876953125, 0.993011474609375, 1.09832763671875, 1.203643798828125, 1.3089599609375, 1.414276123046875, 1.51959228515625, 1.624908447265625, 1.730224609375, 1.835540771484375, 1.94085693359375, 2.046173095703125, 2.1514892578125, 2.256805419921875, 2.36212158203125, 2.467437744140625, 2.57275390625, 2.678070068359375, 2.78338623046875, 2.888702392578125, 2.9940185546875, 3.099334716796875, 3.20465087890625, 3.309967041015625, 3.415283203125, 3.520599365234375, 3.62591552734375, 3.731231689453125, 3.8365478515625, 3.941864013671875, 4.04718017578125, 4.152496337890625, 4.2578125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 3.0, 3.0, 9.0, 9.0, 5.0, 8.0, 8.0, 6.0, 9.0, 14.0, 31.0, 32.0, 37.0, 40.0, 54.0, 51.0, 67.0, 100.0, 96.0, 82.0, 62.0, 73.0, 36.0, 32.0, 29.0, 17.0, 18.0, 17.0, 15.0, 8.0, 10.0, 6.0, 2.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.17578125, -2.10784912109375, -2.0399169921875, -1.97198486328125, -1.904052734375, -1.83612060546875, -1.7681884765625, -1.70025634765625, -1.63232421875, -1.56439208984375, -1.4964599609375, -1.42852783203125, -1.360595703125, -1.29266357421875, -1.2247314453125, -1.15679931640625, -1.0888671875, -1.02093505859375, -0.9530029296875, -0.88507080078125, -0.817138671875, -0.74920654296875, -0.6812744140625, -0.61334228515625, -0.54541015625, -0.47747802734375, -0.4095458984375, -0.34161376953125, -0.273681640625, -0.20574951171875, -0.1378173828125, -0.06988525390625, -0.001953125, 0.06597900390625, 0.1339111328125, 0.20184326171875, 0.269775390625, 0.33770751953125, 0.4056396484375, 0.47357177734375, 0.54150390625, 0.60943603515625, 0.6773681640625, 0.74530029296875, 0.813232421875, 0.88116455078125, 0.9490966796875, 1.01702880859375, 1.0849609375, 1.15289306640625, 1.2208251953125, 1.28875732421875, 1.356689453125, 1.42462158203125, 1.4925537109375, 1.56048583984375, 1.62841796875, 1.69635009765625, 1.7642822265625, 1.83221435546875, 1.900146484375, 1.96807861328125, 2.0360107421875, 2.10394287109375, 2.171875]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 2.0, 4.0, 5.0, 6.0, 17.0, 27.0, 72.0, 148.0, 179.0, 242.0, 133.0, 75.0, 43.0, 19.0, 9.0, 5.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.4610710144043, -48.66960144042969, -46.878135681152344, -45.086666107177734, -43.295196533203125, -41.503726959228516, -39.712257385253906, -37.92079162597656, -36.12932205200195, -34.337852478027344, -32.54638671875, -30.75491714477539, -28.96344757080078, -27.171977996826172, -25.380510330200195, -23.58904266357422, -21.79757308959961, -20.006103515625, -18.214635848999023, -16.423168182373047, -14.631698608398438, -12.840229988098145, -11.048761367797852, -9.257292747497559, -7.465824127197266, -5.674355506896973, -3.8828868865966797, -2.0914182662963867, -0.29994964599609375, 1.4915189743041992, 3.282987594604492, 5.074456214904785, 6.865928649902344, 8.657397270202637, 10.44886589050293, 12.240334510803223, 14.031803131103516, 15.823271751403809, 17.6147403717041, 19.406208038330078, 21.197677612304688, 22.989147186279297, 24.780614852905273, 26.57208251953125, 28.36355209350586, 30.15502166748047, 31.946489334106445, 33.73795700073242, 35.52942657470703, 37.32089614868164, 39.11236572265625, 40.903831481933594, 42.6953010559082, 44.48677062988281, 46.278236389160156, 48.069705963134766, 49.861175537109375, 51.652645111083984, 53.444114685058594, 55.23558044433594, 57.02705001831055, 58.818519592285156, 60.6099853515625, 62.40145492553711, 64.19292449951172]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 2.0, 1.0, 3.0, 7.0, 5.0, 4.0, 15.0, 14.0, 7.0, 13.0, 22.0, 20.0, 24.0, 23.0, 31.0, 21.0, 25.0, 32.0, 43.0, 39.0, 53.0, 66.0, 60.0, 74.0, 50.0, 46.0, 44.0, 27.0, 33.0, 28.0, 28.0, 25.0, 22.0, 14.0, 17.0, 14.0, 7.0, 12.0, 10.0, 3.0, 3.0, 1.0, 4.0, 3.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-28.83102798461914, -27.94133186340332, -27.051637649536133, -26.161941528320312, -25.272247314453125, -24.382551193237305, -23.492855072021484, -22.603160858154297, -21.71346664428711, -20.82377052307129, -19.9340763092041, -19.04438018798828, -18.154685974121094, -17.264989852905273, -16.375293731689453, -15.485599517822266, -14.595903396606445, -13.706208229064941, -12.816513061523438, -11.926816940307617, -11.03712272644043, -10.14742660522461, -9.257731437683105, -8.368036270141602, -7.478341102600098, -6.588645935058594, -5.69895076751709, -4.809255123138428, -3.919559955596924, -3.02986478805542, -2.140169143676758, -1.250473976135254, -0.3607769012451172, 0.5289183855056763, 1.4186136722564697, 2.3083090782165527, 3.1980042457580566, 4.0876994132995605, 4.977395057678223, 5.867090225219727, 6.7567853927612305, 7.646480560302734, 8.536175727844238, 9.425870895385742, 10.315567016601562, 11.20526123046875, 12.09495735168457, 12.984652519226074, 13.874347686767578, 14.764042854309082, 15.653738021850586, 16.543434143066406, 17.433128356933594, 18.322824478149414, 19.212520599365234, 20.102214813232422, 20.99190902709961, 21.88160514831543, 22.771299362182617, 23.660995483398438, 24.550689697265625, 25.440385818481445, 26.330081939697266, 27.219776153564453, 28.109472274780273]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 7.0, 2.0, 6.0, 7.0, 16.0, 19.0, 22.0, 37.0, 49.0, 78.0, 117.0, 165.0, 333.0, 574.0, 1045.0, 2231.0, 4852.0, 12791.0, 40292.0, 185214.0, 1712640.0, 1957586.0, 209894.0, 43030.0, 13279.0, 5102.0, 2246.0, 1102.0, 633.0, 312.0, 199.0, 132.0, 81.0, 52.0, 35.0, 25.0, 21.0, 19.0, 10.0, 5.0, 3.0, 8.0, 4.0, 4.0, 4.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.35546875, -3.247344970703125, -3.13922119140625, -3.031097412109375, -2.9229736328125, -2.814849853515625, -2.70672607421875, -2.598602294921875, -2.490478515625, -2.382354736328125, -2.27423095703125, -2.166107177734375, -2.0579833984375, -1.949859619140625, -1.84173583984375, -1.733612060546875, -1.62548828125, -1.517364501953125, -1.40924072265625, -1.301116943359375, -1.1929931640625, -1.084869384765625, -0.97674560546875, -0.868621826171875, -0.760498046875, -0.652374267578125, -0.54425048828125, -0.436126708984375, -0.3280029296875, -0.219879150390625, -0.11175537109375, -0.003631591796875, 0.1044921875, 0.212615966796875, 0.32073974609375, 0.428863525390625, 0.5369873046875, 0.645111083984375, 0.75323486328125, 0.861358642578125, 0.969482421875, 1.077606201171875, 1.18572998046875, 1.293853759765625, 1.4019775390625, 1.510101318359375, 1.61822509765625, 1.726348876953125, 1.83447265625, 1.942596435546875, 2.05072021484375, 2.158843994140625, 2.2669677734375, 2.375091552734375, 2.48321533203125, 2.591339111328125, 2.699462890625, 2.807586669921875, 2.91571044921875, 3.023834228515625, 3.1319580078125, 3.240081787109375, 3.34820556640625, 3.456329345703125, 3.564453125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 4.0, 4.0, 6.0, 8.0, 10.0, 12.0, 17.0, 21.0, 20.0, 23.0, 42.0, 32.0, 43.0, 49.0, 56.0, 50.0, 53.0, 47.0, 69.0, 30.0, 47.0, 56.0, 42.0, 51.0, 37.0, 44.0, 34.0, 22.0, 15.0, 13.0, 11.0, 10.0, 12.0, 3.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4814453125, -1.4198455810546875, -1.358245849609375, -1.2966461181640625, -1.23504638671875, -1.1734466552734375, -1.111846923828125, -1.0502471923828125, -0.9886474609375, -0.9270477294921875, -0.865447998046875, -0.8038482666015625, -0.74224853515625, -0.6806488037109375, -0.619049072265625, -0.5574493408203125, -0.495849609375, -0.4342498779296875, -0.372650146484375, -0.3110504150390625, -0.24945068359375, -0.1878509521484375, -0.126251220703125, -0.0646514892578125, -0.0030517578125, 0.0585479736328125, 0.120147705078125, 0.1817474365234375, 0.24334716796875, 0.3049468994140625, 0.366546630859375, 0.4281463623046875, 0.48974609375, 0.5513458251953125, 0.612945556640625, 0.6745452880859375, 0.73614501953125, 0.7977447509765625, 0.859344482421875, 0.9209442138671875, 0.9825439453125, 1.0441436767578125, 1.105743408203125, 1.1673431396484375, 1.22894287109375, 1.2905426025390625, 1.352142333984375, 1.4137420654296875, 1.475341796875, 1.5369415283203125, 1.598541259765625, 1.6601409912109375, 1.72174072265625, 1.7833404541015625, 1.844940185546875, 1.9065399169921875, 1.9681396484375, 2.0297393798828125, 2.091339111328125, 2.1529388427734375, 2.21453857421875, 2.2761383056640625, 2.337738037109375, 2.3993377685546875, 2.4609375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 3.0, 8.0, 14.0, 16.0, 21.0, 33.0, 50.0, 77.0, 100.0, 147.0, 232.0, 411.0, 763.0, 1479.0, 3068.0, 7125.0, 18957.0, 59206.0, 273443.0, 2470057.0, 1165880.0, 140216.0, 33922.0, 10944.0, 4132.0, 1884.0, 944.0, 471.0, 261.0, 158.0, 94.0, 56.0, 25.0, 29.0, 17.0, 12.0, 7.0, 5.0, 4.0, 1.0, 6.0, 1.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.75, -3.6357421875, -3.521484375, -3.4072265625, -3.29296875, -3.1787109375, -3.064453125, -2.9501953125, -2.8359375, -2.7216796875, -2.607421875, -2.4931640625, -2.37890625, -2.2646484375, -2.150390625, -2.0361328125, -1.921875, -1.8076171875, -1.693359375, -1.5791015625, -1.46484375, -1.3505859375, -1.236328125, -1.1220703125, -1.0078125, -0.8935546875, -0.779296875, -0.6650390625, -0.55078125, -0.4365234375, -0.322265625, -0.2080078125, -0.09375, 0.0205078125, 0.134765625, 0.2490234375, 0.36328125, 0.4775390625, 0.591796875, 0.7060546875, 0.8203125, 0.9345703125, 1.048828125, 1.1630859375, 1.27734375, 1.3916015625, 1.505859375, 1.6201171875, 1.734375, 1.8486328125, 1.962890625, 2.0771484375, 2.19140625, 2.3056640625, 2.419921875, 2.5341796875, 2.6484375, 2.7626953125, 2.876953125, 2.9912109375, 3.10546875, 3.2197265625, 3.333984375, 3.4482421875, 3.5625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 5.0, 7.0, 12.0, 12.0, 17.0, 14.0, 30.0, 29.0, 64.0, 85.0, 125.0, 219.0, 364.0, 620.0, 924.0, 624.0, 354.0, 224.0, 121.0, 79.0, 42.0, 38.0, 17.0, 16.0, 14.0, 7.0, 4.0, 3.0, 1.0, 2.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.01171875, -5.837646484375, -5.66357421875, -5.489501953125, -5.3154296875, -5.141357421875, -4.96728515625, -4.793212890625, -4.619140625, -4.445068359375, -4.27099609375, -4.096923828125, -3.9228515625, -3.748779296875, -3.57470703125, -3.400634765625, -3.2265625, -3.052490234375, -2.87841796875, -2.704345703125, -2.5302734375, -2.356201171875, -2.18212890625, -2.008056640625, -1.833984375, -1.659912109375, -1.48583984375, -1.311767578125, -1.1376953125, -0.963623046875, -0.78955078125, -0.615478515625, -0.44140625, -0.267333984375, -0.09326171875, 0.080810546875, 0.2548828125, 0.428955078125, 0.60302734375, 0.777099609375, 0.951171875, 1.125244140625, 1.29931640625, 1.473388671875, 1.6474609375, 1.821533203125, 1.99560546875, 2.169677734375, 2.34375, 2.517822265625, 2.69189453125, 2.865966796875, 3.0400390625, 3.214111328125, 3.38818359375, 3.562255859375, 3.736328125, 3.910400390625, 4.08447265625, 4.258544921875, 4.4326171875, 4.606689453125, 4.78076171875, 4.954833984375, 5.12890625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 7.0, 3.0, 3.0, 1.0, 6.0, 20.0, 62.0, 183.0, 321.0, 248.0, 89.0, 37.0, 10.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-124.32659912109375, -121.61647033691406, -118.9063491821289, -116.19622802734375, -113.48609924316406, -110.77597045898438, -108.06584930419922, -105.35572814941406, -102.64559936523438, -99.93547058105469, -97.22534942626953, -94.51522827148438, -91.80509948730469, -89.094970703125, -86.38484954833984, -83.67472839355469, -80.964599609375, -78.25447082519531, -75.54434967041016, -72.834228515625, -70.12409973144531, -67.41397094726562, -64.70384979248047, -61.99372482299805, -59.283599853515625, -56.5734748840332, -53.86334991455078, -51.15322494506836, -48.44309997558594, -45.732975006103516, -43.022850036621094, -40.31272506713867, -37.60259246826172, -34.8924674987793, -32.182342529296875, -29.472217559814453, -26.76209259033203, -24.05196762084961, -21.341842651367188, -18.631717681884766, -15.921592712402344, -13.211467742919922, -10.5013427734375, -7.791217803955078, -5.081092834472656, -2.3709678649902344, 0.3391571044921875, 3.0492820739746094, 5.759407043457031, 8.469532012939453, 11.179656982421875, 13.889781951904297, 16.59990692138672, 19.31003189086914, 22.020156860351562, 24.730281829833984, 27.440406799316406, 30.150531768798828, 32.86065673828125, 35.57078170776367, 38.280906677246094, 40.991031646728516, 43.70115661621094, 46.41128158569336, 49.12140655517578]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 3.0, 1.0, 2.0, 7.0, 3.0, 12.0, 17.0, 16.0, 24.0, 23.0, 21.0, 34.0, 42.0, 32.0, 43.0, 39.0, 67.0, 51.0, 52.0, 50.0, 65.0, 65.0, 41.0, 43.0, 47.0, 32.0, 35.0, 26.0, 31.0, 20.0, 15.0, 11.0, 8.0, 9.0, 1.0, 9.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-24.64452362060547, -23.84337615966797, -23.04222869873047, -22.241079330444336, -21.439931869506836, -20.638784408569336, -19.837636947631836, -19.036487579345703, -18.235340118408203, -17.434192657470703, -16.633045196533203, -15.831896781921387, -15.03074836730957, -14.22960090637207, -13.42845344543457, -12.627305030822754, -11.826157569885254, -11.025010108947754, -10.223861694335938, -9.422714233398438, -8.621565818786621, -7.820418357849121, -7.019270420074463, -6.218122482299805, -5.4169745445251465, -4.615826606750488, -3.81467866897583, -3.013530969619751, -2.2123830318450928, -1.4112353324890137, -0.6100873947143555, 0.19106054306030273, 0.9922084808349609, 1.7933564186096191, 2.5945043563842773, 3.3956520557403564, 4.196800231933594, 4.997947692871094, 5.799095630645752, 6.60024356842041, 7.401391506195068, 8.202539443969727, 9.003686904907227, 9.804835319519043, 10.605982780456543, 11.40713119506836, 12.20827865600586, 13.00942611694336, 13.810574531555176, 14.611721992492676, 15.412870407104492, 16.214017868041992, 17.015165328979492, 17.816314697265625, 18.617462158203125, 19.418609619140625, 20.219757080078125, 21.020904541015625, 21.822052001953125, 22.623201370239258, 23.424348831176758, 24.225496292114258, 25.026643753051758, 25.82779312133789, 26.62894058227539]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 8.0, 11.0, 9.0, 18.0, 18.0, 26.0, 33.0, 64.0, 123.0, 182.0, 313.0, 632.0, 1251.0, 2977.0, 7184.0, 19643.0, 59047.0, 190336.0, 431358.0, 227235.0, 70125.0, 23051.0, 8327.0, 3424.0, 1503.0, 745.0, 354.0, 211.0, 103.0, 74.0, 48.0, 37.0, 29.0, 17.0, 11.0, 4.0, 5.0, 5.0, 2.0, 6.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0], "bins": [-5.16796875, -5.022705078125, -4.87744140625, -4.732177734375, -4.5869140625, -4.441650390625, -4.29638671875, -4.151123046875, -4.005859375, -3.860595703125, -3.71533203125, -3.570068359375, -3.4248046875, -3.279541015625, -3.13427734375, -2.989013671875, -2.84375, -2.698486328125, -2.55322265625, -2.407958984375, -2.2626953125, -2.117431640625, -1.97216796875, -1.826904296875, -1.681640625, -1.536376953125, -1.39111328125, -1.245849609375, -1.1005859375, -0.955322265625, -0.81005859375, -0.664794921875, -0.51953125, -0.374267578125, -0.22900390625, -0.083740234375, 0.0615234375, 0.206787109375, 0.35205078125, 0.497314453125, 0.642578125, 0.787841796875, 0.93310546875, 1.078369140625, 1.2236328125, 1.368896484375, 1.51416015625, 1.659423828125, 1.8046875, 1.949951171875, 2.09521484375, 2.240478515625, 2.3857421875, 2.531005859375, 2.67626953125, 2.821533203125, 2.966796875, 3.112060546875, 3.25732421875, 3.402587890625, 3.5478515625, 3.693115234375, 3.83837890625, 3.983642578125, 4.12890625]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 7.0, 4.0, 3.0, 5.0, 9.0, 12.0, 10.0, 20.0, 17.0, 14.0, 25.0, 17.0, 25.0, 24.0, 19.0, 27.0, 31.0, 37.0, 30.0, 41.0, 36.0, 41.0, 25.0, 30.0, 40.0, 41.0, 38.0, 35.0, 27.0, 39.0, 20.0, 28.0, 31.0, 20.0, 13.0, 22.0, 30.0, 17.0, 12.0, 21.0, 10.0, 9.0, 9.0, 7.0, 6.0, 6.0, 6.0, 2.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-1.4228515625, -1.379180908203125, -1.33551025390625, -1.291839599609375, -1.2481689453125, -1.204498291015625, -1.16082763671875, -1.117156982421875, -1.073486328125, -1.029815673828125, -0.98614501953125, -0.942474365234375, -0.8988037109375, -0.855133056640625, -0.81146240234375, -0.767791748046875, -0.72412109375, -0.680450439453125, -0.63677978515625, -0.593109130859375, -0.5494384765625, -0.505767822265625, -0.46209716796875, -0.418426513671875, -0.374755859375, -0.331085205078125, -0.28741455078125, -0.243743896484375, -0.2000732421875, -0.156402587890625, -0.11273193359375, -0.069061279296875, -0.025390625, 0.018280029296875, 0.06195068359375, 0.105621337890625, 0.1492919921875, 0.192962646484375, 0.23663330078125, 0.280303955078125, 0.323974609375, 0.367645263671875, 0.41131591796875, 0.454986572265625, 0.4986572265625, 0.542327880859375, 0.58599853515625, 0.629669189453125, 0.67333984375, 0.717010498046875, 0.76068115234375, 0.804351806640625, 0.8480224609375, 0.891693115234375, 0.93536376953125, 0.979034423828125, 1.022705078125, 1.066375732421875, 1.11004638671875, 1.153717041015625, 1.1973876953125, 1.241058349609375, 1.28472900390625, 1.328399658203125, 1.3720703125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 1.0, 1.0, 4.0, 6.0, 5.0, 11.0, 21.0, 20.0, 36.0, 54.0, 78.0, 89.0, 140.0, 198.0, 294.0, 439.0, 784.0, 1442.0, 3168.0, 9715.0, 45841.0, 358641.0, 555585.0, 53688.0, 10896.0, 3524.0, 1513.0, 810.0, 492.0, 322.0, 198.0, 143.0, 104.0, 81.0, 65.0, 50.0, 26.0, 19.0, 14.0, 8.0, 9.0, 9.0, 6.0, 7.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-8.1640625, -7.92425537109375, -7.6844482421875, -7.44464111328125, -7.204833984375, -6.96502685546875, -6.7252197265625, -6.48541259765625, -6.24560546875, -6.00579833984375, -5.7659912109375, -5.52618408203125, -5.286376953125, -5.04656982421875, -4.8067626953125, -4.56695556640625, -4.3271484375, -4.08734130859375, -3.8475341796875, -3.60772705078125, -3.367919921875, -3.12811279296875, -2.8883056640625, -2.64849853515625, -2.40869140625, -2.16888427734375, -1.9290771484375, -1.68927001953125, -1.449462890625, -1.20965576171875, -0.9698486328125, -0.73004150390625, -0.490234375, -0.25042724609375, -0.0106201171875, 0.22918701171875, 0.468994140625, 0.70880126953125, 0.9486083984375, 1.18841552734375, 1.42822265625, 1.66802978515625, 1.9078369140625, 2.14764404296875, 2.387451171875, 2.62725830078125, 2.8670654296875, 3.10687255859375, 3.3466796875, 3.58648681640625, 3.8262939453125, 4.06610107421875, 4.305908203125, 4.54571533203125, 4.7855224609375, 5.02532958984375, 5.26513671875, 5.50494384765625, 5.7447509765625, 5.98455810546875, 6.224365234375, 6.46417236328125, 6.7039794921875, 6.94378662109375, 7.18359375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 5.0, 8.0, 4.0, 7.0, 6.0, 14.0, 9.0, 17.0, 21.0, 33.0, 32.0, 40.0, 44.0, 52.0, 58.0, 49.0, 54.0, 61.0, 62.0, 53.0, 45.0, 52.0, 52.0, 31.0, 33.0, 25.0, 28.0, 28.0, 18.0, 14.0, 7.0, 10.0, 10.0, 3.0, 8.0, 7.0, 2.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.78125, -8.5234375, -8.265625, -8.0078125, -7.75, -7.4921875, -7.234375, -6.9765625, -6.71875, -6.4609375, -6.203125, -5.9453125, -5.6875, -5.4296875, -5.171875, -4.9140625, -4.65625, -4.3984375, -4.140625, -3.8828125, -3.625, -3.3671875, -3.109375, -2.8515625, -2.59375, -2.3359375, -2.078125, -1.8203125, -1.5625, -1.3046875, -1.046875, -0.7890625, -0.53125, -0.2734375, -0.015625, 0.2421875, 0.5, 0.7578125, 1.015625, 1.2734375, 1.53125, 1.7890625, 2.046875, 2.3046875, 2.5625, 2.8203125, 3.078125, 3.3359375, 3.59375, 3.8515625, 4.109375, 4.3671875, 4.625, 4.8828125, 5.140625, 5.3984375, 5.65625, 5.9140625, 6.171875, 6.4296875, 6.6875, 6.9453125, 7.203125, 7.4609375, 7.71875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 6.0, 1.0, 4.0, 8.0, 9.0, 4.0, 11.0, 11.0, 24.0, 31.0, 44.0, 53.0, 76.0, 124.0, 213.0, 431.0, 1177.0, 4651.0, 30389.0, 527776.0, 446681.0, 30108.0, 4520.0, 1185.0, 477.0, 205.0, 121.0, 57.0, 46.0, 24.0, 15.0, 23.0, 12.0, 12.0, 5.0, 9.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.0859375, -2.983062744140625, -2.88018798828125, -2.777313232421875, -2.6744384765625, -2.571563720703125, -2.46868896484375, -2.365814208984375, -2.262939453125, -2.160064697265625, -2.05718994140625, -1.954315185546875, -1.8514404296875, -1.748565673828125, -1.64569091796875, -1.542816162109375, -1.43994140625, -1.337066650390625, -1.23419189453125, -1.131317138671875, -1.0284423828125, -0.925567626953125, -0.82269287109375, -0.719818115234375, -0.616943359375, -0.514068603515625, -0.41119384765625, -0.308319091796875, -0.2054443359375, -0.102569580078125, 0.00030517578125, 0.103179931640625, 0.2060546875, 0.308929443359375, 0.41180419921875, 0.514678955078125, 0.6175537109375, 0.720428466796875, 0.82330322265625, 0.926177978515625, 1.029052734375, 1.131927490234375, 1.23480224609375, 1.337677001953125, 1.4405517578125, 1.543426513671875, 1.64630126953125, 1.749176025390625, 1.85205078125, 1.954925537109375, 2.05780029296875, 2.160675048828125, 2.2635498046875, 2.366424560546875, 2.46929931640625, 2.572174072265625, 2.675048828125, 2.777923583984375, 2.88079833984375, 2.983673095703125, 3.0865478515625, 3.189422607421875, 3.29229736328125, 3.395172119140625, 3.498046875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 4.0, 5.0, 5.0, 2.0, 7.0, 6.0, 8.0, 15.0, 8.0, 14.0, 18.0, 23.0, 27.0, 47.0, 70.0, 89.0, 127.0, 122.0, 96.0, 81.0, 49.0, 40.0, 34.0, 28.0, 17.0, 10.0, 12.0, 5.0, 7.0, 6.0, 4.0, 8.0, 2.0, 6.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.0006747245788574219, -0.0006574690341949463, -0.0006402134895324707, -0.0006229579448699951, -0.0006057024002075195, -0.0005884468555450439, -0.0005711913108825684, -0.0005539357662200928, -0.0005366802215576172, -0.0005194246768951416, -0.000502169132232666, -0.00048491358757019043, -0.00046765804290771484, -0.00045040249824523926, -0.00043314695358276367, -0.0004158914089202881, -0.0003986358642578125, -0.0003813803195953369, -0.00036412477493286133, -0.00034686923027038574, -0.00032961368560791016, -0.00031235814094543457, -0.000295102596282959, -0.0002778470516204834, -0.0002605915069580078, -0.00024333596229553223, -0.00022608041763305664, -0.00020882487297058105, -0.00019156932830810547, -0.00017431378364562988, -0.0001570582389831543, -0.0001398026943206787, -0.00012254714965820312, -0.00010529160499572754, -8.803606033325195e-05, -7.078051567077637e-05, -5.352497100830078e-05, -3.6269426345825195e-05, -1.901388168334961e-05, -1.7583370208740234e-06, 1.5497207641601562e-05, 3.275275230407715e-05, 5.0008296966552734e-05, 6.726384162902832e-05, 8.45193862915039e-05, 0.00010177493095397949, 0.00011903047561645508, 0.00013628602027893066, 0.00015354156494140625, 0.00017079710960388184, 0.00018805265426635742, 0.000205308198928833, 0.0002225637435913086, 0.00023981928825378418, 0.00025707483291625977, 0.00027433037757873535, 0.00029158592224121094, 0.0003088414669036865, 0.0003260970115661621, 0.0003433525562286377, 0.0003606081008911133, 0.00037786364555358887, 0.00039511919021606445, 0.00041237473487854004, 0.0004296302795410156]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 6.0, 8.0, 11.0, 20.0, 21.0, 28.0, 47.0, 88.0, 107.0, 186.0, 370.0, 559.0, 1186.0, 2757.0, 8723.0, 39558.0, 306725.0, 610881.0, 59319.0, 11509.0, 3440.0, 1335.0, 695.0, 351.0, 209.0, 127.0, 84.0, 61.0, 44.0, 28.0, 14.0, 17.0, 11.0, 11.0, 5.0, 4.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3125, -2.233062744140625, -2.15362548828125, -2.074188232421875, -1.9947509765625, -1.915313720703125, -1.83587646484375, -1.756439208984375, -1.677001953125, -1.597564697265625, -1.51812744140625, -1.438690185546875, -1.3592529296875, -1.279815673828125, -1.20037841796875, -1.120941162109375, -1.04150390625, -0.962066650390625, -0.88262939453125, -0.803192138671875, -0.7237548828125, -0.644317626953125, -0.56488037109375, -0.485443115234375, -0.406005859375, -0.326568603515625, -0.24713134765625, -0.167694091796875, -0.0882568359375, -0.008819580078125, 0.07061767578125, 0.150054931640625, 0.2294921875, 0.308929443359375, 0.38836669921875, 0.467803955078125, 0.5472412109375, 0.626678466796875, 0.70611572265625, 0.785552978515625, 0.864990234375, 0.944427490234375, 1.02386474609375, 1.103302001953125, 1.1827392578125, 1.262176513671875, 1.34161376953125, 1.421051025390625, 1.50048828125, 1.579925537109375, 1.65936279296875, 1.738800048828125, 1.8182373046875, 1.897674560546875, 1.97711181640625, 2.056549072265625, 2.135986328125, 2.215423583984375, 2.29486083984375, 2.374298095703125, 2.4537353515625, 2.533172607421875, 2.61260986328125, 2.692047119140625, 2.771484375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 7.0, 4.0, 6.0, 6.0, 17.0, 17.0, 16.0, 18.0, 31.0, 36.0, 43.0, 53.0, 68.0, 98.0, 91.0, 91.0, 92.0, 68.0, 43.0, 45.0, 27.0, 29.0, 28.0, 10.0, 11.0, 6.0, 4.0, 8.0, 4.0, 5.0, 2.0, 1.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8349609375, -1.7672576904296875, -1.699554443359375, -1.6318511962890625, -1.56414794921875, -1.4964447021484375, -1.428741455078125, -1.3610382080078125, -1.2933349609375, -1.2256317138671875, -1.157928466796875, -1.0902252197265625, -1.02252197265625, -0.9548187255859375, -0.887115478515625, -0.8194122314453125, -0.751708984375, -0.6840057373046875, -0.616302490234375, -0.5485992431640625, -0.48089599609375, -0.4131927490234375, -0.345489501953125, -0.2777862548828125, -0.2100830078125, -0.1423797607421875, -0.074676513671875, -0.0069732666015625, 0.06072998046875, 0.1284332275390625, 0.196136474609375, 0.2638397216796875, 0.33154296875, 0.3992462158203125, 0.466949462890625, 0.5346527099609375, 0.60235595703125, 0.6700592041015625, 0.737762451171875, 0.8054656982421875, 0.8731689453125, 0.9408721923828125, 1.008575439453125, 1.0762786865234375, 1.14398193359375, 1.2116851806640625, 1.279388427734375, 1.3470916748046875, 1.414794921875, 1.4824981689453125, 1.550201416015625, 1.6179046630859375, 1.68560791015625, 1.7533111572265625, 1.821014404296875, 1.8887176513671875, 1.9564208984375, 2.0241241455078125, 2.091827392578125, 2.1595306396484375, 2.22723388671875, 2.2949371337890625, 2.362640380859375, 2.4303436279296875, 2.498046875]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 9.0, 5.0, 11.0, 17.0, 44.0, 65.0, 101.0, 227.0, 283.0, 118.0, 55.0, 30.0, 12.0, 5.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-78.0013198852539, -76.14591217041016, -74.2905044555664, -72.43509674072266, -70.5796890258789, -68.72428131103516, -66.86888122558594, -65.01347351074219, -63.15806198120117, -61.30265426635742, -59.44724655151367, -57.59184265136719, -55.73643493652344, -53.88102722167969, -52.02561950683594, -50.17021179199219, -48.31480407714844, -46.45939636230469, -44.60398864746094, -42.74858093261719, -40.8931770324707, -39.03776931762695, -37.1823616027832, -35.32695388793945, -33.47154998779297, -31.61614227294922, -29.7607364654541, -27.90532875061035, -26.0499210357666, -24.194515228271484, -22.339107513427734, -20.483699798583984, -18.628292083740234, -16.772884368896484, -14.91747760772705, -13.062070846557617, -11.206663131713867, -9.351256370544434, -7.495849609375, -5.64044189453125, -3.7850351333618164, -1.9296280145645142, -0.07422089576721191, 1.7811861038208008, 3.6365933418273926, 5.492000579833984, 7.347407341003418, 9.202815055847168, 11.058221817016602, 12.913628578186035, 14.769036293029785, 16.62444305419922, 18.47985076904297, 20.33525848388672, 22.190664291381836, 24.046072006225586, 25.901477813720703, 27.756885528564453, 29.61229133605957, 31.46769905090332, 33.32310485839844, 35.17851257324219, 37.03392028808594, 38.88932800292969, 40.74473571777344]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 8.0, 7.0, 6.0, 9.0, 13.0, 13.0, 12.0, 12.0, 17.0, 25.0, 23.0, 21.0, 31.0, 24.0, 18.0, 47.0, 38.0, 39.0, 39.0, 81.0, 64.0, 65.0, 50.0, 46.0, 39.0, 39.0, 19.0, 24.0, 28.0, 15.0, 20.0, 19.0, 21.0, 9.0, 12.0, 7.0, 10.0, 5.0, 5.0, 6.0, 1.0, 5.0, 5.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-26.624732971191406, -25.820785522460938, -25.016836166381836, -24.212888717651367, -23.4089412689209, -22.604991912841797, -21.801044464111328, -20.99709701538086, -20.19314956665039, -19.389202117919922, -18.58525276184082, -17.78130531311035, -16.977357864379883, -16.17340850830078, -15.369461059570312, -14.565513610839844, -13.761565208435059, -12.957616806030273, -12.153669357299805, -11.34972095489502, -10.54577350616455, -9.741825103759766, -8.937877655029297, -8.133929252624512, -7.329981327056885, -6.526033401489258, -5.722085475921631, -4.918137550354004, -4.114189147949219, -3.310241222381592, -2.506293296813965, -1.702345371246338, -0.8983974456787109, -0.09444946050643921, 0.7094985246658325, 1.513446569442749, 2.317394495010376, 3.121342658996582, 3.925290584564209, 4.729238510131836, 5.533186435699463, 6.33713436126709, 7.141082286834717, 7.945030212402344, 8.748978614807129, 9.552927017211914, 10.356874465942383, 11.160821914672852, 11.964770317077637, 12.768718719482422, 13.57266616821289, 14.376614570617676, 15.180562019348145, 15.98451042175293, 16.7884578704834, 17.5924072265625, 18.39635467529297, 19.200302124023438, 20.00425148010254, 20.808198928833008, 21.612146377563477, 22.416095733642578, 23.220043182373047, 24.023990631103516, 24.827938079833984]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 5.0, 3.0, 12.0, 23.0, 30.0, 53.0, 92.0, 140.0, 268.0, 543.0, 1430.0, 5253.0, 29631.0, 556212.0, 3441864.0, 139703.0, 14115.0, 3017.0, 974.0, 404.0, 203.0, 124.0, 92.0, 40.0, 17.0, 9.0, 13.0, 3.0, 10.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1171875, -4.9483642578125, -4.779541015625, -4.6107177734375, -4.44189453125, -4.2730712890625, -4.104248046875, -3.9354248046875, -3.7666015625, -3.5977783203125, -3.428955078125, -3.2601318359375, -3.09130859375, -2.9224853515625, -2.753662109375, -2.5848388671875, -2.416015625, -2.2471923828125, -2.078369140625, -1.9095458984375, -1.74072265625, -1.5718994140625, -1.403076171875, -1.2342529296875, -1.0654296875, -0.8966064453125, -0.727783203125, -0.5589599609375, -0.39013671875, -0.2213134765625, -0.052490234375, 0.1163330078125, 0.28515625, 0.4539794921875, 0.622802734375, 0.7916259765625, 0.96044921875, 1.1292724609375, 1.298095703125, 1.4669189453125, 1.6357421875, 1.8045654296875, 1.973388671875, 2.1422119140625, 2.31103515625, 2.4798583984375, 2.648681640625, 2.8175048828125, 2.986328125, 3.1551513671875, 3.323974609375, 3.4927978515625, 3.66162109375, 3.8304443359375, 3.999267578125, 4.1680908203125, 4.3369140625, 4.5057373046875, 4.674560546875, 4.8433837890625, 5.01220703125, 5.1810302734375, 5.349853515625, 5.5186767578125, 5.6875]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 10.0, 4.0, 12.0, 16.0, 27.0, 33.0, 28.0, 50.0, 48.0, 54.0, 63.0, 78.0, 66.0, 86.0, 72.0, 59.0, 79.0, 57.0, 40.0, 38.0, 31.0, 21.0, 13.0, 15.0, 2.0, 3.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.390625, -2.305450439453125, -2.22027587890625, -2.135101318359375, -2.0499267578125, -1.964752197265625, -1.87957763671875, -1.794403076171875, -1.709228515625, -1.624053955078125, -1.53887939453125, -1.453704833984375, -1.3685302734375, -1.283355712890625, -1.19818115234375, -1.113006591796875, -1.02783203125, -0.942657470703125, -0.85748291015625, -0.772308349609375, -0.6871337890625, -0.601959228515625, -0.51678466796875, -0.431610107421875, -0.346435546875, -0.261260986328125, -0.17608642578125, -0.090911865234375, -0.0057373046875, 0.079437255859375, 0.16461181640625, 0.249786376953125, 0.3349609375, 0.420135498046875, 0.50531005859375, 0.590484619140625, 0.6756591796875, 0.760833740234375, 0.84600830078125, 0.931182861328125, 1.016357421875, 1.101531982421875, 1.18670654296875, 1.271881103515625, 1.3570556640625, 1.442230224609375, 1.52740478515625, 1.612579345703125, 1.69775390625, 1.782928466796875, 1.86810302734375, 1.953277587890625, 2.0384521484375, 2.123626708984375, 2.20880126953125, 2.293975830078125, 2.379150390625, 2.464324951171875, 2.54949951171875, 2.634674072265625, 2.7198486328125, 2.805023193359375, 2.89019775390625, 2.975372314453125, 3.060546875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 5.0, 4.0, 5.0, 10.0, 12.0, 23.0, 25.0, 36.0, 38.0, 67.0, 110.0, 172.0, 268.0, 462.0, 881.0, 1897.0, 4366.0, 12549.0, 45588.0, 276404.0, 3062252.0, 682788.0, 75779.0, 18859.0, 6211.0, 2622.0, 1215.0, 626.0, 372.0, 202.0, 139.0, 95.0, 56.0, 39.0, 22.0, 28.0, 14.0, 12.0, 9.0, 6.0, 6.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.6796875, -3.5596923828125, -3.439697265625, -3.3197021484375, -3.19970703125, -3.0797119140625, -2.959716796875, -2.8397216796875, -2.7197265625, -2.5997314453125, -2.479736328125, -2.3597412109375, -2.23974609375, -2.1197509765625, -1.999755859375, -1.8797607421875, -1.759765625, -1.6397705078125, -1.519775390625, -1.3997802734375, -1.27978515625, -1.1597900390625, -1.039794921875, -0.9197998046875, -0.7998046875, -0.6798095703125, -0.559814453125, -0.4398193359375, -0.31982421875, -0.1998291015625, -0.079833984375, 0.0401611328125, 0.16015625, 0.2801513671875, 0.400146484375, 0.5201416015625, 0.64013671875, 0.7601318359375, 0.880126953125, 1.0001220703125, 1.1201171875, 1.2401123046875, 1.360107421875, 1.4801025390625, 1.60009765625, 1.7200927734375, 1.840087890625, 1.9600830078125, 2.080078125, 2.2000732421875, 2.320068359375, 2.4400634765625, 2.56005859375, 2.6800537109375, 2.800048828125, 2.9200439453125, 3.0400390625, 3.1600341796875, 3.280029296875, 3.4000244140625, 3.52001953125, 3.6400146484375, 3.760009765625, 3.8800048828125, 4.0]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 7.0, 3.0, 4.0, 2.0, 15.0, 9.0, 15.0, 16.0, 28.0, 24.0, 47.0, 60.0, 85.0, 122.0, 208.0, 303.0, 469.0, 632.0, 615.0, 490.0, 314.0, 200.0, 102.0, 80.0, 53.0, 39.0, 33.0, 28.0, 18.0, 8.0, 8.0, 10.0, 6.0, 6.0, 3.0, 4.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.333984375, -3.218597412109375, -3.10321044921875, -2.987823486328125, -2.8724365234375, -2.757049560546875, -2.64166259765625, -2.526275634765625, -2.410888671875, -2.295501708984375, -2.18011474609375, -2.064727783203125, -1.9493408203125, -1.833953857421875, -1.71856689453125, -1.603179931640625, -1.48779296875, -1.372406005859375, -1.25701904296875, -1.141632080078125, -1.0262451171875, -0.910858154296875, -0.79547119140625, -0.680084228515625, -0.564697265625, -0.449310302734375, -0.33392333984375, -0.218536376953125, -0.1031494140625, 0.012237548828125, 0.12762451171875, 0.243011474609375, 0.3583984375, 0.473785400390625, 0.58917236328125, 0.704559326171875, 0.8199462890625, 0.935333251953125, 1.05072021484375, 1.166107177734375, 1.281494140625, 1.396881103515625, 1.51226806640625, 1.627655029296875, 1.7430419921875, 1.858428955078125, 1.97381591796875, 2.089202880859375, 2.20458984375, 2.319976806640625, 2.43536376953125, 2.550750732421875, 2.6661376953125, 2.781524658203125, 2.89691162109375, 3.012298583984375, 3.127685546875, 3.243072509765625, 3.35845947265625, 3.473846435546875, 3.5892333984375, 3.704620361328125, 3.82000732421875, 3.935394287109375, 4.05078125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 3.0, 4.0, 15.0, 30.0, 88.0, 186.0, 287.0, 232.0, 97.0, 31.0, 14.0, 5.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-84.01828002929688, -81.99960327148438, -79.98092651367188, -77.9622573852539, -75.9435806274414, -73.9249038696289, -71.90623474121094, -69.88755798339844, -67.86888122558594, -65.85020446777344, -63.8315315246582, -61.81285858154297, -59.79418182373047, -57.77550506591797, -55.756832122802734, -53.7381591796875, -51.719482421875, -49.7008056640625, -47.682132720947266, -45.66345977783203, -43.64478302001953, -41.62610626220703, -39.6074333190918, -37.58876037597656, -35.57008361816406, -33.55140686035156, -31.532733917236328, -29.51405906677246, -27.495384216308594, -25.476709365844727, -23.45803451538086, -21.439359664916992, -19.420677185058594, -17.402002334594727, -15.38332748413086, -13.364652633666992, -11.345977783203125, -9.327302932739258, -7.308628082275391, -5.289953231811523, -3.2712783813476562, -1.252603530883789, 0.7660713195800781, 2.7847461700439453, 4.8034210205078125, 6.82209587097168, 8.840770721435547, 10.859445571899414, 12.878120422363281, 14.896795272827148, 16.915470123291016, 18.934144973754883, 20.95281982421875, 22.971494674682617, 24.990169525146484, 27.00884437561035, 29.02751922607422, 31.046194076538086, 33.06486892700195, 35.08354187011719, 37.10221862792969, 39.12089538574219, 41.13956832885742, 43.158241271972656, 45.176918029785156]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 2.0, 1.0, 3.0, 4.0, 7.0, 12.0, 9.0, 11.0, 11.0, 27.0, 17.0, 27.0, 24.0, 28.0, 26.0, 36.0, 38.0, 47.0, 57.0, 51.0, 45.0, 54.0, 58.0, 52.0, 45.0, 29.0, 43.0, 28.0, 25.0, 27.0, 34.0, 22.0, 34.0, 12.0, 14.0, 7.0, 7.0, 5.0, 8.0, 4.0, 1.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-18.831260681152344, -18.28981590270996, -17.748371124267578, -17.206928253173828, -16.665483474731445, -16.124038696289062, -15.58259391784668, -15.041149139404297, -14.49970531463623, -13.958260536193848, -13.416816711425781, -12.875371932983398, -12.333927154541016, -11.79248332977295, -11.251038551330566, -10.7095947265625, -10.168149948120117, -9.626705169677734, -9.085261344909668, -8.543816566467285, -8.002372741699219, -7.460927963256836, -6.919483184814453, -6.3780388832092285, -5.836594581604004, -5.295150279998779, -4.753705978393555, -4.212261199951172, -3.6708168983459473, -3.1293725967407227, -2.587928056716919, -2.0464835166931152, -1.5050392150878906, -0.9635947942733765, -0.4221503734588623, 0.11929404735565186, 0.660738468170166, 1.2021827697753906, 1.7436273097991943, 2.285071849822998, 2.8265161514282227, 3.3679604530334473, 3.909404993057251, 4.450849533081055, 4.992293834686279, 5.533738136291504, 6.075182914733887, 6.616627216339111, 7.158071517944336, 7.6995158195495605, 8.240960121154785, 8.782404899597168, 9.323848724365234, 9.865293502807617, 10.40673828125, 10.948183059692383, 11.48962688446045, 12.031071662902832, 12.572515487670898, 13.113960266113281, 13.655405044555664, 14.19684886932373, 14.738293647766113, 15.27973747253418, 15.821182250976562]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 7.0, 11.0, 7.0, 7.0, 17.0, 32.0, 26.0, 67.0, 93.0, 216.0, 470.0, 1302.0, 4446.0, 21257.0, 153886.0, 623986.0, 206853.0, 27709.0, 5602.0, 1493.0, 524.0, 276.0, 110.0, 66.0, 31.0, 23.0, 8.0, 7.0, 8.0, 4.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.7890625, -6.58062744140625, -6.3721923828125, -6.16375732421875, -5.955322265625, -5.74688720703125, -5.5384521484375, -5.33001708984375, -5.12158203125, -4.91314697265625, -4.7047119140625, -4.49627685546875, -4.287841796875, -4.07940673828125, -3.8709716796875, -3.66253662109375, -3.4541015625, -3.24566650390625, -3.0372314453125, -2.82879638671875, -2.620361328125, -2.41192626953125, -2.2034912109375, -1.99505615234375, -1.78662109375, -1.57818603515625, -1.3697509765625, -1.16131591796875, -0.952880859375, -0.74444580078125, -0.5360107421875, -0.32757568359375, -0.119140625, 0.08929443359375, 0.2977294921875, 0.50616455078125, 0.714599609375, 0.92303466796875, 1.1314697265625, 1.33990478515625, 1.54833984375, 1.75677490234375, 1.9652099609375, 2.17364501953125, 2.382080078125, 2.59051513671875, 2.7989501953125, 3.00738525390625, 3.2158203125, 3.42425537109375, 3.6326904296875, 3.84112548828125, 4.049560546875, 4.25799560546875, 4.4664306640625, 4.67486572265625, 4.88330078125, 5.09173583984375, 5.3001708984375, 5.50860595703125, 5.717041015625, 5.92547607421875, 6.1339111328125, 6.34234619140625, 6.55078125]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 7.0, 10.0, 9.0, 20.0, 26.0, 29.0, 32.0, 39.0, 40.0, 51.0, 77.0, 52.0, 66.0, 75.0, 73.0, 51.0, 78.0, 56.0, 57.0, 41.0, 32.0, 22.0, 23.0, 18.0, 8.0, 7.0, 3.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.388671875, -2.307891845703125, -2.22711181640625, -2.146331787109375, -2.0655517578125, -1.984771728515625, -1.90399169921875, -1.823211669921875, -1.742431640625, -1.661651611328125, -1.58087158203125, -1.500091552734375, -1.4193115234375, -1.338531494140625, -1.25775146484375, -1.176971435546875, -1.09619140625, -1.015411376953125, -0.93463134765625, -0.853851318359375, -0.7730712890625, -0.692291259765625, -0.61151123046875, -0.530731201171875, -0.449951171875, -0.369171142578125, -0.28839111328125, -0.207611083984375, -0.1268310546875, -0.046051025390625, 0.03472900390625, 0.115509033203125, 0.1962890625, 0.277069091796875, 0.35784912109375, 0.438629150390625, 0.5194091796875, 0.600189208984375, 0.68096923828125, 0.761749267578125, 0.842529296875, 0.923309326171875, 1.00408935546875, 1.084869384765625, 1.1656494140625, 1.246429443359375, 1.32720947265625, 1.407989501953125, 1.48876953125, 1.569549560546875, 1.65032958984375, 1.731109619140625, 1.8118896484375, 1.892669677734375, 1.97344970703125, 2.054229736328125, 2.135009765625, 2.215789794921875, 2.29656982421875, 2.377349853515625, 2.4581298828125, 2.538909912109375, 2.61968994140625, 2.700469970703125, 2.78125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 2.0, 2.0, 4.0, 4.0, 7.0, 10.0, 11.0, 10.0, 27.0, 26.0, 34.0, 55.0, 63.0, 97.0, 182.0, 358.0, 731.0, 1985.0, 6330.0, 24972.0, 131703.0, 642252.0, 192039.0, 34884.0, 8292.0, 2536.0, 941.0, 430.0, 193.0, 128.0, 70.0, 51.0, 42.0, 26.0, 19.0, 13.0, 4.0, 5.0, 7.0, 4.0, 3.0, 0.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.87890625, -5.71380615234375, -5.5487060546875, -5.38360595703125, -5.218505859375, -5.05340576171875, -4.8883056640625, -4.72320556640625, -4.55810546875, -4.39300537109375, -4.2279052734375, -4.06280517578125, -3.897705078125, -3.73260498046875, -3.5675048828125, -3.40240478515625, -3.2373046875, -3.07220458984375, -2.9071044921875, -2.74200439453125, -2.576904296875, -2.41180419921875, -2.2467041015625, -2.08160400390625, -1.91650390625, -1.75140380859375, -1.5863037109375, -1.42120361328125, -1.256103515625, -1.09100341796875, -0.9259033203125, -0.76080322265625, -0.595703125, -0.43060302734375, -0.2655029296875, -0.10040283203125, 0.064697265625, 0.22979736328125, 0.3948974609375, 0.55999755859375, 0.72509765625, 0.89019775390625, 1.0552978515625, 1.22039794921875, 1.385498046875, 1.55059814453125, 1.7156982421875, 1.88079833984375, 2.0458984375, 2.21099853515625, 2.3760986328125, 2.54119873046875, 2.706298828125, 2.87139892578125, 3.0364990234375, 3.20159912109375, 3.36669921875, 3.53179931640625, 3.6968994140625, 3.86199951171875, 4.027099609375, 4.19219970703125, 4.3572998046875, 4.52239990234375, 4.6875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 6.0, 6.0, 4.0, 7.0, 9.0, 6.0, 12.0, 11.0, 16.0, 18.0, 31.0, 28.0, 25.0, 29.0, 29.0, 27.0, 40.0, 35.0, 44.0, 53.0, 46.0, 54.0, 41.0, 47.0, 47.0, 42.0, 48.0, 39.0, 27.0, 30.0, 25.0, 13.0, 19.0, 19.0, 10.0, 11.0, 8.0, 12.0, 7.0, 9.0, 7.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.3359375, -5.1470947265625, -4.958251953125, -4.7694091796875, -4.58056640625, -4.3917236328125, -4.202880859375, -4.0140380859375, -3.8251953125, -3.6363525390625, -3.447509765625, -3.2586669921875, -3.06982421875, -2.8809814453125, -2.692138671875, -2.5032958984375, -2.314453125, -2.1256103515625, -1.936767578125, -1.7479248046875, -1.55908203125, -1.3702392578125, -1.181396484375, -0.9925537109375, -0.8037109375, -0.6148681640625, -0.426025390625, -0.2371826171875, -0.04833984375, 0.1405029296875, 0.329345703125, 0.5181884765625, 0.70703125, 0.8958740234375, 1.084716796875, 1.2735595703125, 1.46240234375, 1.6512451171875, 1.840087890625, 2.0289306640625, 2.2177734375, 2.4066162109375, 2.595458984375, 2.7843017578125, 2.97314453125, 3.1619873046875, 3.350830078125, 3.5396728515625, 3.728515625, 3.9173583984375, 4.106201171875, 4.2950439453125, 4.48388671875, 4.6727294921875, 4.861572265625, 5.0504150390625, 5.2392578125, 5.4281005859375, 5.616943359375, 5.8057861328125, 5.99462890625, 6.1834716796875, 6.372314453125, 6.5611572265625, 6.75]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 6.0, 5.0, 7.0, 3.0, 11.0, 20.0, 23.0, 47.0, 60.0, 108.0, 184.0, 356.0, 835.0, 1962.0, 5480.0, 17747.0, 70488.0, 328269.0, 515970.0, 78053.0, 19266.0, 5893.0, 2099.0, 817.0, 358.0, 195.0, 104.0, 66.0, 31.0, 23.0, 24.0, 20.0, 13.0, 8.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3662109375, -1.3235626220703125, -1.280914306640625, -1.2382659912109375, -1.19561767578125, -1.1529693603515625, -1.110321044921875, -1.0676727294921875, -1.0250244140625, -0.9823760986328125, -0.939727783203125, -0.8970794677734375, -0.85443115234375, -0.8117828369140625, -0.769134521484375, -0.7264862060546875, -0.683837890625, -0.6411895751953125, -0.598541259765625, -0.5558929443359375, -0.51324462890625, -0.4705963134765625, -0.427947998046875, -0.3852996826171875, -0.3426513671875, -0.3000030517578125, -0.257354736328125, -0.2147064208984375, -0.17205810546875, -0.1294097900390625, -0.086761474609375, -0.0441131591796875, -0.00146484375, 0.0411834716796875, 0.083831787109375, 0.1264801025390625, 0.16912841796875, 0.2117767333984375, 0.254425048828125, 0.2970733642578125, 0.3397216796875, 0.3823699951171875, 0.425018310546875, 0.4676666259765625, 0.51031494140625, 0.5529632568359375, 0.595611572265625, 0.6382598876953125, 0.680908203125, 0.7235565185546875, 0.766204833984375, 0.8088531494140625, 0.85150146484375, 0.8941497802734375, 0.936798095703125, 0.9794464111328125, 1.0220947265625, 1.0647430419921875, 1.107391357421875, 1.1500396728515625, 1.19268798828125, 1.2353363037109375, 1.277984619140625, 1.3206329345703125, 1.36328125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 5.0, 1.0, 2.0, 4.0, 4.0, 6.0, 7.0, 6.0, 7.0, 10.0, 15.0, 23.0, 31.0, 46.0, 58.0, 72.0, 98.0, 114.0, 104.0, 99.0, 72.0, 62.0, 47.0, 27.0, 14.0, 15.0, 14.0, 7.0, 8.0, 6.0, 6.0, 2.0, 1.0, 2.0, 2.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00037384033203125, -0.0003628581762313843, -0.00035187602043151855, -0.00034089386463165283, -0.0003299117088317871, -0.0003189295530319214, -0.00030794739723205566, -0.00029696524143218994, -0.0002859830856323242, -0.0002750009298324585, -0.0002640187740325928, -0.00025303661823272705, -0.00024205446243286133, -0.0002310723066329956, -0.00022009015083312988, -0.00020910799503326416, -0.00019812583923339844, -0.00018714368343353271, -0.000176161527633667, -0.00016517937183380127, -0.00015419721603393555, -0.00014321506023406982, -0.0001322329044342041, -0.00012125074863433838, -0.00011026859283447266, -9.928643703460693e-05, -8.830428123474121e-05, -7.732212543487549e-05, -6.633996963500977e-05, -5.535781383514404e-05, -4.437565803527832e-05, -3.33935022354126e-05, -2.2411346435546875e-05, -1.1429190635681152e-05, -4.470348358154297e-07, 1.0535120964050293e-05, 2.1517276763916016e-05, 3.249943256378174e-05, 4.348158836364746e-05, 5.4463744163513184e-05, 6.54458999633789e-05, 7.642805576324463e-05, 8.741021156311035e-05, 9.839236736297607e-05, 0.0001093745231628418, 0.00012035667896270752, 0.00013133883476257324, 0.00014232099056243896, 0.0001533031463623047, 0.0001642853021621704, 0.00017526745796203613, 0.00018624961376190186, 0.00019723176956176758, 0.0002082139253616333, 0.00021919608116149902, 0.00023017823696136475, 0.00024116039276123047, 0.0002521425485610962, 0.0002631247043609619, 0.00027410686016082764, 0.00028508901596069336, 0.0002960711717605591, 0.0003070533275604248, 0.00031803548336029053, 0.00032901763916015625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 18.0, 22.0, 44.0, 123.0, 222.0, 712.0, 3242.0, 28123.0, 646166.0, 346074.0, 20181.0, 2636.0, 581.0, 231.0, 82.0, 43.0, 23.0, 14.0, 7.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.162109375, -2.067840576171875, -1.97357177734375, -1.879302978515625, -1.7850341796875, -1.690765380859375, -1.59649658203125, -1.502227783203125, -1.407958984375, -1.313690185546875, -1.21942138671875, -1.125152587890625, -1.0308837890625, -0.936614990234375, -0.84234619140625, -0.748077392578125, -0.65380859375, -0.559539794921875, -0.46527099609375, -0.371002197265625, -0.2767333984375, -0.182464599609375, -0.08819580078125, 0.006072998046875, 0.100341796875, 0.194610595703125, 0.28887939453125, 0.383148193359375, 0.4774169921875, 0.571685791015625, 0.66595458984375, 0.760223388671875, 0.8544921875, 0.948760986328125, 1.04302978515625, 1.137298583984375, 1.2315673828125, 1.325836181640625, 1.42010498046875, 1.514373779296875, 1.608642578125, 1.702911376953125, 1.79718017578125, 1.891448974609375, 1.9857177734375, 2.079986572265625, 2.17425537109375, 2.268524169921875, 2.36279296875, 2.457061767578125, 2.55133056640625, 2.645599365234375, 2.7398681640625, 2.834136962890625, 2.92840576171875, 3.022674560546875, 3.116943359375, 3.211212158203125, 3.30548095703125, 3.399749755859375, 3.4940185546875, 3.588287353515625, 3.68255615234375, 3.776824951171875, 3.87109375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 7.0, 11.0, 9.0, 23.0, 24.0, 19.0, 39.0, 42.0, 54.0, 75.0, 105.0, 99.0, 120.0, 90.0, 79.0, 59.0, 42.0, 37.0, 20.0, 18.0, 6.0, 13.0, 2.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5283203125, -1.4672698974609375, -1.406219482421875, -1.3451690673828125, -1.28411865234375, -1.2230682373046875, -1.162017822265625, -1.1009674072265625, -1.0399169921875, -0.9788665771484375, -0.917816162109375, -0.8567657470703125, -0.79571533203125, -0.7346649169921875, -0.673614501953125, -0.6125640869140625, -0.551513671875, -0.4904632568359375, -0.429412841796875, -0.3683624267578125, -0.30731201171875, -0.2462615966796875, -0.185211181640625, -0.1241607666015625, -0.0631103515625, -0.0020599365234375, 0.058990478515625, 0.1200408935546875, 0.18109130859375, 0.2421417236328125, 0.303192138671875, 0.3642425537109375, 0.42529296875, 0.4863433837890625, 0.547393798828125, 0.6084442138671875, 0.66949462890625, 0.7305450439453125, 0.791595458984375, 0.8526458740234375, 0.9136962890625, 0.9747467041015625, 1.035797119140625, 1.0968475341796875, 1.15789794921875, 1.2189483642578125, 1.279998779296875, 1.3410491943359375, 1.402099609375, 1.4631500244140625, 1.524200439453125, 1.5852508544921875, 1.64630126953125, 1.7073516845703125, 1.768402099609375, 1.8294525146484375, 1.8905029296875, 1.9515533447265625, 2.012603759765625, 2.0736541748046875, 2.13470458984375, 2.1957550048828125, 2.256805419921875, 2.3178558349609375, 2.37890625]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 5.0, 6.0, 9.0, 27.0, 77.0, 220.0, 352.0, 180.0, 77.0, 24.0, 12.0, 5.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-46.987667083740234, -45.04798889160156, -43.108306884765625, -41.16862869262695, -39.22895050048828, -37.289268493652344, -35.34959030151367, -33.409912109375, -31.470230102539062, -29.530550003051758, -27.590869903564453, -25.65119171142578, -23.711511611938477, -21.771831512451172, -19.8321533203125, -17.892473220825195, -15.95279312133789, -14.013113021850586, -12.073433876037598, -10.13375473022461, -8.194074630737305, -6.25439453125, -4.314715385437012, -2.3750362396240234, -0.43535614013671875, 1.5043234825134277, 3.444003105163574, 5.383682727813721, 7.323362350463867, 9.263042449951172, 11.20272159576416, 13.142400741577148, 15.082077026367188, 17.021757125854492, 18.961437225341797, 20.90111541748047, 22.840795516967773, 24.780475616455078, 26.72015380859375, 28.659833908081055, 30.59951400756836, 32.53919219970703, 34.47887420654297, 36.41855239868164, 38.35823059082031, 40.29791259765625, 42.23759078979492, 44.177268981933594, 46.11695098876953, 48.0566291809082, 49.99631118774414, 51.93598937988281, 53.87567138671875, 55.81534957885742, 57.755027770996094, 59.69470977783203, 61.6343879699707, 63.574066162109375, 65.51374816894531, 67.45343017578125, 69.39310455322266, 71.3327865600586, 73.27246856689453, 75.21214294433594, 77.15182495117188]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 1.0, 5.0, 3.0, 2.0, 5.0, 8.0, 13.0, 9.0, 14.0, 21.0, 26.0, 29.0, 24.0, 34.0, 32.0, 36.0, 45.0, 52.0, 94.0, 113.0, 73.0, 61.0, 39.0, 48.0, 32.0, 27.0, 21.0, 21.0, 24.0, 21.0, 15.0, 11.0, 11.0, 8.0, 12.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-35.13483428955078, -34.174034118652344, -33.21323776245117, -32.252437591552734, -31.291637420654297, -30.330839157104492, -29.370040893554688, -28.40924072265625, -27.448440551757812, -26.487642288208008, -25.52684211730957, -24.566043853759766, -23.605243682861328, -22.644445419311523, -21.68364715576172, -20.72284698486328, -19.762048721313477, -18.801250457763672, -17.840450286865234, -16.87965202331543, -15.918851852416992, -14.958053588867188, -13.997254371643066, -13.036455154418945, -12.075655937194824, -11.114856719970703, -10.154057502746582, -9.193258285522461, -8.232460021972656, -7.271660327911377, -6.310861587524414, -5.350062370300293, -4.389263153076172, -3.428463935852051, -2.467664957046509, -1.5068659782409668, -0.5460667610168457, 0.4147324562072754, 1.3755311965942383, 2.3363304138183594, 3.2971296310424805, 4.257928848266602, 5.218728065490723, 6.1795268058776855, 7.140326023101807, 8.101125717163086, 9.06192398071289, 10.022723197937012, 10.983522415161133, 11.944321632385254, 12.905120849609375, 13.86591911315918, 14.826719284057617, 15.787517547607422, 16.74831771850586, 17.709115982055664, 18.66991424560547, 19.630712509155273, 20.59151268005371, 21.552310943603516, 22.513111114501953, 23.473909378051758, 24.434707641601562, 25.3955078125, 26.356307983398438]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 3.0, 5.0, 8.0, 15.0, 24.0, 26.0, 46.0, 71.0, 97.0, 185.0, 275.0, 583.0, 1144.0, 3152.0, 10468.0, 49861.0, 601952.0, 3180812.0, 300430.0, 32712.0, 7823.0, 2465.0, 968.0, 508.0, 263.0, 146.0, 72.0, 52.0, 44.0, 21.0, 15.0, 15.0, 10.0, 3.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.265625, -3.15057373046875, -3.0355224609375, -2.92047119140625, -2.805419921875, -2.69036865234375, -2.5753173828125, -2.46026611328125, -2.34521484375, -2.23016357421875, -2.1151123046875, -2.00006103515625, -1.885009765625, -1.76995849609375, -1.6549072265625, -1.53985595703125, -1.4248046875, -1.30975341796875, -1.1947021484375, -1.07965087890625, -0.964599609375, -0.84954833984375, -0.7344970703125, -0.61944580078125, -0.50439453125, -0.38934326171875, -0.2742919921875, -0.15924072265625, -0.044189453125, 0.07086181640625, 0.1859130859375, 0.30096435546875, 0.416015625, 0.53106689453125, 0.6461181640625, 0.76116943359375, 0.876220703125, 0.99127197265625, 1.1063232421875, 1.22137451171875, 1.33642578125, 1.45147705078125, 1.5665283203125, 1.68157958984375, 1.796630859375, 1.91168212890625, 2.0267333984375, 2.14178466796875, 2.2568359375, 2.37188720703125, 2.4869384765625, 2.60198974609375, 2.717041015625, 2.83209228515625, 2.9471435546875, 3.06219482421875, 3.17724609375, 3.29229736328125, 3.4073486328125, 3.52239990234375, 3.637451171875, 3.75250244140625, 3.8675537109375, 3.98260498046875, 4.09765625]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 6.0, 11.0, 9.0, 9.0, 8.0, 16.0, 17.0, 23.0, 28.0, 20.0, 28.0, 24.0, 40.0, 55.0, 37.0, 45.0, 42.0, 64.0, 63.0, 59.0, 47.0, 42.0, 50.0, 41.0, 34.0, 31.0, 40.0, 26.0, 12.0, 12.0, 14.0, 16.0, 10.0, 4.0, 6.0, 6.0, 7.0, 2.0, 2.0, 4.0, 0.0, 2.0, 2.0], "bins": [-2.1875, -2.1316986083984375, -2.075897216796875, -2.0200958251953125, -1.96429443359375, -1.9084930419921875, -1.852691650390625, -1.7968902587890625, -1.7410888671875, -1.6852874755859375, -1.629486083984375, -1.5736846923828125, -1.51788330078125, -1.4620819091796875, -1.406280517578125, -1.3504791259765625, -1.294677734375, -1.2388763427734375, -1.183074951171875, -1.1272735595703125, -1.07147216796875, -1.0156707763671875, -0.959869384765625, -0.9040679931640625, -0.8482666015625, -0.7924652099609375, -0.736663818359375, -0.6808624267578125, -0.62506103515625, -0.5692596435546875, -0.513458251953125, -0.4576568603515625, -0.40185546875, -0.3460540771484375, -0.290252685546875, -0.2344512939453125, -0.17864990234375, -0.1228485107421875, -0.067047119140625, -0.0112457275390625, 0.0445556640625, 0.1003570556640625, 0.156158447265625, 0.2119598388671875, 0.26776123046875, 0.3235626220703125, 0.379364013671875, 0.4351654052734375, 0.490966796875, 0.5467681884765625, 0.602569580078125, 0.6583709716796875, 0.71417236328125, 0.7699737548828125, 0.825775146484375, 0.8815765380859375, 0.9373779296875, 0.9931793212890625, 1.048980712890625, 1.1047821044921875, 1.16058349609375, 1.2163848876953125, 1.272186279296875, 1.3279876708984375, 1.3837890625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 6.0, 7.0, 7.0, 7.0, 6.0, 10.0, 13.0, 16.0, 41.0, 39.0, 69.0, 102.0, 220.0, 372.0, 871.0, 2293.0, 7548.0, 32948.0, 275525.0, 3291445.0, 519475.0, 48413.0, 9970.0, 2799.0, 1090.0, 436.0, 213.0, 115.0, 62.0, 49.0, 27.0, 19.0, 13.0, 13.0, 12.0, 10.0, 7.0, 8.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.927734375, -3.807281494140625, -3.68682861328125, -3.566375732421875, -3.4459228515625, -3.325469970703125, -3.20501708984375, -3.084564208984375, -2.964111328125, -2.843658447265625, -2.72320556640625, -2.602752685546875, -2.4822998046875, -2.361846923828125, -2.24139404296875, -2.120941162109375, -2.00048828125, -1.880035400390625, -1.75958251953125, -1.639129638671875, -1.5186767578125, -1.398223876953125, -1.27777099609375, -1.157318115234375, -1.036865234375, -0.916412353515625, -0.79595947265625, -0.675506591796875, -0.5550537109375, -0.434600830078125, -0.31414794921875, -0.193695068359375, -0.0732421875, 0.047210693359375, 0.16766357421875, 0.288116455078125, 0.4085693359375, 0.529022216796875, 0.64947509765625, 0.769927978515625, 0.890380859375, 1.010833740234375, 1.13128662109375, 1.251739501953125, 1.3721923828125, 1.492645263671875, 1.61309814453125, 1.733551025390625, 1.85400390625, 1.974456787109375, 2.09490966796875, 2.215362548828125, 2.3358154296875, 2.456268310546875, 2.57672119140625, 2.697174072265625, 2.817626953125, 2.938079833984375, 3.05853271484375, 3.178985595703125, 3.2994384765625, 3.419891357421875, 3.54034423828125, 3.660797119140625, 3.78125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 3.0, 6.0, 5.0, 5.0, 8.0, 13.0, 12.0, 16.0, 24.0, 40.0, 51.0, 64.0, 113.0, 151.0, 221.0, 376.0, 489.0, 662.0, 588.0, 401.0, 272.0, 153.0, 119.0, 69.0, 68.0, 47.0, 23.0, 21.0, 18.0, 8.0, 6.0, 9.0, 2.0, 3.0, 3.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.392578125, -3.29150390625, -3.1904296875, -3.08935546875, -2.98828125, -2.88720703125, -2.7861328125, -2.68505859375, -2.583984375, -2.48291015625, -2.3818359375, -2.28076171875, -2.1796875, -2.07861328125, -1.9775390625, -1.87646484375, -1.775390625, -1.67431640625, -1.5732421875, -1.47216796875, -1.37109375, -1.27001953125, -1.1689453125, -1.06787109375, -0.966796875, -0.86572265625, -0.7646484375, -0.66357421875, -0.5625, -0.46142578125, -0.3603515625, -0.25927734375, -0.158203125, -0.05712890625, 0.0439453125, 0.14501953125, 0.24609375, 0.34716796875, 0.4482421875, 0.54931640625, 0.650390625, 0.75146484375, 0.8525390625, 0.95361328125, 1.0546875, 1.15576171875, 1.2568359375, 1.35791015625, 1.458984375, 1.56005859375, 1.6611328125, 1.76220703125, 1.86328125, 1.96435546875, 2.0654296875, 2.16650390625, 2.267578125, 2.36865234375, 2.4697265625, 2.57080078125, 2.671875, 2.77294921875, 2.8740234375, 2.97509765625, 3.076171875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 7.0, 14.0, 42.0, 136.0, 243.0, 258.0, 167.0, 81.0, 29.0, 12.0, 6.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.297306060791016, -48.68324279785156, -47.069175720214844, -45.455108642578125, -43.84104537963867, -42.22698211669922, -40.6129150390625, -38.99884796142578, -37.38478469848633, -35.770721435546875, -34.156654357910156, -32.54258728027344, -30.928524017333984, -29.3144588470459, -27.700393676757812, -26.086328506469727, -24.47226333618164, -22.858198165893555, -21.24413299560547, -19.630067825317383, -18.016002655029297, -16.40193748474121, -14.787872314453125, -13.173807144165039, -11.559741973876953, -9.945676803588867, -8.331611633300781, -6.717546463012695, -5.103481292724609, -3.4894161224365234, -1.8753509521484375, -0.26128578186035156, 1.352783203125, 2.966848373413086, 4.580913543701172, 6.194978713989258, 7.809043884277344, 9.42310905456543, 11.037174224853516, 12.651239395141602, 14.265304565429688, 15.879369735717773, 17.49343490600586, 19.107500076293945, 20.72156524658203, 22.335630416870117, 23.949695587158203, 25.56376075744629, 27.177825927734375, 28.79189109802246, 30.405956268310547, 32.02001953125, 33.63408660888672, 35.24815368652344, 36.86221694946289, 38.476280212402344, 40.09034729003906, 41.70441436767578, 43.318477630615234, 44.93254089355469, 46.546607971191406, 48.160675048828125, 49.77473831176758, 51.38880157470703, 53.00286865234375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 7.0, 8.0, 9.0, 13.0, 9.0, 13.0, 20.0, 15.0, 15.0, 21.0, 21.0, 29.0, 25.0, 43.0, 43.0, 44.0, 44.0, 52.0, 39.0, 46.0, 46.0, 52.0, 42.0, 50.0, 38.0, 31.0, 34.0, 26.0, 27.0, 25.0, 25.0, 17.0, 9.0, 18.0, 4.0, 6.0, 14.0, 2.0, 4.0, 4.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.289567947387695, -11.863394737243652, -11.43722152709961, -11.011048316955566, -10.584875106811523, -10.15870189666748, -9.732528686523438, -9.306354522705078, -8.880182266235352, -8.454009056091309, -8.027835845947266, -7.601662635803223, -7.17548942565918, -6.749316215515137, -6.3231425285339355, -5.896969318389893, -5.470795631408691, -5.044622421264648, -4.6184492111206055, -4.1922760009765625, -3.7661025524139404, -3.3399293422698975, -2.9137558937072754, -2.4875826835632324, -2.0614094734191895, -1.6352362632751465, -1.209062933921814, -0.7828896045684814, -0.3567163944244385, 0.06945681571960449, 0.49563026428222656, 0.9218034744262695, 1.3479766845703125, 1.7741498947143555, 2.2003231048583984, 2.6264965534210205, 3.0526697635650635, 3.4788429737091064, 3.9050164222717285, 4.3311896324157715, 4.7573628425598145, 5.183536052703857, 5.6097092628479, 6.035882949829102, 6.4620561599731445, 6.8882293701171875, 7.3144025802612305, 7.740575790405273, 8.166749000549316, 8.59292221069336, 9.019095420837402, 9.445268630981445, 9.871441841125488, 10.297615051269531, 10.72378921508789, 11.149961471557617, 11.576135635375977, 12.00230884552002, 12.428482055664062, 12.854655265808105, 13.280828475952148, 13.707001686096191, 14.133174896240234, 14.559349060058594, 14.98552131652832]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 2.0, 8.0, 2.0, 6.0, 14.0, 19.0, 29.0, 40.0, 66.0, 120.0, 197.0, 351.0, 755.0, 1616.0, 3897.0, 11382.0, 36304.0, 133525.0, 419725.0, 315386.0, 87261.0, 24453.0, 7868.0, 2983.0, 1222.0, 595.0, 277.0, 165.0, 102.0, 59.0, 45.0, 26.0, 14.0, 9.0, 10.0, 10.0, 9.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.0078125, -3.889373779296875, -3.77093505859375, -3.652496337890625, -3.5340576171875, -3.415618896484375, -3.29718017578125, -3.178741455078125, -3.060302734375, -2.941864013671875, -2.82342529296875, -2.704986572265625, -2.5865478515625, -2.468109130859375, -2.34967041015625, -2.231231689453125, -2.11279296875, -1.994354248046875, -1.87591552734375, -1.757476806640625, -1.6390380859375, -1.520599365234375, -1.40216064453125, -1.283721923828125, -1.165283203125, -1.046844482421875, -0.92840576171875, -0.809967041015625, -0.6915283203125, -0.573089599609375, -0.45465087890625, -0.336212158203125, -0.2177734375, -0.099334716796875, 0.01910400390625, 0.137542724609375, 0.2559814453125, 0.374420166015625, 0.49285888671875, 0.611297607421875, 0.729736328125, 0.848175048828125, 0.96661376953125, 1.085052490234375, 1.2034912109375, 1.321929931640625, 1.44036865234375, 1.558807373046875, 1.67724609375, 1.795684814453125, 1.91412353515625, 2.032562255859375, 2.1510009765625, 2.269439697265625, 2.38787841796875, 2.506317138671875, 2.624755859375, 2.743194580078125, 2.86163330078125, 2.980072021484375, 3.0985107421875, 3.216949462890625, 3.33538818359375, 3.453826904296875, 3.572265625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 6.0, 3.0, 4.0, 5.0, 8.0, 11.0, 17.0, 23.0, 31.0, 17.0, 31.0, 29.0, 48.0, 44.0, 34.0, 45.0, 56.0, 56.0, 56.0, 46.0, 44.0, 51.0, 45.0, 41.0, 43.0, 31.0, 34.0, 20.0, 30.0, 22.0, 18.0, 15.0, 12.0, 9.0, 6.0, 6.0, 5.0, 1.0, 2.0, 2.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.177734375, -2.118560791015625, -2.05938720703125, -2.000213623046875, -1.9410400390625, -1.881866455078125, -1.82269287109375, -1.763519287109375, -1.704345703125, -1.645172119140625, -1.58599853515625, -1.526824951171875, -1.4676513671875, -1.408477783203125, -1.34930419921875, -1.290130615234375, -1.23095703125, -1.171783447265625, -1.11260986328125, -1.053436279296875, -0.9942626953125, -0.935089111328125, -0.87591552734375, -0.816741943359375, -0.757568359375, -0.698394775390625, -0.63922119140625, -0.580047607421875, -0.5208740234375, -0.461700439453125, -0.40252685546875, -0.343353271484375, -0.2841796875, -0.225006103515625, -0.16583251953125, -0.106658935546875, -0.0474853515625, 0.011688232421875, 0.07086181640625, 0.130035400390625, 0.189208984375, 0.248382568359375, 0.30755615234375, 0.366729736328125, 0.4259033203125, 0.485076904296875, 0.54425048828125, 0.603424072265625, 0.66259765625, 0.721771240234375, 0.78094482421875, 0.840118408203125, 0.8992919921875, 0.958465576171875, 1.01763916015625, 1.076812744140625, 1.135986328125, 1.195159912109375, 1.25433349609375, 1.313507080078125, 1.3726806640625, 1.431854248046875, 1.49102783203125, 1.550201416015625, 1.609375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 9.0, 7.0, 16.0, 24.0, 27.0, 38.0, 44.0, 60.0, 81.0, 118.0, 145.0, 243.0, 340.0, 548.0, 1024.0, 2304.0, 6433.0, 25060.0, 137235.0, 691265.0, 145676.0, 26007.0, 6877.0, 2223.0, 1037.0, 544.0, 360.0, 238.0, 144.0, 98.0, 79.0, 63.0, 62.0, 34.0, 35.0, 13.0, 12.0, 10.0, 9.0, 7.0, 2.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8125, -4.66448974609375, -4.5164794921875, -4.36846923828125, -4.220458984375, -4.07244873046875, -3.9244384765625, -3.77642822265625, -3.62841796875, -3.48040771484375, -3.3323974609375, -3.18438720703125, -3.036376953125, -2.88836669921875, -2.7403564453125, -2.59234619140625, -2.4443359375, -2.29632568359375, -2.1483154296875, -2.00030517578125, -1.852294921875, -1.70428466796875, -1.5562744140625, -1.40826416015625, -1.26025390625, -1.11224365234375, -0.9642333984375, -0.81622314453125, -0.668212890625, -0.52020263671875, -0.3721923828125, -0.22418212890625, -0.076171875, 0.07183837890625, 0.2198486328125, 0.36785888671875, 0.515869140625, 0.66387939453125, 0.8118896484375, 0.95989990234375, 1.10791015625, 1.25592041015625, 1.4039306640625, 1.55194091796875, 1.699951171875, 1.84796142578125, 1.9959716796875, 2.14398193359375, 2.2919921875, 2.44000244140625, 2.5880126953125, 2.73602294921875, 2.884033203125, 3.03204345703125, 3.1800537109375, 3.32806396484375, 3.47607421875, 3.62408447265625, 3.7720947265625, 3.92010498046875, 4.068115234375, 4.21612548828125, 4.3641357421875, 4.51214599609375, 4.66015625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 4.0, 1.0, 6.0, 4.0, 6.0, 5.0, 5.0, 6.0, 5.0, 12.0, 11.0, 11.0, 14.0, 31.0, 15.0, 29.0, 25.0, 30.0, 31.0, 35.0, 41.0, 38.0, 48.0, 49.0, 46.0, 55.0, 55.0, 43.0, 40.0, 38.0, 37.0, 36.0, 29.0, 27.0, 21.0, 16.0, 24.0, 9.0, 13.0, 2.0, 7.0, 5.0, 10.0, 7.0, 7.0, 5.0, 5.0, 3.0, 2.0, 2.0, 0.0, 3.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.28125, -5.0919189453125, -4.902587890625, -4.7132568359375, -4.52392578125, -4.3345947265625, -4.145263671875, -3.9559326171875, -3.7666015625, -3.5772705078125, -3.387939453125, -3.1986083984375, -3.00927734375, -2.8199462890625, -2.630615234375, -2.4412841796875, -2.251953125, -2.0626220703125, -1.873291015625, -1.6839599609375, -1.49462890625, -1.3052978515625, -1.115966796875, -0.9266357421875, -0.7373046875, -0.5479736328125, -0.358642578125, -0.1693115234375, 0.02001953125, 0.2093505859375, 0.398681640625, 0.5880126953125, 0.77734375, 0.9666748046875, 1.156005859375, 1.3453369140625, 1.53466796875, 1.7239990234375, 1.913330078125, 2.1026611328125, 2.2919921875, 2.4813232421875, 2.670654296875, 2.8599853515625, 3.04931640625, 3.2386474609375, 3.427978515625, 3.6173095703125, 3.806640625, 3.9959716796875, 4.185302734375, 4.3746337890625, 4.56396484375, 4.7532958984375, 4.942626953125, 5.1319580078125, 5.3212890625, 5.5106201171875, 5.699951171875, 5.8892822265625, 6.07861328125, 6.2679443359375, 6.457275390625, 6.6466064453125, 6.8359375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 9.0, 6.0, 4.0, 8.0, 19.0, 44.0, 78.0, 112.0, 211.0, 542.0, 1301.0, 4327.0, 18847.0, 116518.0, 790987.0, 93583.0, 15939.0, 3844.0, 1248.0, 460.0, 203.0, 119.0, 58.0, 23.0, 20.0, 12.0, 7.0, 10.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.578125, -1.51611328125, -1.4541015625, -1.39208984375, -1.330078125, -1.26806640625, -1.2060546875, -1.14404296875, -1.08203125, -1.02001953125, -0.9580078125, -0.89599609375, -0.833984375, -0.77197265625, -0.7099609375, -0.64794921875, -0.5859375, -0.52392578125, -0.4619140625, -0.39990234375, -0.337890625, -0.27587890625, -0.2138671875, -0.15185546875, -0.08984375, -0.02783203125, 0.0341796875, 0.09619140625, 0.158203125, 0.22021484375, 0.2822265625, 0.34423828125, 0.40625, 0.46826171875, 0.5302734375, 0.59228515625, 0.654296875, 0.71630859375, 0.7783203125, 0.84033203125, 0.90234375, 0.96435546875, 1.0263671875, 1.08837890625, 1.150390625, 1.21240234375, 1.2744140625, 1.33642578125, 1.3984375, 1.46044921875, 1.5224609375, 1.58447265625, 1.646484375, 1.70849609375, 1.7705078125, 1.83251953125, 1.89453125, 1.95654296875, 2.0185546875, 2.08056640625, 2.142578125, 2.20458984375, 2.2666015625, 2.32861328125, 2.390625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 4.0, 5.0, 2.0, 6.0, 4.0, 7.0, 15.0, 20.0, 11.0, 21.0, 34.0, 42.0, 60.0, 74.0, 122.0, 111.0, 122.0, 81.0, 61.0, 40.0, 33.0, 23.0, 29.0, 22.0, 10.0, 10.0, 9.0, 7.0, 8.0, 2.0, 0.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002899169921875, -0.00027972087264060974, -0.0002695247530937195, -0.0002593286335468292, -0.00024913251399993896, -0.0002389363944530487, -0.00022874027490615845, -0.0002185441553592682, -0.00020834803581237793, -0.00019815191626548767, -0.0001879557967185974, -0.00017775967717170715, -0.0001675635576248169, -0.00015736743807792664, -0.00014717131853103638, -0.00013697519898414612, -0.00012677907943725586, -0.0001165829598903656, -0.00010638684034347534, -9.619072079658508e-05, -8.599460124969482e-05, -7.579848170280457e-05, -6.56023621559143e-05, -5.540624260902405e-05, -4.521012306213379e-05, -3.501400351524353e-05, -2.481788396835327e-05, -1.4621764421463013e-05, -4.425644874572754e-06, 5.770474672317505e-06, 1.5966594219207764e-05, 2.6162713766098022e-05, 3.635883331298828e-05, 4.655495285987854e-05, 5.67510724067688e-05, 6.694719195365906e-05, 7.714331150054932e-05, 8.733943104743958e-05, 9.753555059432983e-05, 0.00010773167014122009, 0.00011792778968811035, 0.0001281239092350006, 0.00013832002878189087, 0.00014851614832878113, 0.0001587122678756714, 0.00016890838742256165, 0.0001791045069694519, 0.00018930062651634216, 0.00019949674606323242, 0.00020969286561012268, 0.00021988898515701294, 0.0002300851047039032, 0.00024028122425079346, 0.0002504773437976837, 0.000260673463344574, 0.00027086958289146423, 0.0002810657024383545, 0.00029126182198524475, 0.000301457941532135, 0.00031165406107902527, 0.00032185018062591553, 0.0003320463001728058, 0.00034224241971969604, 0.0003524385392665863, 0.00036263465881347656]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 7.0, 7.0, 4.0, 6.0, 8.0, 15.0, 18.0, 28.0, 47.0, 53.0, 89.0, 124.0, 243.0, 427.0, 808.0, 1561.0, 3585.0, 9050.0, 27788.0, 104383.0, 653586.0, 181503.0, 42420.0, 13415.0, 4909.0, 2146.0, 990.0, 535.0, 286.0, 199.0, 84.0, 70.0, 55.0, 32.0, 21.0, 16.0, 11.0, 12.0, 8.0, 5.0, 0.0, 3.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.310546875, -1.267822265625, -1.22509765625, -1.182373046875, -1.1396484375, -1.096923828125, -1.05419921875, -1.011474609375, -0.96875, -0.926025390625, -0.88330078125, -0.840576171875, -0.7978515625, -0.755126953125, -0.71240234375, -0.669677734375, -0.626953125, -0.584228515625, -0.54150390625, -0.498779296875, -0.4560546875, -0.413330078125, -0.37060546875, -0.327880859375, -0.28515625, -0.242431640625, -0.19970703125, -0.156982421875, -0.1142578125, -0.071533203125, -0.02880859375, 0.013916015625, 0.056640625, 0.099365234375, 0.14208984375, 0.184814453125, 0.2275390625, 0.270263671875, 0.31298828125, 0.355712890625, 0.3984375, 0.441162109375, 0.48388671875, 0.526611328125, 0.5693359375, 0.612060546875, 0.65478515625, 0.697509765625, 0.740234375, 0.782958984375, 0.82568359375, 0.868408203125, 0.9111328125, 0.953857421875, 0.99658203125, 1.039306640625, 1.08203125, 1.124755859375, 1.16748046875, 1.210205078125, 1.2529296875, 1.295654296875, 1.33837890625, 1.381103515625, 1.423828125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 7.0, 1.0, 1.0, 3.0, 4.0, 7.0, 7.0, 10.0, 10.0, 11.0, 20.0, 22.0, 40.0, 80.0, 80.0, 130.0, 122.0, 114.0, 100.0, 68.0, 43.0, 25.0, 24.0, 18.0, 16.0, 14.0, 14.0, 6.0, 5.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8681640625, -1.8090057373046875, -1.749847412109375, -1.6906890869140625, -1.63153076171875, -1.5723724365234375, -1.513214111328125, -1.4540557861328125, -1.3948974609375, -1.3357391357421875, -1.276580810546875, -1.2174224853515625, -1.15826416015625, -1.0991058349609375, -1.039947509765625, -0.9807891845703125, -0.921630859375, -0.8624725341796875, -0.803314208984375, -0.7441558837890625, -0.68499755859375, -0.6258392333984375, -0.566680908203125, -0.5075225830078125, -0.4483642578125, -0.3892059326171875, -0.330047607421875, -0.2708892822265625, -0.21173095703125, -0.1525726318359375, -0.093414306640625, -0.0342559814453125, 0.02490234375, 0.0840606689453125, 0.143218994140625, 0.2023773193359375, 0.26153564453125, 0.3206939697265625, 0.379852294921875, 0.4390106201171875, 0.4981689453125, 0.5573272705078125, 0.616485595703125, 0.6756439208984375, 0.73480224609375, 0.7939605712890625, 0.853118896484375, 0.9122772216796875, 0.971435546875, 1.0305938720703125, 1.089752197265625, 1.1489105224609375, 1.20806884765625, 1.2672271728515625, 1.326385498046875, 1.3855438232421875, 1.4447021484375, 1.5038604736328125, 1.563018798828125, 1.6221771240234375, 1.68133544921875, 1.7404937744140625, 1.799652099609375, 1.8588104248046875, 1.91796875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 4.0, 1.0, 6.0, 11.0, 11.0, 27.0, 46.0, 93.0, 150.0, 294.0, 140.0, 87.0, 48.0, 33.0, 21.0, 11.0, 11.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.427356719970703, -17.297054290771484, -16.166751861572266, -15.03644847869873, -13.906146049499512, -12.775843620300293, -11.645540237426758, -10.515237808227539, -9.38493537902832, -8.254632949829102, -7.124330043792725, -5.994027137756348, -4.863724708557129, -3.73342227935791, -2.603119373321533, -1.4728164672851562, -0.3425140380859375, 0.7877886295318604, 1.9180912971496582, 3.048393964767456, 4.178696632385254, 5.308999061584473, 6.43930196762085, 7.569604873657227, 8.699907302856445, 9.830209732055664, 10.960512161254883, 12.090815544128418, 13.221117973327637, 14.351420402526855, 15.48172378540039, 16.61202621459961, 17.742324829101562, 18.87262725830078, 20.0029296875, 21.13323211669922, 22.263534545898438, 23.393836975097656, 24.524141311645508, 25.654443740844727, 26.784746170043945, 27.915048599243164, 29.045351028442383, 30.1756534576416, 31.305957794189453, 32.43626022338867, 33.56656265258789, 34.69686508178711, 35.82716751098633, 36.95746994018555, 38.087772369384766, 39.218074798583984, 40.3483772277832, 41.47867965698242, 42.60898208618164, 43.739288330078125, 44.869590759277344, 45.99989318847656, 47.13019561767578, 48.260498046875, 49.39080047607422, 50.52110290527344, 51.651405334472656, 52.781707763671875, 53.912010192871094]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 7.0, 8.0, 7.0, 14.0, 11.0, 14.0, 17.0, 22.0, 20.0, 29.0, 30.0, 23.0, 45.0, 48.0, 67.0, 94.0, 113.0, 81.0, 66.0, 36.0, 38.0, 33.0, 29.0, 18.0, 20.0, 18.0, 17.0, 13.0, 13.0, 9.0, 6.0, 10.0, 6.0, 2.0, 5.0, 6.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.393543243408203, -23.50079917907715, -22.608055114746094, -21.71531105041504, -20.822566986083984, -19.929824829101562, -19.037080764770508, -18.144336700439453, -17.2515926361084, -16.358848571777344, -15.466104507446289, -14.57336139678955, -13.680617332458496, -12.787873268127441, -11.895130157470703, -11.002386093139648, -10.109642028808594, -9.216897964477539, -8.324153900146484, -7.431410789489746, -6.538666725158691, -5.645922660827637, -4.75317907333374, -3.8604354858398438, -2.967691421508789, -2.0749475955963135, -1.182203769683838, -0.2894599437713623, 0.6032838821411133, 1.496027946472168, 2.3887715339660645, 3.281515121459961, 4.174259185791016, 5.06700325012207, 5.959746837615967, 6.852490425109863, 7.745234489440918, 8.637978553771973, 9.530721664428711, 10.423465728759766, 11.31620979309082, 12.208953857421875, 13.10169792175293, 13.994441032409668, 14.887185096740723, 15.779929161071777, 16.672672271728516, 17.56541633605957, 18.458160400390625, 19.35090446472168, 20.243648529052734, 21.13639259338379, 22.029136657714844, 22.921878814697266, 23.81462287902832, 24.707366943359375, 25.60011100769043, 26.492855072021484, 27.38559913635254, 28.278343200683594, 29.171085357666016, 30.063831329345703, 30.956573486328125, 31.84931755065918, 32.742061614990234]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 5.0, 7.0, 4.0, 6.0, 10.0, 21.0, 21.0, 16.0, 34.0, 58.0, 69.0, 100.0, 151.0, 220.0, 391.0, 649.0, 1135.0, 2125.0, 4724.0, 12189.0, 44157.0, 267923.0, 2096670.0, 1536958.0, 175578.0, 32645.0, 9979.0, 3907.0, 1921.0, 1056.0, 556.0, 336.0, 201.0, 157.0, 96.0, 43.0, 54.0, 22.0, 24.0, 21.0, 11.0, 8.0, 8.0, 6.0, 3.0, 1.0, 2.0, 8.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.357421875, -3.258392333984375, -3.15936279296875, -3.060333251953125, -2.9613037109375, -2.862274169921875, -2.76324462890625, -2.664215087890625, -2.565185546875, -2.466156005859375, -2.36712646484375, -2.268096923828125, -2.1690673828125, -2.070037841796875, -1.97100830078125, -1.871978759765625, -1.77294921875, -1.673919677734375, -1.57489013671875, -1.475860595703125, -1.3768310546875, -1.277801513671875, -1.17877197265625, -1.079742431640625, -0.980712890625, -0.881683349609375, -0.78265380859375, -0.683624267578125, -0.5845947265625, -0.485565185546875, -0.38653564453125, -0.287506103515625, -0.1884765625, -0.089447021484375, 0.00958251953125, 0.108612060546875, 0.2076416015625, 0.306671142578125, 0.40570068359375, 0.504730224609375, 0.603759765625, 0.702789306640625, 0.80181884765625, 0.900848388671875, 0.9998779296875, 1.098907470703125, 1.19793701171875, 1.296966552734375, 1.39599609375, 1.495025634765625, 1.59405517578125, 1.693084716796875, 1.7921142578125, 1.891143798828125, 1.99017333984375, 2.089202880859375, 2.188232421875, 2.287261962890625, 2.38629150390625, 2.485321044921875, 2.5843505859375, 2.683380126953125, 2.78240966796875, 2.881439208984375, 2.98046875]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 7.0, 7.0, 10.0, 13.0, 14.0, 15.0, 15.0, 20.0, 28.0, 27.0, 24.0, 32.0, 44.0, 43.0, 42.0, 42.0, 60.0, 44.0, 53.0, 45.0, 34.0, 40.0, 39.0, 35.0, 36.0, 33.0, 28.0, 24.0, 19.0, 25.0, 19.0, 15.0, 14.0, 12.0, 10.0, 9.0, 7.0, 7.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.646484375, -1.5944671630859375, -1.542449951171875, -1.4904327392578125, -1.43841552734375, -1.3863983154296875, -1.334381103515625, -1.2823638916015625, -1.2303466796875, -1.1783294677734375, -1.126312255859375, -1.0742950439453125, -1.02227783203125, -0.9702606201171875, -0.918243408203125, -0.8662261962890625, -0.814208984375, -0.7621917724609375, -0.710174560546875, -0.6581573486328125, -0.60614013671875, -0.5541229248046875, -0.502105712890625, -0.4500885009765625, -0.3980712890625, -0.3460540771484375, -0.294036865234375, -0.2420196533203125, -0.19000244140625, -0.1379852294921875, -0.085968017578125, -0.0339508056640625, 0.01806640625, 0.0700836181640625, 0.122100830078125, 0.1741180419921875, 0.22613525390625, 0.2781524658203125, 0.330169677734375, 0.3821868896484375, 0.4342041015625, 0.4862213134765625, 0.538238525390625, 0.5902557373046875, 0.64227294921875, 0.6942901611328125, 0.746307373046875, 0.7983245849609375, 0.850341796875, 0.9023590087890625, 0.954376220703125, 1.0063934326171875, 1.05841064453125, 1.1104278564453125, 1.162445068359375, 1.2144622802734375, 1.2664794921875, 1.3184967041015625, 1.370513916015625, 1.4225311279296875, 1.47454833984375, 1.5265655517578125, 1.578582763671875, 1.6305999755859375, 1.6826171875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 8.0, 5.0, 9.0, 17.0, 27.0, 36.0, 46.0, 84.0, 134.0, 257.0, 587.0, 1550.0, 5590.0, 35269.0, 616427.0, 3363660.0, 151143.0, 14699.0, 2986.0, 917.0, 351.0, 177.0, 103.0, 52.0, 52.0, 27.0, 24.0, 15.0, 10.0, 4.0, 8.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.92578125, -4.76837158203125, -4.6109619140625, -4.45355224609375, -4.296142578125, -4.13873291015625, -3.9813232421875, -3.82391357421875, -3.66650390625, -3.50909423828125, -3.3516845703125, -3.19427490234375, -3.036865234375, -2.87945556640625, -2.7220458984375, -2.56463623046875, -2.4072265625, -2.24981689453125, -2.0924072265625, -1.93499755859375, -1.777587890625, -1.62017822265625, -1.4627685546875, -1.30535888671875, -1.14794921875, -0.99053955078125, -0.8331298828125, -0.67572021484375, -0.518310546875, -0.36090087890625, -0.2034912109375, -0.04608154296875, 0.111328125, 0.26873779296875, 0.4261474609375, 0.58355712890625, 0.740966796875, 0.89837646484375, 1.0557861328125, 1.21319580078125, 1.37060546875, 1.52801513671875, 1.6854248046875, 1.84283447265625, 2.000244140625, 2.15765380859375, 2.3150634765625, 2.47247314453125, 2.6298828125, 2.78729248046875, 2.9447021484375, 3.10211181640625, 3.259521484375, 3.41693115234375, 3.5743408203125, 3.73175048828125, 3.88916015625, 4.04656982421875, 4.2039794921875, 4.36138916015625, 4.518798828125, 4.67620849609375, 4.8336181640625, 4.99102783203125, 5.1484375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 7.0, 2.0, 3.0, 10.0, 11.0, 18.0, 33.0, 27.0, 36.0, 62.0, 79.0, 125.0, 154.0, 303.0, 412.0, 536.0, 638.0, 515.0, 382.0, 235.0, 168.0, 102.0, 66.0, 40.0, 35.0, 20.0, 20.0, 16.0, 8.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.609375, -4.4857177734375, -4.362060546875, -4.2384033203125, -4.11474609375, -3.9910888671875, -3.867431640625, -3.7437744140625, -3.6201171875, -3.4964599609375, -3.372802734375, -3.2491455078125, -3.12548828125, -3.0018310546875, -2.878173828125, -2.7545166015625, -2.630859375, -2.5072021484375, -2.383544921875, -2.2598876953125, -2.13623046875, -2.0125732421875, -1.888916015625, -1.7652587890625, -1.6416015625, -1.5179443359375, -1.394287109375, -1.2706298828125, -1.14697265625, -1.0233154296875, -0.899658203125, -0.7760009765625, -0.65234375, -0.5286865234375, -0.405029296875, -0.2813720703125, -0.15771484375, -0.0340576171875, 0.089599609375, 0.2132568359375, 0.3369140625, 0.4605712890625, 0.584228515625, 0.7078857421875, 0.83154296875, 0.9552001953125, 1.078857421875, 1.2025146484375, 1.326171875, 1.4498291015625, 1.573486328125, 1.6971435546875, 1.82080078125, 1.9444580078125, 2.068115234375, 2.1917724609375, 2.3154296875, 2.4390869140625, 2.562744140625, 2.6864013671875, 2.81005859375, 2.9337158203125, 3.057373046875, 3.1810302734375, 3.3046875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 7.0, 10.0, 16.0, 26.0, 50.0, 104.0, 164.0, 186.0, 185.0, 121.0, 57.0, 30.0, 18.0, 12.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.79263687133789, -51.513572692871094, -50.2345085144043, -48.9554443359375, -47.6763801574707, -46.397315979003906, -45.11825180053711, -43.83918762207031, -42.56012725830078, -41.281063079833984, -40.00199890136719, -38.72293472290039, -37.443870544433594, -36.1648063659668, -34.8857421875, -33.60668182373047, -32.327613830566406, -31.04854965209961, -29.769485473632812, -28.490421295166016, -27.21135711669922, -25.932292938232422, -24.653230667114258, -23.37416648864746, -22.095102310180664, -20.816038131713867, -19.53697395324707, -18.257909774780273, -16.97884750366211, -15.699782371520996, -14.420719146728516, -13.141654968261719, -11.862590789794922, -10.583526611328125, -9.304462432861328, -8.025399208068848, -6.746335029602051, -5.467270851135254, -4.188207149505615, -2.9091434478759766, -1.6300792694091797, -0.3510153293609619, 0.9280486106872559, 2.2071125507354736, 3.4861764907836914, 4.765240669250488, 6.044304370880127, 7.323368072509766, 8.602432250976562, 9.88149642944336, 11.160560607910156, 12.439623832702637, 13.718688011169434, 14.99775218963623, 16.27681541442871, 17.555879592895508, 18.834943771362305, 20.1140079498291, 21.3930721282959, 22.672136306762695, 23.95119857788086, 25.230262756347656, 26.509326934814453, 27.78839111328125, 29.067455291748047]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 11.0, 14.0, 8.0, 12.0, 11.0, 21.0, 28.0, 35.0, 37.0, 36.0, 53.0, 54.0, 46.0, 68.0, 62.0, 63.0, 68.0, 65.0, 61.0, 40.0, 40.0, 38.0, 30.0, 24.0, 20.0, 9.0, 11.0, 10.0, 6.0, 10.0, 4.0, 3.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.372846603393555, -19.630903244018555, -18.888957977294922, -18.147014617919922, -17.405071258544922, -16.663127899169922, -15.921183586120605, -15.179239273071289, -14.437295913696289, -13.695352554321289, -12.953408241271973, -12.211463928222656, -11.469520568847656, -10.727577209472656, -9.98563289642334, -9.243688583374023, -8.501745223999023, -7.759801387786865, -7.017857551574707, -6.275913715362549, -5.533969879150391, -4.792026042938232, -4.050082206726074, -3.308138370513916, -2.566194534301758, -1.8242506980895996, -1.0823068618774414, -0.3403630256652832, 0.401580810546875, 1.1435246467590332, 1.8854684829711914, 2.6274123191833496, 3.3693580627441406, 4.111301898956299, 4.853245735168457, 5.595189571380615, 6.337133407592773, 7.079077243804932, 7.82102108001709, 8.562965393066406, 9.304908752441406, 10.046852111816406, 10.788796424865723, 11.530740737915039, 12.272684097290039, 13.014627456665039, 13.756571769714355, 14.498516082763672, 15.240459442138672, 15.982402801513672, 16.724346160888672, 17.466291427612305, 18.208234786987305, 18.950178146362305, 19.692123413085938, 20.434066772460938, 21.176010131835938, 21.917953491210938, 22.659896850585938, 23.40184211730957, 24.14378547668457, 24.88572883605957, 25.627674102783203, 26.369617462158203, 27.111560821533203]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 5.0, 7.0, 12.0, 14.0, 21.0, 29.0, 55.0, 70.0, 113.0, 203.0, 335.0, 564.0, 1086.0, 1889.0, 3826.0, 8161.0, 18525.0, 47356.0, 146054.0, 409238.0, 273934.0, 83098.0, 29879.0, 12422.0, 5699.0, 2664.0, 1407.0, 807.0, 417.0, 245.0, 148.0, 97.0, 60.0, 32.0, 24.0, 16.0, 12.0, 12.0, 7.0, 4.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.03515625, -2.92962646484375, -2.8240966796875, -2.71856689453125, -2.613037109375, -2.50750732421875, -2.4019775390625, -2.29644775390625, -2.19091796875, -2.08538818359375, -1.9798583984375, -1.87432861328125, -1.768798828125, -1.66326904296875, -1.5577392578125, -1.45220947265625, -1.3466796875, -1.24114990234375, -1.1356201171875, -1.03009033203125, -0.924560546875, -0.81903076171875, -0.7135009765625, -0.60797119140625, -0.50244140625, -0.39691162109375, -0.2913818359375, -0.18585205078125, -0.080322265625, 0.02520751953125, 0.1307373046875, 0.23626708984375, 0.341796875, 0.44732666015625, 0.5528564453125, 0.65838623046875, 0.763916015625, 0.86944580078125, 0.9749755859375, 1.08050537109375, 1.18603515625, 1.29156494140625, 1.3970947265625, 1.50262451171875, 1.608154296875, 1.71368408203125, 1.8192138671875, 1.92474365234375, 2.0302734375, 2.13580322265625, 2.2413330078125, 2.34686279296875, 2.452392578125, 2.55792236328125, 2.6634521484375, 2.76898193359375, 2.87451171875, 2.98004150390625, 3.0855712890625, 3.19110107421875, 3.296630859375, 3.40216064453125, 3.5076904296875, 3.61322021484375, 3.71875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 4.0, 3.0, 7.0, 12.0, 11.0, 12.0, 9.0, 17.0, 17.0, 23.0, 34.0, 28.0, 43.0, 30.0, 36.0, 35.0, 51.0, 48.0, 28.0, 38.0, 45.0, 43.0, 43.0, 45.0, 50.0, 31.0, 35.0, 31.0, 33.0, 29.0, 20.0, 24.0, 18.0, 18.0, 11.0, 8.0, 7.0, 5.0, 6.0, 3.0, 8.0, 6.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4404296875, -1.3857879638671875, -1.331146240234375, -1.2765045166015625, -1.22186279296875, -1.1672210693359375, -1.112579345703125, -1.0579376220703125, -1.0032958984375, -0.9486541748046875, -0.894012451171875, -0.8393707275390625, -0.78472900390625, -0.7300872802734375, -0.675445556640625, -0.6208038330078125, -0.566162109375, -0.5115203857421875, -0.456878662109375, -0.4022369384765625, -0.34759521484375, -0.2929534912109375, -0.238311767578125, -0.1836700439453125, -0.1290283203125, -0.0743865966796875, -0.019744873046875, 0.0348968505859375, 0.08953857421875, 0.1441802978515625, 0.198822021484375, 0.2534637451171875, 0.30810546875, 0.3627471923828125, 0.417388916015625, 0.4720306396484375, 0.52667236328125, 0.5813140869140625, 0.635955810546875, 0.6905975341796875, 0.7452392578125, 0.7998809814453125, 0.854522705078125, 0.9091644287109375, 0.96380615234375, 1.0184478759765625, 1.073089599609375, 1.1277313232421875, 1.182373046875, 1.2370147705078125, 1.291656494140625, 1.3462982177734375, 1.40093994140625, 1.4555816650390625, 1.510223388671875, 1.5648651123046875, 1.6195068359375, 1.6741485595703125, 1.728790283203125, 1.7834320068359375, 1.83807373046875, 1.8927154541015625, 1.947357177734375, 2.0019989013671875, 2.056640625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 3.0, 2.0, 6.0, 8.0, 12.0, 13.0, 17.0, 18.0, 32.0, 38.0, 46.0, 63.0, 105.0, 149.0, 238.0, 355.0, 543.0, 1042.0, 2466.0, 9041.0, 75111.0, 848240.0, 94675.0, 10552.0, 2757.0, 1183.0, 630.0, 383.0, 250.0, 164.0, 121.0, 78.0, 53.0, 30.0, 43.0, 16.0, 17.0, 21.0, 6.0, 8.0, 4.0, 4.0, 6.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.890625, -5.6767578125, -5.462890625, -5.2490234375, -5.03515625, -4.8212890625, -4.607421875, -4.3935546875, -4.1796875, -3.9658203125, -3.751953125, -3.5380859375, -3.32421875, -3.1103515625, -2.896484375, -2.6826171875, -2.46875, -2.2548828125, -2.041015625, -1.8271484375, -1.61328125, -1.3994140625, -1.185546875, -0.9716796875, -0.7578125, -0.5439453125, -0.330078125, -0.1162109375, 0.09765625, 0.3115234375, 0.525390625, 0.7392578125, 0.953125, 1.1669921875, 1.380859375, 1.5947265625, 1.80859375, 2.0224609375, 2.236328125, 2.4501953125, 2.6640625, 2.8779296875, 3.091796875, 3.3056640625, 3.51953125, 3.7333984375, 3.947265625, 4.1611328125, 4.375, 4.5888671875, 4.802734375, 5.0166015625, 5.23046875, 5.4443359375, 5.658203125, 5.8720703125, 6.0859375, 6.2998046875, 6.513671875, 6.7275390625, 6.94140625, 7.1552734375, 7.369140625, 7.5830078125, 7.796875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 2.0, 4.0, 4.0, 2.0, 2.0, 7.0, 6.0, 12.0, 12.0, 18.0, 25.0, 25.0, 27.0, 40.0, 47.0, 43.0, 58.0, 60.0, 41.0, 60.0, 64.0, 62.0, 52.0, 54.0, 42.0, 43.0, 27.0, 35.0, 21.0, 20.0, 19.0, 10.0, 9.0, 12.0, 6.0, 5.0, 10.0, 5.0, 1.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6796875, -6.453125, -6.2265625, -6.0, -5.7734375, -5.546875, -5.3203125, -5.09375, -4.8671875, -4.640625, -4.4140625, -4.1875, -3.9609375, -3.734375, -3.5078125, -3.28125, -3.0546875, -2.828125, -2.6015625, -2.375, -2.1484375, -1.921875, -1.6953125, -1.46875, -1.2421875, -1.015625, -0.7890625, -0.5625, -0.3359375, -0.109375, 0.1171875, 0.34375, 0.5703125, 0.796875, 1.0234375, 1.25, 1.4765625, 1.703125, 1.9296875, 2.15625, 2.3828125, 2.609375, 2.8359375, 3.0625, 3.2890625, 3.515625, 3.7421875, 3.96875, 4.1953125, 4.421875, 4.6484375, 4.875, 5.1015625, 5.328125, 5.5546875, 5.78125, 6.0078125, 6.234375, 6.4609375, 6.6875, 6.9140625, 7.140625, 7.3671875, 7.59375, 7.8203125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 6.0, 5.0, 7.0, 14.0, 11.0, 21.0, 24.0, 43.0, 70.0, 99.0, 222.0, 565.0, 1831.0, 10349.0, 780077.0, 245067.0, 7603.0, 1508.0, 492.0, 193.0, 124.0, 63.0, 51.0, 29.0, 21.0, 12.0, 8.0, 5.0, 9.0, 6.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.599609375, -3.49029541015625, -3.3809814453125, -3.27166748046875, -3.162353515625, -3.05303955078125, -2.9437255859375, -2.83441162109375, -2.72509765625, -2.61578369140625, -2.5064697265625, -2.39715576171875, -2.287841796875, -2.17852783203125, -2.0692138671875, -1.95989990234375, -1.8505859375, -1.74127197265625, -1.6319580078125, -1.52264404296875, -1.413330078125, -1.30401611328125, -1.1947021484375, -1.08538818359375, -0.97607421875, -0.86676025390625, -0.7574462890625, -0.64813232421875, -0.538818359375, -0.42950439453125, -0.3201904296875, -0.21087646484375, -0.1015625, 0.00775146484375, 0.1170654296875, 0.22637939453125, 0.335693359375, 0.44500732421875, 0.5543212890625, 0.66363525390625, 0.77294921875, 0.88226318359375, 0.9915771484375, 1.10089111328125, 1.210205078125, 1.31951904296875, 1.4288330078125, 1.53814697265625, 1.6474609375, 1.75677490234375, 1.8660888671875, 1.97540283203125, 2.084716796875, 2.19403076171875, 2.3033447265625, 2.41265869140625, 2.52197265625, 2.63128662109375, 2.7406005859375, 2.84991455078125, 2.959228515625, 3.06854248046875, 3.1778564453125, 3.28717041015625, 3.396484375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 2.0, 1.0, 2.0, 4.0, 2.0, 5.0, 7.0, 17.0, 19.0, 43.0, 61.0, 92.0, 128.0, 180.0, 133.0, 98.0, 64.0, 40.0, 23.0, 18.0, 11.0, 11.0, 8.0, 3.0, 7.0, 3.0, 6.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00041294097900390625, -0.00039945170283317566, -0.00038596242666244507, -0.0003724731504917145, -0.0003589838743209839, -0.0003454945981502533, -0.0003320053219795227, -0.0003185160458087921, -0.0003050267696380615, -0.00029153749346733093, -0.00027804821729660034, -0.00026455894112586975, -0.00025106966495513916, -0.00023758038878440857, -0.00022409111261367798, -0.0002106018364429474, -0.0001971125602722168, -0.0001836232841014862, -0.00017013400793075562, -0.00015664473176002502, -0.00014315545558929443, -0.00012966617941856384, -0.00011617690324783325, -0.00010268762707710266, -8.919835090637207e-05, -7.570907473564148e-05, -6.221979856491089e-05, -4.87305223941803e-05, -3.524124622344971e-05, -2.1751970052719116e-05, -8.262693881988525e-06, 5.2265822887420654e-06, 1.8715858459472656e-05, 3.220513463020325e-05, 4.569441080093384e-05, 5.918368697166443e-05, 7.267296314239502e-05, 8.616223931312561e-05, 9.96515154838562e-05, 0.00011314079165458679, 0.00012663006782531738, 0.00014011934399604797, 0.00015360862016677856, 0.00016709789633750916, 0.00018058717250823975, 0.00019407644867897034, 0.00020756572484970093, 0.00022105500102043152, 0.0002345442771911621, 0.0002480335533618927, 0.0002615228295326233, 0.0002750121057033539, 0.00028850138187408447, 0.00030199065804481506, 0.00031547993421554565, 0.00032896921038627625, 0.00034245848655700684, 0.0003559477627277374, 0.000369437038898468, 0.0003829263150691986, 0.0003964155912399292, 0.0004099048674106598, 0.0004233941435813904, 0.00043688341975212097, 0.00045037269592285156]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 3.0, 4.0, 8.0, 5.0, 9.0, 14.0, 25.0, 12.0, 25.0, 28.0, 55.0, 67.0, 81.0, 145.0, 186.0, 338.0, 581.0, 1051.0, 2324.0, 5692.0, 16908.0, 75865.0, 726709.0, 173759.0, 29240.0, 8680.0, 3309.0, 1507.0, 747.0, 395.0, 251.0, 154.0, 97.0, 68.0, 52.0, 30.0, 28.0, 21.0, 18.0, 21.0, 13.0, 9.0, 7.0, 5.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-1.3779296875, -1.3370513916015625, -1.296173095703125, -1.2552947998046875, -1.21441650390625, -1.1735382080078125, -1.132659912109375, -1.0917816162109375, -1.0509033203125, -1.0100250244140625, -0.969146728515625, -0.9282684326171875, -0.88739013671875, -0.8465118408203125, -0.805633544921875, -0.7647552490234375, -0.723876953125, -0.6829986572265625, -0.642120361328125, -0.6012420654296875, -0.56036376953125, -0.5194854736328125, -0.478607177734375, -0.4377288818359375, -0.3968505859375, -0.3559722900390625, -0.315093994140625, -0.2742156982421875, -0.23333740234375, -0.1924591064453125, -0.151580810546875, -0.1107025146484375, -0.06982421875, -0.0289459228515625, 0.011932373046875, 0.0528106689453125, 0.09368896484375, 0.1345672607421875, 0.175445556640625, 0.2163238525390625, 0.2572021484375, 0.2980804443359375, 0.338958740234375, 0.3798370361328125, 0.42071533203125, 0.4615936279296875, 0.502471923828125, 0.5433502197265625, 0.584228515625, 0.6251068115234375, 0.665985107421875, 0.7068634033203125, 0.74774169921875, 0.7886199951171875, 0.829498291015625, 0.8703765869140625, 0.9112548828125, 0.9521331787109375, 0.993011474609375, 1.0338897705078125, 1.07476806640625, 1.1156463623046875, 1.156524658203125, 1.1974029541015625, 1.23828125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 0.0, 7.0, 7.0, 5.0, 3.0, 5.0, 8.0, 8.0, 22.0, 17.0, 14.0, 29.0, 41.0, 33.0, 52.0, 77.0, 73.0, 82.0, 94.0, 87.0, 69.0, 47.0, 41.0, 38.0, 32.0, 23.0, 20.0, 13.0, 15.0, 5.0, 4.0, 3.0, 8.0, 4.0, 4.0, 5.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2822265625, -1.2424774169921875, -1.202728271484375, -1.1629791259765625, -1.12322998046875, -1.0834808349609375, -1.043731689453125, -1.0039825439453125, -0.9642333984375, -0.9244842529296875, -0.884735107421875, -0.8449859619140625, -0.80523681640625, -0.7654876708984375, -0.725738525390625, -0.6859893798828125, -0.646240234375, -0.6064910888671875, -0.566741943359375, -0.5269927978515625, -0.48724365234375, -0.4474945068359375, -0.407745361328125, -0.3679962158203125, -0.3282470703125, -0.2884979248046875, -0.248748779296875, -0.2089996337890625, -0.16925048828125, -0.1295013427734375, -0.089752197265625, -0.0500030517578125, -0.01025390625, 0.0294952392578125, 0.069244384765625, 0.1089935302734375, 0.14874267578125, 0.1884918212890625, 0.228240966796875, 0.2679901123046875, 0.3077392578125, 0.3474884033203125, 0.387237548828125, 0.4269866943359375, 0.46673583984375, 0.5064849853515625, 0.546234130859375, 0.5859832763671875, 0.625732421875, 0.6654815673828125, 0.705230712890625, 0.7449798583984375, 0.78472900390625, 0.8244781494140625, 0.864227294921875, 0.9039764404296875, 0.9437255859375, 0.9834747314453125, 1.023223876953125, 1.0629730224609375, 1.10272216796875, 1.1424713134765625, 1.182220458984375, 1.2219696044921875, 1.26171875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 13.0, 63.0, 573.0, 270.0, 63.0, 18.0, 7.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.68977355957031, -51.23076629638672, -47.771759033203125, -44.3127555847168, -40.8537483215332, -37.39474105834961, -33.93573760986328, -30.476730346679688, -27.017723083496094, -23.5587158203125, -20.09971046447754, -16.640705108642578, -13.181697845458984, -9.72269058227539, -6.26368522644043, -2.8046798706054688, 0.654327392578125, 4.113333702087402, 7.57234001159668, 11.031346321105957, 14.490352630615234, 17.949359893798828, 21.40836524963379, 24.86737060546875, 28.326377868652344, 31.785385131835938, 35.24439239501953, 38.70339584350586, 42.16240310668945, 45.62141036987305, 49.080413818359375, 52.53942108154297, 55.99842834472656, 59.457435607910156, 62.91644287109375, 66.37545013427734, 69.83445739746094, 73.29345703125, 76.7524642944336, 80.21147155761719, 83.67047882080078, 87.12948608398438, 90.58849334716797, 94.04750061035156, 97.50650024414062, 100.96551513671875, 104.42451477050781, 107.8835220336914, 111.342529296875, 114.8015365600586, 118.26054382324219, 121.71955108642578, 125.17855834960938, 128.63755798339844, 132.09657287597656, 135.55557250976562, 139.01458740234375, 142.4735870361328, 145.93260192871094, 149.3916015625, 152.85061645507812, 156.3096160888672, 159.7686309814453, 163.22763061523438, 166.68663024902344]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 6.0, 7.0, 5.0, 10.0, 12.0, 13.0, 18.0, 18.0, 29.0, 19.0, 31.0, 39.0, 34.0, 39.0, 58.0, 127.0, 163.0, 66.0, 42.0, 38.0, 34.0, 35.0, 26.0, 25.0, 16.0, 18.0, 12.0, 15.0, 9.0, 11.0, 8.0, 7.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-33.54973602294922, -32.61933135986328, -31.688922882080078, -30.75851821899414, -29.82811164855957, -28.897705078125, -27.96729850769043, -27.03689193725586, -26.106487274169922, -25.17608070373535, -24.24567413330078, -23.315269470214844, -22.384862899780273, -21.454456329345703, -20.524049758911133, -19.593643188476562, -18.663236618041992, -17.732830047607422, -16.80242347717285, -15.872017860412598, -14.941612243652344, -14.011205673217773, -13.080799102783203, -12.150392532348633, -11.219986915588379, -10.289580345153809, -9.359174728393555, -8.428768157958984, -7.498362064361572, -6.56795597076416, -5.63754940032959, -4.707143306732178, -3.7767391204833984, -2.8463330268859863, -1.9159266948699951, -0.9855203628540039, -0.0551142692565918, 0.8752918243408203, 1.8056983947753906, 2.7361044883728027, 3.666510581970215, 4.596916675567627, 5.527322769165039, 6.457729339599609, 7.3881354331970215, 8.318541526794434, 9.248948097229004, 10.179353713989258, 11.109760284423828, 12.040166854858398, 12.970572471618652, 13.900979042053223, 14.831384658813477, 15.761791229248047, 16.692197799682617, 17.622604370117188, 18.553009033203125, 19.483415603637695, 20.413822174072266, 21.344226837158203, 22.274633407592773, 23.205039978027344, 24.135446548461914, 25.065853118896484, 25.996259689331055]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 11.0, 13.0, 14.0, 10.0, 19.0, 47.0, 53.0, 108.0, 154.0, 300.0, 584.0, 1141.0, 2549.0, 6865.0, 23090.0, 134455.0, 1011399.0, 2336302.0, 579223.0, 73992.0, 15038.0, 4846.0, 2057.0, 901.0, 458.0, 297.0, 152.0, 77.0, 51.0, 27.0, 20.0, 5.0, 7.0, 6.0, 2.0, 2.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5859375, -3.4715576171875, -3.357177734375, -3.2427978515625, -3.12841796875, -3.0140380859375, -2.899658203125, -2.7852783203125, -2.6708984375, -2.5565185546875, -2.442138671875, -2.3277587890625, -2.21337890625, -2.0989990234375, -1.984619140625, -1.8702392578125, -1.755859375, -1.6414794921875, -1.527099609375, -1.4127197265625, -1.29833984375, -1.1839599609375, -1.069580078125, -0.9552001953125, -0.8408203125, -0.7264404296875, -0.612060546875, -0.4976806640625, -0.38330078125, -0.2689208984375, -0.154541015625, -0.0401611328125, 0.07421875, 0.1885986328125, 0.302978515625, 0.4173583984375, 0.53173828125, 0.6461181640625, 0.760498046875, 0.8748779296875, 0.9892578125, 1.1036376953125, 1.218017578125, 1.3323974609375, 1.44677734375, 1.5611572265625, 1.675537109375, 1.7899169921875, 1.904296875, 2.0186767578125, 2.133056640625, 2.2474365234375, 2.36181640625, 2.4761962890625, 2.590576171875, 2.7049560546875, 2.8193359375, 2.9337158203125, 3.048095703125, 3.1624755859375, 3.27685546875, 3.3912353515625, 3.505615234375, 3.6199951171875, 3.734375]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 11.0, 5.0, 8.0, 11.0, 11.0, 5.0, 14.0, 18.0, 16.0, 22.0, 26.0, 25.0, 29.0, 31.0, 29.0, 34.0, 51.0, 35.0, 33.0, 40.0, 42.0, 48.0, 46.0, 44.0, 34.0, 39.0, 35.0, 26.0, 24.0, 29.0, 28.0, 22.0, 27.0, 21.0, 11.0, 15.0, 7.0, 15.0, 10.0, 3.0, 5.0, 6.0, 2.0, 4.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3017578125, -1.25518798828125, -1.2086181640625, -1.16204833984375, -1.115478515625, -1.06890869140625, -1.0223388671875, -0.97576904296875, -0.92919921875, -0.88262939453125, -0.8360595703125, -0.78948974609375, -0.742919921875, -0.69635009765625, -0.6497802734375, -0.60321044921875, -0.556640625, -0.51007080078125, -0.4635009765625, -0.41693115234375, -0.370361328125, -0.32379150390625, -0.2772216796875, -0.23065185546875, -0.18408203125, -0.13751220703125, -0.0909423828125, -0.04437255859375, 0.002197265625, 0.04876708984375, 0.0953369140625, 0.14190673828125, 0.1884765625, 0.23504638671875, 0.2816162109375, 0.32818603515625, 0.374755859375, 0.42132568359375, 0.4678955078125, 0.51446533203125, 0.56103515625, 0.60760498046875, 0.6541748046875, 0.70074462890625, 0.747314453125, 0.79388427734375, 0.8404541015625, 0.88702392578125, 0.93359375, 0.98016357421875, 1.0267333984375, 1.07330322265625, 1.119873046875, 1.16644287109375, 1.2130126953125, 1.25958251953125, 1.30615234375, 1.35272216796875, 1.3992919921875, 1.44586181640625, 1.492431640625, 1.53900146484375, 1.5855712890625, 1.63214111328125, 1.6787109375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 8.0, 8.0, 4.0, 10.0, 19.0, 27.0, 61.0, 75.0, 131.0, 240.0, 434.0, 859.0, 2447.0, 9639.0, 167787.0, 3924350.0, 77648.0, 7031.0, 1870.0, 814.0, 362.0, 185.0, 110.0, 64.0, 30.0, 24.0, 17.0, 13.0, 7.0, 8.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.34375, -9.0260009765625, -8.708251953125, -8.3905029296875, -8.07275390625, -7.7550048828125, -7.437255859375, -7.1195068359375, -6.8017578125, -6.4840087890625, -6.166259765625, -5.8485107421875, -5.53076171875, -5.2130126953125, -4.895263671875, -4.5775146484375, -4.259765625, -3.9420166015625, -3.624267578125, -3.3065185546875, -2.98876953125, -2.6710205078125, -2.353271484375, -2.0355224609375, -1.7177734375, -1.4000244140625, -1.082275390625, -0.7645263671875, -0.44677734375, -0.1290283203125, 0.188720703125, 0.5064697265625, 0.82421875, 1.1419677734375, 1.459716796875, 1.7774658203125, 2.09521484375, 2.4129638671875, 2.730712890625, 3.0484619140625, 3.3662109375, 3.6839599609375, 4.001708984375, 4.3194580078125, 4.63720703125, 4.9549560546875, 5.272705078125, 5.5904541015625, 5.908203125, 6.2259521484375, 6.543701171875, 6.8614501953125, 7.17919921875, 7.4969482421875, 7.814697265625, 8.1324462890625, 8.4501953125, 8.7679443359375, 9.085693359375, 9.4034423828125, 9.72119140625, 10.0389404296875, 10.356689453125, 10.6744384765625, 10.9921875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 4.0, 7.0, 13.0, 10.0, 31.0, 34.0, 26.0, 63.0, 91.0, 165.0, 226.0, 315.0, 488.0, 624.0, 620.0, 477.0, 301.0, 182.0, 126.0, 97.0, 53.0, 36.0, 25.0, 21.0, 15.0, 11.0, 6.0, 4.0, 4.0, 1.0, 1.0, 5.0, 1.0], "bins": [-9.1328125, -8.92889404296875, -8.7249755859375, -8.52105712890625, -8.317138671875, -8.11322021484375, -7.9093017578125, -7.70538330078125, -7.50146484375, -7.29754638671875, -7.0936279296875, -6.88970947265625, -6.685791015625, -6.48187255859375, -6.2779541015625, -6.07403564453125, -5.8701171875, -5.66619873046875, -5.4622802734375, -5.25836181640625, -5.054443359375, -4.85052490234375, -4.6466064453125, -4.44268798828125, -4.23876953125, -4.03485107421875, -3.8309326171875, -3.62701416015625, -3.423095703125, -3.21917724609375, -3.0152587890625, -2.81134033203125, -2.607421875, -2.40350341796875, -2.1995849609375, -1.99566650390625, -1.791748046875, -1.58782958984375, -1.3839111328125, -1.17999267578125, -0.97607421875, -0.77215576171875, -0.5682373046875, -0.36431884765625, -0.160400390625, 0.04351806640625, 0.2474365234375, 0.45135498046875, 0.6552734375, 0.85919189453125, 1.0631103515625, 1.26702880859375, 1.470947265625, 1.67486572265625, 1.8787841796875, 2.08270263671875, 2.28662109375, 2.49053955078125, 2.6944580078125, 2.89837646484375, 3.102294921875, 3.30621337890625, 3.5101318359375, 3.71405029296875, 3.91796875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 7.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 2.0, 13.0, 10.0, 17.0, 68.0, 128.0, 232.0, 237.0, 136.0, 70.0, 34.0, 18.0, 10.0, 6.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-90.29667663574219, -87.48090362548828, -84.66513061523438, -81.84935760498047, -79.03358459472656, -76.21781158447266, -73.40203857421875, -70.58627319335938, -67.77049255371094, -64.95471954345703, -62.138946533203125, -59.32317352294922, -56.50740051269531, -53.691627502441406, -50.875858306884766, -48.06008529663086, -45.24431610107422, -42.42854309082031, -39.612770080566406, -36.7969970703125, -33.981224060058594, -31.16545295715332, -28.349681854248047, -25.53390884399414, -22.718135833740234, -19.902362823486328, -17.086589813232422, -14.270818710327148, -11.455045700073242, -8.639272689819336, -5.8235015869140625, -3.0077285766601562, -0.19196319580078125, 2.623809337615967, 5.439581871032715, 8.255353927612305, 11.071126937866211, 13.886899948120117, 16.70267105102539, 19.518444061279297, 22.334217071533203, 25.14999008178711, 27.965763092041016, 30.78153419494629, 33.59730529785156, 36.41307830810547, 39.228851318359375, 42.04462432861328, 44.86039733886719, 47.676170349121094, 50.491943359375, 53.307716369628906, 56.12348937988281, 58.93926239013672, 61.75503158569336, 64.57080078125, 67.38658142089844, 70.20235443115234, 73.01812744140625, 75.83390045166016, 78.64967346191406, 81.46544647216797, 84.28121948242188, 87.09698486328125, 89.91275787353516]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 5.0, 10.0, 19.0, 20.0, 27.0, 30.0, 33.0, 36.0, 32.0, 39.0, 69.0, 64.0, 103.0, 82.0, 76.0, 60.0, 57.0, 54.0, 38.0, 31.0, 36.0, 24.0, 16.0, 10.0, 10.0, 5.0, 4.0, 5.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-42.76939392089844, -41.46943283081055, -40.169471740722656, -38.86951446533203, -37.56955337524414, -36.26959228515625, -34.969635009765625, -33.669673919677734, -32.369712829589844, -31.069751739501953, -29.769792556762695, -28.469833374023438, -27.169872283935547, -25.869911193847656, -24.5699520111084, -23.26999282836914, -21.97003173828125, -20.67007064819336, -19.3701114654541, -18.070152282714844, -16.770191192626953, -15.470231056213379, -14.170270919799805, -12.87031078338623, -11.570350646972656, -10.270390510559082, -8.970430374145508, -7.670470237731934, -6.370510101318359, -5.070549964904785, -3.770589828491211, -2.4706296920776367, -1.1706657409667969, 0.12929439544677734, 1.4292545318603516, 2.729214668273926, 4.0291748046875, 5.329134941101074, 6.629095077514648, 7.929055213928223, 9.229015350341797, 10.528975486755371, 11.828935623168945, 13.12889575958252, 14.428855895996094, 15.728816032409668, 17.028776168823242, 18.3287353515625, 19.62869644165039, 20.92865753173828, 22.22861671447754, 23.528575897216797, 24.828536987304688, 26.128498077392578, 27.428457260131836, 28.728416442871094, 30.028377532958984, 31.328338623046875, 32.6282958984375, 33.92825698852539, 35.22821807861328, 36.52817916870117, 37.82814025878906, 39.12809753417969, 40.42805862426758]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 6.0, 10.0, 10.0, 8.0, 18.0, 21.0, 37.0, 58.0, 87.0, 132.0, 291.0, 538.0, 1088.0, 2293.0, 5170.0, 13769.0, 50054.0, 276955.0, 583433.0, 81618.0, 20408.0, 6815.0, 2829.0, 1364.0, 653.0, 341.0, 202.0, 115.0, 87.0, 42.0, 30.0, 20.0, 16.0, 13.0, 4.0, 2.0, 4.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.669921875, -3.555816650390625, -3.44171142578125, -3.327606201171875, -3.2135009765625, -3.099395751953125, -2.98529052734375, -2.871185302734375, -2.757080078125, -2.642974853515625, -2.52886962890625, -2.414764404296875, -2.3006591796875, -2.186553955078125, -2.07244873046875, -1.958343505859375, -1.84423828125, -1.730133056640625, -1.61602783203125, -1.501922607421875, -1.3878173828125, -1.273712158203125, -1.15960693359375, -1.045501708984375, -0.931396484375, -0.817291259765625, -0.70318603515625, -0.589080810546875, -0.4749755859375, -0.360870361328125, -0.24676513671875, -0.132659912109375, -0.0185546875, 0.095550537109375, 0.20965576171875, 0.323760986328125, 0.4378662109375, 0.551971435546875, 0.66607666015625, 0.780181884765625, 0.894287109375, 1.008392333984375, 1.12249755859375, 1.236602783203125, 1.3507080078125, 1.464813232421875, 1.57891845703125, 1.693023681640625, 1.80712890625, 1.921234130859375, 2.03533935546875, 2.149444580078125, 2.2635498046875, 2.377655029296875, 2.49176025390625, 2.605865478515625, 2.719970703125, 2.834075927734375, 2.94818115234375, 3.062286376953125, 3.1763916015625, 3.290496826171875, 3.40460205078125, 3.518707275390625, 3.6328125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 7.0, 7.0, 9.0, 19.0, 16.0, 23.0, 34.0, 29.0, 40.0, 50.0, 75.0, 50.0, 69.0, 72.0, 76.0, 70.0, 63.0, 56.0, 34.0, 39.0, 35.0, 37.0, 33.0, 18.0, 10.0, 11.0, 11.0, 6.0, 4.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.283203125, -2.19915771484375, -2.1151123046875, -2.03106689453125, -1.947021484375, -1.86297607421875, -1.7789306640625, -1.69488525390625, -1.61083984375, -1.52679443359375, -1.4427490234375, -1.35870361328125, -1.274658203125, -1.19061279296875, -1.1065673828125, -1.02252197265625, -0.9384765625, -0.85443115234375, -0.7703857421875, -0.68634033203125, -0.602294921875, -0.51824951171875, -0.4342041015625, -0.35015869140625, -0.26611328125, -0.18206787109375, -0.0980224609375, -0.01397705078125, 0.070068359375, 0.15411376953125, 0.2381591796875, 0.32220458984375, 0.40625, 0.49029541015625, 0.5743408203125, 0.65838623046875, 0.742431640625, 0.82647705078125, 0.9105224609375, 0.99456787109375, 1.07861328125, 1.16265869140625, 1.2467041015625, 1.33074951171875, 1.414794921875, 1.49884033203125, 1.5828857421875, 1.66693115234375, 1.7509765625, 1.83502197265625, 1.9190673828125, 2.00311279296875, 2.087158203125, 2.17120361328125, 2.2552490234375, 2.33929443359375, 2.42333984375, 2.50738525390625, 2.5914306640625, 2.67547607421875, 2.759521484375, 2.84356689453125, 2.9276123046875, 3.01165771484375, 3.095703125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 8.0, 5.0, 17.0, 13.0, 27.0, 32.0, 52.0, 42.0, 93.0, 158.0, 253.0, 439.0, 951.0, 2688.0, 13612.0, 208245.0, 796303.0, 19853.0, 3434.0, 1098.0, 482.0, 235.0, 164.0, 105.0, 56.0, 48.0, 33.0, 33.0, 28.0, 8.0, 5.0, 8.0, 3.0, 5.0, 5.0, 1.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.38671875, -4.23590087890625, -4.0850830078125, -3.93426513671875, -3.783447265625, -3.63262939453125, -3.4818115234375, -3.33099365234375, -3.18017578125, -3.02935791015625, -2.8785400390625, -2.72772216796875, -2.576904296875, -2.42608642578125, -2.2752685546875, -2.12445068359375, -1.9736328125, -1.82281494140625, -1.6719970703125, -1.52117919921875, -1.370361328125, -1.21954345703125, -1.0687255859375, -0.91790771484375, -0.76708984375, -0.61627197265625, -0.4654541015625, -0.31463623046875, -0.163818359375, -0.01300048828125, 0.1378173828125, 0.28863525390625, 0.439453125, 0.59027099609375, 0.7410888671875, 0.89190673828125, 1.042724609375, 1.19354248046875, 1.3443603515625, 1.49517822265625, 1.64599609375, 1.79681396484375, 1.9476318359375, 2.09844970703125, 2.249267578125, 2.40008544921875, 2.5509033203125, 2.70172119140625, 2.8525390625, 3.00335693359375, 3.1541748046875, 3.30499267578125, 3.455810546875, 3.60662841796875, 3.7574462890625, 3.90826416015625, 4.05908203125, 4.20989990234375, 4.3607177734375, 4.51153564453125, 4.662353515625, 4.81317138671875, 4.9639892578125, 5.11480712890625, 5.265625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 3.0, 7.0, 7.0, 5.0, 7.0, 9.0, 11.0, 12.0, 9.0, 20.0, 24.0, 26.0, 36.0, 40.0, 49.0, 64.0, 83.0, 87.0, 80.0, 72.0, 78.0, 50.0, 42.0, 37.0, 23.0, 25.0, 15.0, 19.0, 17.0, 13.0, 8.0, 4.0, 5.0, 7.0, 5.0, 1.0, 1.0, 1.0, 7.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.078125, -8.8037109375, -8.529296875, -8.2548828125, -7.98046875, -7.7060546875, -7.431640625, -7.1572265625, -6.8828125, -6.6083984375, -6.333984375, -6.0595703125, -5.78515625, -5.5107421875, -5.236328125, -4.9619140625, -4.6875, -4.4130859375, -4.138671875, -3.8642578125, -3.58984375, -3.3154296875, -3.041015625, -2.7666015625, -2.4921875, -2.2177734375, -1.943359375, -1.6689453125, -1.39453125, -1.1201171875, -0.845703125, -0.5712890625, -0.296875, -0.0224609375, 0.251953125, 0.5263671875, 0.80078125, 1.0751953125, 1.349609375, 1.6240234375, 1.8984375, 2.1728515625, 2.447265625, 2.7216796875, 2.99609375, 3.2705078125, 3.544921875, 3.8193359375, 4.09375, 4.3681640625, 4.642578125, 4.9169921875, 5.19140625, 5.4658203125, 5.740234375, 6.0146484375, 6.2890625, 6.5634765625, 6.837890625, 7.1123046875, 7.38671875, 7.6611328125, 7.935546875, 8.2099609375, 8.484375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 2.0, 3.0, 4.0, 6.0, 4.0, 7.0, 7.0, 14.0, 30.0, 19.0, 40.0, 76.0, 73.0, 121.0, 185.0, 330.0, 620.0, 1246.0, 3351.0, 11720.0, 61755.0, 869864.0, 78132.0, 13934.0, 3901.0, 1461.0, 712.0, 345.0, 197.0, 111.0, 96.0, 53.0, 32.0, 24.0, 21.0, 8.0, 11.0, 6.0, 6.0, 7.0, 2.0, 1.0, 3.0, 5.0, 2.0, 3.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.60791015625, -0.5886459350585938, -0.5693817138671875, -0.5501174926757812, -0.530853271484375, -0.5115890502929688, -0.4923248291015625, -0.47306060791015625, -0.45379638671875, -0.43453216552734375, -0.4152679443359375, -0.39600372314453125, -0.376739501953125, -0.35747528076171875, -0.3382110595703125, -0.31894683837890625, -0.2996826171875, -0.28041839599609375, -0.2611541748046875, -0.24188995361328125, -0.222625732421875, -0.20336151123046875, -0.1840972900390625, -0.16483306884765625, -0.14556884765625, -0.12630462646484375, -0.1070404052734375, -0.08777618408203125, -0.068511962890625, -0.04924774169921875, -0.0299835205078125, -0.01071929931640625, 0.008544921875, 0.02780914306640625, 0.0470733642578125, 0.06633758544921875, 0.085601806640625, 0.10486602783203125, 0.1241302490234375, 0.14339447021484375, 0.16265869140625, 0.18192291259765625, 0.2011871337890625, 0.22045135498046875, 0.239715576171875, 0.25897979736328125, 0.2782440185546875, 0.29750823974609375, 0.3167724609375, 0.33603668212890625, 0.3553009033203125, 0.37456512451171875, 0.393829345703125, 0.41309356689453125, 0.4323577880859375, 0.45162200927734375, 0.47088623046875, 0.49015045166015625, 0.5094146728515625, 0.5286788940429688, 0.547943115234375, 0.5672073364257812, 0.5864715576171875, 0.6057357788085938, 0.625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 4.0, 4.0, 5.0, 7.0, 16.0, 7.0, 14.0, 17.0, 13.0, 20.0, 23.0, 27.0, 34.0, 51.0, 57.0, 79.0, 106.0, 97.0, 84.0, 77.0, 61.0, 38.0, 37.0, 26.0, 15.0, 15.0, 13.0, 9.0, 11.0, 4.0, 7.0, 6.0, 3.0, 4.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.00013077259063720703, -0.00012726150453090668, -0.00012375041842460632, -0.00012023933231830597, -0.00011672824621200562, -0.00011321716010570526, -0.00010970607399940491, -0.00010619498789310455, -0.0001026839017868042, -9.917281568050385e-05, -9.566172957420349e-05, -9.215064346790314e-05, -8.863955736160278e-05, -8.512847125530243e-05, -8.161738514900208e-05, -7.810629904270172e-05, -7.459521293640137e-05, -7.108412683010101e-05, -6.757304072380066e-05, -6.40619546175003e-05, -6.055086851119995e-05, -5.70397824048996e-05, -5.352869629859924e-05, -5.001761019229889e-05, -4.6506524085998535e-05, -4.299543797969818e-05, -3.948435187339783e-05, -3.597326576709747e-05, -3.246217966079712e-05, -2.8951093554496765e-05, -2.544000744819641e-05, -2.1928921341896057e-05, -1.8417835235595703e-05, -1.4906749129295349e-05, -1.1395663022994995e-05, -7.884576916694641e-06, -4.373490810394287e-06, -8.624047040939331e-07, 2.648681402206421e-06, 6.159767508506775e-06, 9.670853614807129e-06, 1.3181939721107483e-05, 1.6693025827407837e-05, 2.020411193370819e-05, 2.3715198040008545e-05, 2.72262841463089e-05, 3.073737025260925e-05, 3.424845635890961e-05, 3.775954246520996e-05, 4.1270628571510315e-05, 4.478171467781067e-05, 4.829280078411102e-05, 5.180388689041138e-05, 5.531497299671173e-05, 5.8826059103012085e-05, 6.233714520931244e-05, 6.584823131561279e-05, 6.935931742191315e-05, 7.28704035282135e-05, 7.638148963451385e-05, 7.989257574081421e-05, 8.340366184711456e-05, 8.691474795341492e-05, 9.042583405971527e-05, 9.393692016601562e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 5.0, 5.0, 3.0, 6.0, 15.0, 16.0, 20.0, 35.0, 52.0, 89.0, 111.0, 189.0, 347.0, 584.0, 1145.0, 2252.0, 4989.0, 13080.0, 44336.0, 720181.0, 206869.0, 34729.0, 10901.0, 4320.0, 1889.0, 1033.0, 495.0, 297.0, 205.0, 108.0, 77.0, 47.0, 37.0, 30.0, 21.0, 13.0, 4.0, 6.0, 3.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.53515625, -0.5193748474121094, -0.5035934448242188, -0.4878120422363281, -0.4720306396484375, -0.4562492370605469, -0.44046783447265625, -0.4246864318847656, -0.408905029296875, -0.3931236267089844, -0.37734222412109375, -0.3615608215332031, -0.3457794189453125, -0.3299980163574219, -0.31421661376953125, -0.2984352111816406, -0.28265380859375, -0.2668724060058594, -0.25109100341796875, -0.23530960083007812, -0.2195281982421875, -0.20374679565429688, -0.18796539306640625, -0.17218399047851562, -0.156402587890625, -0.14062118530273438, -0.12483978271484375, -0.10905838012695312, -0.0932769775390625, -0.07749557495117188, -0.06171417236328125, -0.045932769775390625, -0.0301513671875, -0.014369964599609375, 0.00141143798828125, 0.017192840576171875, 0.0329742431640625, 0.048755645751953125, 0.06453704833984375, 0.08031845092773438, 0.096099853515625, 0.11188125610351562, 0.12766265869140625, 0.14344406127929688, 0.1592254638671875, 0.17500686645507812, 0.19078826904296875, 0.20656967163085938, 0.22235107421875, 0.23813247680664062, 0.25391387939453125, 0.2696952819824219, 0.2854766845703125, 0.3012580871582031, 0.31703948974609375, 0.3328208923339844, 0.348602294921875, 0.3643836975097656, 0.38016510009765625, 0.3959465026855469, 0.4117279052734375, 0.4275093078613281, 0.44329071044921875, 0.4590721130371094, 0.474853515625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 1.0, 4.0, 2.0, 6.0, 5.0, 6.0, 12.0, 13.0, 15.0, 22.0, 18.0, 35.0, 45.0, 55.0, 67.0, 90.0, 102.0, 83.0, 86.0, 76.0, 54.0, 43.0, 27.0, 27.0, 16.0, 16.0, 16.0, 8.0, 10.0, 12.0, 9.0, 5.0, 4.0, 4.0, 3.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62744140625, -0.6095657348632812, -0.5916900634765625, -0.5738143920898438, -0.555938720703125, -0.5380630493164062, -0.5201873779296875, -0.5023117065429688, -0.48443603515625, -0.46656036376953125, -0.4486846923828125, -0.43080902099609375, -0.412933349609375, -0.39505767822265625, -0.3771820068359375, -0.35930633544921875, -0.3414306640625, -0.32355499267578125, -0.3056793212890625, -0.28780364990234375, -0.269927978515625, -0.25205230712890625, -0.2341766357421875, -0.21630096435546875, -0.19842529296875, -0.18054962158203125, -0.1626739501953125, -0.14479827880859375, -0.126922607421875, -0.10904693603515625, -0.0911712646484375, -0.07329559326171875, -0.055419921875, -0.03754425048828125, -0.0196685791015625, -0.00179290771484375, 0.016082763671875, 0.03395843505859375, 0.0518341064453125, 0.06970977783203125, 0.08758544921875, 0.10546112060546875, 0.1233367919921875, 0.14121246337890625, 0.159088134765625, 0.17696380615234375, 0.1948394775390625, 0.21271514892578125, 0.2305908203125, 0.24846649169921875, 0.2663421630859375, 0.28421783447265625, 0.302093505859375, 0.31996917724609375, 0.3378448486328125, 0.35572052001953125, 0.37359619140625, 0.39147186279296875, 0.4093475341796875, 0.42722320556640625, 0.445098876953125, 0.46297454833984375, 0.4808502197265625, 0.49872589111328125, 0.5166015625]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 7.0, 7.0, 12.0, 22.0, 43.0, 78.0, 420.0, 224.0, 82.0, 48.0, 26.0, 13.0, 6.0, 13.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.276588439941406, -21.302501678466797, -20.328414916992188, -19.354328155517578, -18.38024139404297, -17.40615463256836, -16.43206787109375, -15.457982063293457, -14.483895301818848, -13.509808540344238, -12.535721778869629, -11.561635971069336, -10.587549209594727, -9.613462448120117, -8.639375686645508, -7.665288925170898, -6.691202163696289, -5.71711540222168, -4.74302864074707, -3.768942356109619, -2.7948555946350098, -1.8207688331604004, -0.8466825485229492, 0.12740421295166016, 1.1014909744262695, 2.075577735900879, 3.049664258956909, 4.0237507820129395, 4.997837543487549, 5.971924304962158, 6.946010589599609, 7.920097351074219, 8.894184112548828, 9.868270874023438, 10.842357635498047, 11.816444396972656, 12.790531158447266, 13.764617919921875, 14.738703727722168, 15.712790489196777, 16.686878204345703, 17.660964965820312, 18.635051727294922, 19.60913848876953, 20.58322525024414, 21.55731201171875, 22.53139877319336, 23.50548553466797, 24.479570388793945, 25.453657150268555, 26.427743911743164, 27.401830673217773, 28.375917434692383, 29.350004196166992, 30.32408905029297, 31.298175811767578, 32.27226257324219, 33.2463493347168, 34.220436096191406, 35.194522857666016, 36.168609619140625, 37.142696380615234, 38.116783142089844, 39.09086990356445, 40.06495666503906]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 5.0, 3.0, 2.0, 10.0, 9.0, 10.0, 10.0, 19.0, 21.0, 27.0, 29.0, 25.0, 37.0, 69.0, 260.0, 197.0, 47.0, 28.0, 34.0, 31.0, 23.0, 17.0, 16.0, 15.0, 11.0, 9.0, 10.0, 8.0, 3.0, 7.0, 2.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-30.47252082824707, -29.70720863342285, -28.941896438598633, -28.176584243774414, -27.411272048950195, -26.645959854125977, -25.88064956665039, -25.115337371826172, -24.350025177001953, -23.584712982177734, -22.819400787353516, -22.054088592529297, -21.288776397705078, -20.52346420288086, -19.75815200805664, -18.992839813232422, -18.227527618408203, -17.462215423583984, -16.696903228759766, -15.931591033935547, -15.166278839111328, -14.40096664428711, -13.635655403137207, -12.870343208312988, -12.10503101348877, -11.33971881866455, -10.574406623840332, -9.80909538269043, -9.043783187866211, -8.278470993041992, -7.513158798217773, -6.747846603393555, -5.982532501220703, -5.217220306396484, -4.451908111572266, -3.686596393585205, -2.9212841987609863, -2.1559720039367676, -1.390660285949707, -0.6253480911254883, 0.13996410369873047, 0.9052761793136597, 1.6705882549285889, 2.4359002113342285, 3.2012124061584473, 3.966524600982666, 4.731836318969727, 5.497148513793945, 6.262460708618164, 7.027772903442383, 7.793085098266602, 8.55839729309082, 9.323709487915039, 10.089021682739258, 10.85433292388916, 11.619645118713379, 12.384957313537598, 13.150269508361816, 13.915581703186035, 14.680892944335938, 15.446205139160156, 16.211517333984375, 16.976829528808594, 17.742141723632812, 18.50745391845703]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 6.0, 6.0, 5.0, 15.0, 14.0, 16.0, 17.0, 21.0, 18.0, 25.0, 30.0, 35.0, 53.0, 86.0, 284.0, 91.0, 48.0, 37.0, 39.0, 27.0, 24.0, 30.0, 10.0, 7.0, 9.0, 13.0, 9.0, 7.0, 8.0, 5.0, 7.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.89453125, -2.8213043212890625, -2.748077392578125, -2.6748504638671875, -2.60162353515625, -2.5283966064453125, -2.455169677734375, -2.3819427490234375, -2.3087158203125, -2.2354888916015625, -2.162261962890625, -2.0890350341796875, -2.01580810546875, -1.9425811767578125, -1.869354248046875, -1.7961273193359375, -1.722900390625, -1.6496734619140625, -1.576446533203125, -1.5032196044921875, -1.42999267578125, -1.3567657470703125, -1.283538818359375, -1.2103118896484375, -1.1370849609375, -1.0638580322265625, -0.990631103515625, -0.9174041748046875, -0.84417724609375, -0.7709503173828125, -0.697723388671875, -0.6244964599609375, -0.55126953125, -0.4780426025390625, -0.404815673828125, -0.3315887451171875, -0.25836181640625, -0.1851348876953125, -0.111907958984375, -0.0386810302734375, 0.0345458984375, 0.1077728271484375, 0.180999755859375, 0.2542266845703125, 0.32745361328125, 0.4006805419921875, 0.473907470703125, 0.5471343994140625, 0.620361328125, 0.6935882568359375, 0.766815185546875, 0.8400421142578125, 0.91326904296875, 0.9864959716796875, 1.059722900390625, 1.1329498291015625, 1.2061767578125, 1.2794036865234375, 1.352630615234375, 1.4258575439453125, 1.49908447265625, 1.5723114013671875, 1.645538330078125, 1.7187652587890625, 1.7919921875]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 4.0, 8.0, 8.0, 18.0, 29.0, 31.0, 46.0, 75.0, 140.0, 299.0, 980.0, 3836.0, 32154.0, 8337489.0, 10193.0, 2070.0, 611.0, 229.0, 125.0, 68.0, 59.0, 34.0, 14.0, 12.0, 10.0, 2.0, 5.0, 3.0, 4.0, 1.0, 1.0, 0.0, 2.0, 6.0, 6.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.528486251831055, -22.821603775024414, -22.11471939086914, -21.4078369140625, -20.70095443725586, -19.99407196044922, -19.287189483642578, -18.580305099487305, -17.873422622680664, -17.166540145874023, -16.45965576171875, -15.75277328491211, -15.045890808105469, -14.339008331298828, -13.632124900817871, -12.925241470336914, -12.218358993530273, -11.511476516723633, -10.804593086242676, -10.097709655761719, -9.390827178955078, -8.683944702148438, -7.9770612716674805, -7.270178318023682, -6.563295364379883, -5.856412410736084, -5.149529457092285, -4.442646503448486, -3.7357635498046875, -3.0288805961608887, -2.32199764251709, -1.615114688873291, -0.9082298278808594, -0.20134687423706055, 0.5055360794067383, 1.212419033050537, 1.919301986694336, 2.6261849403381348, 3.3330678939819336, 4.039950847625732, 4.746833801269531, 5.45371675491333, 6.160599708557129, 6.867482662200928, 7.574365615844727, 8.281248092651367, 8.988131523132324, 9.695014953613281, 10.401897430419922, 11.108779907226562, 11.81566333770752, 12.522546768188477, 13.229429244995117, 13.936311721801758, 14.643195152282715, 15.350078582763672, 16.056961059570312, 16.763843536376953, 17.470726013183594, 18.177610397338867, 18.884492874145508, 19.59137535095215, 20.298259735107422, 21.005142211914062, 21.712024688720703]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 4.0, 5.0, 4.0, 3.0, 4.0, 4.0, 3.0, 7.0, 3.0, 8.0, 7.0, 3.0, 6.0, 4.0, 2.0, 3.0, 5.0, 4.0, 2.0, 3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-34.96721267700195, -33.76334762573242, -32.559486389160156, -31.355623245239258, -30.15176010131836, -28.947895050048828, -27.74403190612793, -26.54016876220703, -25.336305618286133, -24.132442474365234, -22.928579330444336, -21.724716186523438, -20.520851135253906, -19.31698989868164, -18.11312484741211, -16.90926170349121, -15.705398559570312, -14.501535415649414, -13.297672271728516, -12.0938081741333, -10.889945030212402, -9.686081886291504, -8.482217788696289, -7.278354644775391, -6.074491500854492, -4.870628356933594, -3.666764736175537, -2.4629013538360596, -1.259037971496582, -0.055174827575683594, 1.148688793182373, 2.3525524139404297, 3.5564193725585938, 4.760282516479492, 5.964146137237549, 7.1680097579956055, 8.371872901916504, 9.575736045837402, 10.779600143432617, 11.983463287353516, 13.187326431274414, 14.391189575195312, 15.595052719116211, 16.79891586303711, 18.00278091430664, 19.206642150878906, 20.410507202148438, 21.614370346069336, 22.818233489990234, 24.022096633911133, 25.22595977783203, 26.42982292175293, 27.633686065673828, 28.83755111694336, 30.041414260864258, 31.245277404785156, 32.44914245605469, 33.65300750732422, 34.856868743896484, 36.060733795166016, 37.26459503173828, 38.46846008300781, 39.67232131958008, 40.87618637084961, 42.080047607421875]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 8.0, 9.0, 6.0, 8.0, 14.0, 20.0, 39.0, 42.0, 54.0, 89.0, 108.0, 203.0, 297.0, 579.0, 1217.0, 3338.0, 10502.0, 40830.0, 163389.0, 218609.0, 61467.0, 15723.0, 4519.0, 1508.0, 657.0, 409.0, 182.0, 140.0, 76.0, 66.0, 41.0, 30.0, 28.0, 13.0, 5.0, 13.0, 8.0, 2.0, 4.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-21.109375, -20.431640625, -19.75390625, -19.076171875, -18.3984375, -17.720703125, -17.04296875, -16.365234375, -15.6875, -15.009765625, -14.33203125, -13.654296875, -12.9765625, -12.298828125, -11.62109375, -10.943359375, -10.265625, -9.587890625, -8.91015625, -8.232421875, -7.5546875, -6.876953125, -6.19921875, -5.521484375, -4.84375, -4.166015625, -3.48828125, -2.810546875, -2.1328125, -1.455078125, -0.77734375, -0.099609375, 0.578125, 1.255859375, 1.93359375, 2.611328125, 3.2890625, 3.966796875, 4.64453125, 5.322265625, 6.0, 6.677734375, 7.35546875, 8.033203125, 8.7109375, 9.388671875, 10.06640625, 10.744140625, 11.421875, 12.099609375, 12.77734375, 13.455078125, 14.1328125, 14.810546875, 15.48828125, 16.166015625, 16.84375, 17.521484375, 18.19921875, 18.876953125, 19.5546875, 20.232421875, 20.91015625, 21.587890625, 22.265625]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 6.0, 3.0, 2.0, 10.0, 10.0, 2.0, 11.0, 9.0, 21.0, 31.0, 29.0, 34.0, 60.0, 55.0, 67.0, 79.0, 81.0, 89.0, 76.0, 72.0, 55.0, 36.0, 39.0, 25.0, 30.0, 26.0, 17.0, 13.0, 8.0, 6.0, 3.0, 9.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.486328125, -2.3975830078125, -2.308837890625, -2.2200927734375, -2.13134765625, -2.0426025390625, -1.953857421875, -1.8651123046875, -1.7763671875, -1.6876220703125, -1.598876953125, -1.5101318359375, -1.42138671875, -1.3326416015625, -1.243896484375, -1.1551513671875, -1.06640625, -0.9776611328125, -0.888916015625, -0.8001708984375, -0.71142578125, -0.6226806640625, -0.533935546875, -0.4451904296875, -0.3564453125, -0.2677001953125, -0.178955078125, -0.0902099609375, -0.00146484375, 0.0872802734375, 0.176025390625, 0.2647705078125, 0.353515625, 0.4422607421875, 0.531005859375, 0.6197509765625, 0.70849609375, 0.7972412109375, 0.885986328125, 0.9747314453125, 1.0634765625, 1.1522216796875, 1.240966796875, 1.3297119140625, 1.41845703125, 1.5072021484375, 1.595947265625, 1.6846923828125, 1.7734375, 1.8621826171875, 1.950927734375, 2.0396728515625, 2.12841796875, 2.2171630859375, 2.305908203125, 2.3946533203125, 2.4833984375, 2.5721435546875, 2.660888671875, 2.7496337890625, 2.83837890625, 2.9271240234375, 3.015869140625, 3.1046142578125, 3.193359375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 6.0, 1.0, 3.0, 2.0, 3.0, 6.0, 7.0, 11.0, 25.0, 55.0, 94.0, 129.0, 53.0, 49.0, 16.0, 11.0, 2.0, 6.0, 4.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.30025291442871, -19.579689025878906, -18.859127044677734, -18.138565063476562, -17.418001174926758, -16.697437286376953, -15.976875305175781, -15.256312370300293, -14.535749435424805, -13.815186500549316, -13.094623565673828, -12.37406063079834, -11.653497695922852, -10.932934761047363, -10.212371826171875, -9.491808891296387, -8.771245956420898, -8.05068302154541, -7.330120086669922, -6.609557151794434, -5.888994216918945, -5.168431282043457, -4.447868347167969, -3.7273054122924805, -3.006742477416992, -2.286179542541504, -1.5656166076660156, -0.8450536727905273, -0.12449073791503906, 0.5960721969604492, 1.3166351318359375, 2.037198066711426, 2.757762908935547, 3.478325843811035, 4.198888778686523, 4.919451713562012, 5.6400146484375, 6.360577583312988, 7.081140518188477, 7.801703453063965, 8.522266387939453, 9.242829322814941, 9.96339225769043, 10.683955192565918, 11.404518127441406, 12.125081062316895, 12.845643997192383, 13.566206932067871, 14.28676986694336, 15.007332801818848, 15.727895736694336, 16.44845962524414, 17.169021606445312, 17.889583587646484, 18.61014747619629, 19.330711364746094, 20.051273345947266, 20.771835327148438, 21.492399215698242, 22.212963104248047, 22.93352508544922, 23.65408706665039, 24.374650955200195, 25.09521484375, 25.815776824951172]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 2.0, 12.0, 11.0, 6.0, 16.0, 43.0, 71.0, 108.0, 98.0, 53.0, 25.0, 14.0, 7.0, 5.0, 1.0, 5.0, 4.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.065173149108887, -13.424150466918945, -12.783127784729004, -12.142105102539062, -11.501082420349121, -10.86005973815918, -10.219037055969238, -9.578014373779297, -8.936991691589355, -8.295969009399414, -7.654946327209473, -7.013923645019531, -6.37290096282959, -5.731878280639648, -5.090855598449707, -4.449832916259766, -3.808810234069824, -3.167787551879883, -2.5267648696899414, -1.8857421875, -1.2447195053100586, -0.6036968231201172, 0.03732585906982422, 0.6783485412597656, 1.319371223449707, 1.9603939056396484, 2.60141658782959, 3.2424392700195312, 3.8834619522094727, 4.524484634399414, 5.1655073165893555, 5.806529998779297, 6.447553634643555, 7.088576316833496, 7.7295989990234375, 8.370621681213379, 9.01164436340332, 9.652667045593262, 10.293689727783203, 10.934712409973145, 11.575735092163086, 12.216757774353027, 12.857780456542969, 13.49880313873291, 14.139825820922852, 14.780848503112793, 15.421871185302734, 16.06289291381836, 16.703916549682617, 17.344940185546875, 17.9859619140625, 18.626983642578125, 19.268007278442383, 19.90903091430664, 20.550052642822266, 21.19107437133789, 21.83209800720215, 22.473121643066406, 23.11414337158203, 23.755165100097656, 24.396188735961914, 25.037212371826172, 25.678234100341797, 26.319255828857422, 26.96027946472168]}, "eval/loss": 6.086973190307617, "eval/wer": 1.4276643450999067, "eval/runtime": 935.3935, "eval/samples_per_second": 2.824, "eval/steps_per_second": 0.354} \ No newline at end of file